drivers/gpu/drm/amd/amdgpu/amdgpu_device.c

   1 /*
   2  * Copyright 2008 Advanced Micro Devices, Inc.
   3  * Copyright 2008 Red Hat Inc.
   4  * Copyright 2009 Jerome Glisse.
   5  *
   6  * Permission is hereby granted, free of charge, to any person obtaining a
   7  * copy of this software and associated documentation files (the "Software"),
   8  * to deal in the Software without restriction, including without limitation
   9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10  * and/or sell copies of the Software, and to permit persons to whom the
  11  * Software is furnished to do so, subject to the following conditions:
  12  *
  13  * The above copyright notice and this permission notice shall be included in
  14  * all copies or substantial portions of the Software.
  15  *
  16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  19  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22  * OTHER DEALINGS IN THE SOFTWARE.
  23  *
  24  * Authors: Dave Airlie
  25  *          Alex Deucher
  26  *          Jerome Glisse
  27  */
  28 #include <linux/power_supply.h>
  29 #include <linux/kthread.h>
  30 #include <linux/module.h>
  31 #include <linux/console.h>
  32 #include <linux/slab.h>
  33 #include <linux/iommu.h>
  34 #include <linux/pci.h>
  35 #include <linux/pci-p2pdma.h>
  36 #include <linux/apple-gmux.h>
  37
  38 #include <drm/drm_aperture.h>
  39 #include <drm/drm_atomic_helper.h>
  40 #include <drm/drm_crtc_helper.h>
  41 #include <drm/drm_fb_helper.h>
  42 #include <drm/drm_probe_helper.h>
  43 #include <drm/amdgpu_drm.h>
  44 #include <linux/device.h>
  45 #include <linux/vgaarb.h>
  46 #include <linux/vga_switcheroo.h>
  47 #include <linux/efi.h>
  48 #include "amdgpu.h"
  49 #include "amdgpu_trace.h"
  50 #include "amdgpu_i2c.h"
  51 #include "atom.h"
  52 #include "amdgpu_atombios.h"
  53 #include "amdgpu_atomfirmware.h"
  54 #include "amd_pcie.h"
  55 #ifdef CONFIG_DRM_AMDGPU_SI
  56 #include "si.h"
  57 #endif
  58 #ifdef CONFIG_DRM_AMDGPU_CIK
  59 #include "cik.h"
  60 #endif
  61 #include "vi.h"
  62 #include "soc15.h"
  63 #include "nv.h"
  64 #include "bif/bif_4_1_d.h"
  65 #include <linux/firmware.h>
  66 #include "amdgpu_vf_error.h"
  67
  68 #include "amdgpu_amdkfd.h"
  69 #include "amdgpu_pm.h"
  70
  71 #include "amdgpu_xgmi.h"
  72 #include "amdgpu_ras.h"
  73 #include "amdgpu_pmu.h"
  74 #include "amdgpu_fru_eeprom.h"
  75 #include "amdgpu_reset.h"
  76 #include "amdgpu_virt.h"
  77 #include "amdgpu_dev_coredump.h"
  78
  79 #include <linux/suspend.h>
  80 #include <drm/task_barrier.h>
  81 #include <linux/pm_runtime.h>
  82
  83 #include <drm/drm_drv.h>
  84
  85 #if IS_ENABLED(CONFIG_X86)
  86 #include <asm/intel-family.h>
  87 #endif
  88
  89 MODULE_FIRMWARE("amdgpu/vega10_gpu_info.bin");
  90 MODULE_FIRMWARE("amdgpu/vega12_gpu_info.bin");
  91 MODULE_FIRMWARE("amdgpu/raven_gpu_info.bin");
  92 MODULE_FIRMWARE("amdgpu/picasso_gpu_info.bin");
  93 MODULE_FIRMWARE("amdgpu/raven2_gpu_info.bin");
  94 MODULE_FIRMWARE("amdgpu/arcturus_gpu_info.bin");
  95 MODULE_FIRMWARE("amdgpu/navi12_gpu_info.bin");
  96
  97 #define AMDGPU_RESUME_MS                2000
  98 #define AMDGPU_MAX_RETRY_LIMIT          2
  99 #define AMDGPU_RETRY_SRIOV_RESET(r) ((r) == -EBUSY || (r) == -ETIMEDOUT || (r) == -EINVAL)
 100 #define AMDGPU_PCIE_INDEX_FALLBACK (0x38 >> 2)
 101 #define AMDGPU_PCIE_INDEX_HI_FALLBACK (0x44 >> 2)
 102 #define AMDGPU_PCIE_DATA_FALLBACK (0x3C >> 2)
 103
 104 static const struct drm_driver amdgpu_kms_driver;
 105
 106 const char *amdgpu_asic_name[] = {
 107         "TAHITI",
 108         "PITCAIRN",
 109         "VERDE",
 110         "OLAND",
 111         "HAINAN",
 112         "BONAIRE",
 113         "KAVERI",
 114         "KABINI",
 115         "HAWAII",
 116         "MULLINS",
 117         "TOPAZ",
 118         "TONGA",
 119         "FIJI",
 120         "CARRIZO",
 121         "STONEY",
 122         "POLARIS10",
 123         "POLARIS11",
 124         "POLARIS12",
 125         "VEGAM",
 126         "VEGA10",
 127         "VEGA12",
 128         "VEGA20",
 129         "RAVEN",
 130         "ARCTURUS",
 131         "RENOIR",
 132         "ALDEBARAN",
 133         "NAVI10",
 134         "CYAN_SKILLFISH",
 135         "NAVI14",
 136         "NAVI12",
 137         "SIENNA_CICHLID",
 138         "NAVY_FLOUNDER",
 139         "VANGOGH",
 140         "DIMGREY_CAVEFISH",
 141         "BEIGE_GOBY",
 142         "YELLOW_CARP",
 143         "IP DISCOVERY",
 144         "LAST",
 145 };
 146
 147 static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev);
 148
 149 /**
 150  * DOC: pcie_replay_count
 151  *
 152  * The amdgpu driver provides a sysfs API for reporting the total number
 153  * of PCIe replays (NAKs)
 154  * The file pcie_replay_count is used for this and returns the total
 155  * number of replays as a sum of the NAKs generated and NAKs received
 156  */
 157
 158 static ssize_t amdgpu_device_get_pcie_replay_count(struct device *dev,
 159                 struct device_attribute *attr, char *buf)
 160 {
 161         struct drm_device *ddev = dev_get_drvdata(dev);
 162         struct amdgpu_device *adev = drm_to_adev(ddev);
 163         uint64_t cnt = amdgpu_asic_get_pcie_replay_count(adev);
 164
 165         return sysfs_emit(buf, "%llu\n", cnt);
 166 }
 167
 168 static DEVICE_ATTR(pcie_replay_count, 0444,
 169                 amdgpu_device_get_pcie_replay_count, NULL);
 170
 171 static ssize_t amdgpu_sysfs_reg_state_get(struct file *f, struct kobject *kobj,
 172                                           struct bin_attribute *attr, char *buf,
 173                                           loff_t ppos, size_t count)
 174 {
 175         struct device *dev = kobj_to_dev(kobj);
 176         struct drm_device *ddev = dev_get_drvdata(dev);
 177         struct amdgpu_device *adev = drm_to_adev(ddev);
 178         ssize_t bytes_read;
 179
 180         switch (ppos) {
 181         case AMDGPU_SYS_REG_STATE_XGMI:
 182                 bytes_read = amdgpu_asic_get_reg_state(
 183                         adev, AMDGPU_REG_STATE_TYPE_XGMI, buf, count);
 184                 break;
 185         case AMDGPU_SYS_REG_STATE_WAFL:
 186                 bytes_read = amdgpu_asic_get_reg_state(
 187                         adev, AMDGPU_REG_STATE_TYPE_WAFL, buf, count);
 188                 break;
 189         case AMDGPU_SYS_REG_STATE_PCIE:
 190                 bytes_read = amdgpu_asic_get_reg_state(
 191                         adev, AMDGPU_REG_STATE_TYPE_PCIE, buf, count);
 192                 break;
 193         case AMDGPU_SYS_REG_STATE_USR:
 194                 bytes_read = amdgpu_asic_get_reg_state(
 195                         adev, AMDGPU_REG_STATE_TYPE_USR, buf, count);
 196                 break;
 197         case AMDGPU_SYS_REG_STATE_USR_1:
 198                 bytes_read = amdgpu_asic_get_reg_state(
 199                         adev, AMDGPU_REG_STATE_TYPE_USR_1, buf, count);
 200                 break;
 201         default:
 202                 return -EINVAL;
 203         }
 204
 205         return bytes_read;
 206 }
 207
 208 BIN_ATTR(reg_state, 0444, amdgpu_sysfs_reg_state_get, NULL,
 209          AMDGPU_SYS_REG_STATE_END);
 210
 211 int amdgpu_reg_state_sysfs_init(struct amdgpu_device *adev)
 212 {
 213         int ret;
 214
 215         if (!amdgpu_asic_get_reg_state_supported(adev))
 216                 return 0;
 217
 218         ret = sysfs_create_bin_file(&adev->dev->kobj, &bin_attr_reg_state);
 219
 220         return ret;
 221 }
 222
 223 void amdgpu_reg_state_sysfs_fini(struct amdgpu_device *adev)
 224 {
 225         if (!amdgpu_asic_get_reg_state_supported(adev))
 226                 return;
 227         sysfs_remove_bin_file(&adev->dev->kobj, &bin_attr_reg_state);
 228 }
 229
 230 /**
 231  * DOC: board_info
 232  *
 233  * The amdgpu driver provides a sysfs API for giving board related information.
 234  * It provides the form factor information in the format
 235  *
 236  *   type : form factor
 237  *
 238  * Possible form factor values
 239  *
 240  * - "cem"              - PCIE CEM card
 241  * - "oam"              - Open Compute Accelerator Module
 242  * - "unknown"  - Not known
 243  *
 244  */
 245
 246 static ssize_t amdgpu_device_get_board_info(struct device *dev,
 247                                             struct device_attribute *attr,
 248                                             char *buf)
 249 {
 250         struct drm_device *ddev = dev_get_drvdata(dev);
 251         struct amdgpu_device *adev = drm_to_adev(ddev);
 252         enum amdgpu_pkg_type pkg_type = AMDGPU_PKG_TYPE_CEM;
 253         const char *pkg;
 254
 255         if (adev->smuio.funcs && adev->smuio.funcs->get_pkg_type)
 256                 pkg_type = adev->smuio.funcs->get_pkg_type(adev);
 257
 258         switch (pkg_type) {
 259         case AMDGPU_PKG_TYPE_CEM:
 260                 pkg = "cem";
 261                 break;
 262         case AMDGPU_PKG_TYPE_OAM:
 263                 pkg = "oam";
 264                 break;
 265         default:
 266                 pkg = "unknown";
 267                 break;
 268         }
 269
 270         return sysfs_emit(buf, "%s : %s\n", "type", pkg);
 271 }
 272
 273 static DEVICE_ATTR(board_info, 0444, amdgpu_device_get_board_info, NULL);
 274
 275 static struct attribute *amdgpu_board_attrs[] = {
 276         &dev_attr_board_info.attr,
 277         NULL,
 278 };
 279
 280 static umode_t amdgpu_board_attrs_is_visible(struct kobject *kobj,
 281                                              struct attribute *attr, int n)
 282 {
 283         struct device *dev = kobj_to_dev(kobj);
 284         struct drm_device *ddev = dev_get_drvdata(dev);
 285         struct amdgpu_device *adev = drm_to_adev(ddev);
 286
 287         if (adev->flags & AMD_IS_APU)
 288                 return 0;
 289
 290         return attr->mode;
 291 }
 292
 293 static const struct attribute_group amdgpu_board_attrs_group = {
 294         .attrs = amdgpu_board_attrs,
 295         .is_visible = amdgpu_board_attrs_is_visible
 296 };
 297
 298 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev);
 299
 300
 301 /**
 302  * amdgpu_device_supports_px - Is the device a dGPU with ATPX power control
 303  *
 304  * @dev: drm_device pointer
 305  *
 306  * Returns true if the device is a dGPU with ATPX power control,
 307  * otherwise return false.
 308  */
 309 bool amdgpu_device_supports_px(struct drm_device *dev)
 310 {
 311         struct amdgpu_device *adev = drm_to_adev(dev);
 312
 313         if ((adev->flags & AMD_IS_PX) && !amdgpu_is_atpx_hybrid())
 314                 return true;
 315         return false;
 316 }
 317
 318 /**
 319  * amdgpu_device_supports_boco - Is the device a dGPU with ACPI power resources
 320  *
 321  * @dev: drm_device pointer
 322  *
 323  * Returns true if the device is a dGPU with ACPI power control,
 324  * otherwise return false.
 325  */
 326 bool amdgpu_device_supports_boco(struct drm_device *dev)
 327 {
 328         struct amdgpu_device *adev = drm_to_adev(dev);
 329
 330         if (adev->has_pr3 ||
 331             ((adev->flags & AMD_IS_PX) && amdgpu_is_atpx_hybrid()))
 332                 return true;
 333         return false;
 334 }
 335
 336 /**
 337  * amdgpu_device_supports_baco - Does the device support BACO
 338  *
 339  * @dev: drm_device pointer
 340  *
 341  * Return:
 342  * 1 if the device supporte BACO;
 343  * 3 if the device support MACO (only works if BACO is supported)
 344  * otherwise return 0.
 345  */
 346 int amdgpu_device_supports_baco(struct drm_device *dev)
 347 {
 348         struct amdgpu_device *adev = drm_to_adev(dev);
 349
 350         return amdgpu_asic_supports_baco(adev);
 351 }
 352
 353 void amdgpu_device_detect_runtime_pm_mode(struct amdgpu_device *adev)
 354 {
 355         struct drm_device *dev;
 356         int bamaco_support;
 357
 358         dev = adev_to_drm(adev);
 359
 360         adev->pm.rpm_mode = AMDGPU_RUNPM_NONE;
 361         bamaco_support = amdgpu_device_supports_baco(dev);
 362
 363         switch (amdgpu_runtime_pm) {
 364         case 2:
 365                 if (bamaco_support & MACO_SUPPORT) {
 366                         adev->pm.rpm_mode = AMDGPU_RUNPM_BAMACO;
 367                         dev_info(adev->dev, "Forcing BAMACO for runtime pm\n");
 368                 } else if (bamaco_support == BACO_SUPPORT) {
 369                         adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
 370                         dev_info(adev->dev, "Requested mode BAMACO not available,fallback to use BACO\n");
 371                 }
 372                 break;
 373         case 1:
 374                 if (bamaco_support & BACO_SUPPORT) {
 375                         adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
 376                         dev_info(adev->dev, "Forcing BACO for runtime pm\n");
 377                 }
 378                 break;
 379         case -1:
 380         case -2:
 381                 if (amdgpu_device_supports_px(dev)) { /* enable PX as runtime mode */
 382                         adev->pm.rpm_mode = AMDGPU_RUNPM_PX;
 383                         dev_info(adev->dev, "Using ATPX for runtime pm\n");
 384                 } else if (amdgpu_device_supports_boco(dev)) { /* enable boco as runtime mode */
 385                         adev->pm.rpm_mode = AMDGPU_RUNPM_BOCO;
 386                         dev_info(adev->dev, "Using BOCO for runtime pm\n");
 387                 } else {
 388                         if (!bamaco_support)
 389                                 goto no_runtime_pm;
 390
 391                         switch (adev->asic_type) {
 392                         case CHIP_VEGA20:
 393                         case CHIP_ARCTURUS:
 394                                 /* BACO are not supported on vega20 and arctrus */
 395                                 break;
 396                         case CHIP_VEGA10:
 397                                 /* enable BACO as runpm mode if noretry=0 */
 398                                 if (!adev->gmc.noretry)
 399                                         adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
 400                                 break;
 401                         default:
 402                                 /* enable BACO as runpm mode on CI+ */
 403                                 adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
 404                                 break;
 405                         }
 406
 407                         if (adev->pm.rpm_mode == AMDGPU_RUNPM_BACO) {
 408                                 if (bamaco_support & MACO_SUPPORT) {
 409                                         adev->pm.rpm_mode = AMDGPU_RUNPM_BAMACO;
 410                                         dev_info(adev->dev, "Using BAMACO for runtime pm\n");
 411                                 } else {
 412                                         dev_info(adev->dev, "Using BACO for runtime pm\n");
 413                                 }
 414                         }
 415                 }
 416                 break;
 417         case 0:
 418                 dev_info(adev->dev, "runtime pm is manually disabled\n");
 419                 break;
 420         default:
 421                 break;
 422         }
 423
 424 no_runtime_pm:
 425         if (adev->pm.rpm_mode == AMDGPU_RUNPM_NONE)
 426                 dev_info(adev->dev, "Runtime PM not available\n");
 427 }
 428 /**
 429  * amdgpu_device_supports_smart_shift - Is the device dGPU with
 430  * smart shift support
 431  *
 432  * @dev: drm_device pointer
 433  *
 434  * Returns true if the device is a dGPU with Smart Shift support,
 435  * otherwise returns false.
 436  */
 437 bool amdgpu_device_supports_smart_shift(struct drm_device *dev)
 438 {
 439         return (amdgpu_device_supports_boco(dev) &&
 440                 amdgpu_acpi_is_power_shift_control_supported());
 441 }
 442
 443 /*
 444  * VRAM access helper functions
 445  */
 446
 447 /**
 448  * amdgpu_device_mm_access - access vram by MM_INDEX/MM_DATA
 449  *
 450  * @adev: amdgpu_device pointer
 451  * @pos: offset of the buffer in vram
 452  * @buf: virtual address of the buffer in system memory
 453  * @size: read/write size, sizeof(@buf) must > @size
 454  * @write: true - write to vram, otherwise - read from vram
 455  */
 456 void amdgpu_device_mm_access(struct amdgpu_device *adev, loff_t pos,
 457                              void *buf, size_t size, bool write)
 458 {
 459         unsigned long flags;
 460         uint32_t hi = ~0, tmp = 0;
 461         uint32_t *data = buf;
 462         uint64_t last;
 463         int idx;
 464
 465         if (!drm_dev_enter(adev_to_drm(adev), &idx))
 466                 return;
 467
 468         BUG_ON(!IS_ALIGNED(pos, 4) || !IS_ALIGNED(size, 4));
 469
 470         spin_lock_irqsave(&adev->mmio_idx_lock, flags);
 471         for (last = pos + size; pos < last; pos += 4) {
 472                 tmp = pos >> 31;
 473
 474                 WREG32_NO_KIQ(mmMM_INDEX, ((uint32_t)pos) | 0x80000000);
 475                 if (tmp != hi) {
 476                         WREG32_NO_KIQ(mmMM_INDEX_HI, tmp);
 477                         hi = tmp;
 478                 }
 479                 if (write)
 480                         WREG32_NO_KIQ(mmMM_DATA, *data++);
 481                 else
 482                         *data++ = RREG32_NO_KIQ(mmMM_DATA);
 483         }
 484
 485         spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
 486         drm_dev_exit(idx);
 487 }
 488
 489 /**
 490  * amdgpu_device_aper_access - access vram by vram aperature
 491  *
 492  * @adev: amdgpu_device pointer
 493  * @pos: offset of the buffer in vram
 494  * @buf: virtual address of the buffer in system memory
 495  * @size: read/write size, sizeof(@buf) must > @size
 496  * @write: true - write to vram, otherwise - read from vram
 497  *
 498  * The return value means how many bytes have been transferred.
 499  */
 500 size_t amdgpu_device_aper_access(struct amdgpu_device *adev, loff_t pos,
 501                                  void *buf, size_t size, bool write)
 502 {
 503 #ifdef CONFIG_64BIT
 504         void __iomem *addr;
 505         size_t count = 0;
 506         uint64_t last;
 507
 508         if (!adev->mman.aper_base_kaddr)
 509                 return 0;
 510
 511         last = min(pos + size, adev->gmc.visible_vram_size);
 512         if (last > pos) {
 513                 addr = adev->mman.aper_base_kaddr + pos;
 514                 count = last - pos;
 515
 516                 if (write) {
 517                         memcpy_toio(addr, buf, count);
 518                         /* Make sure HDP write cache flush happens without any reordering
 519                          * after the system memory contents are sent over PCIe device
 520                          */
 521                         mb();
 522                         amdgpu_device_flush_hdp(adev, NULL);
 523                 } else {
 524                         amdgpu_device_invalidate_hdp(adev, NULL);
 525                         /* Make sure HDP read cache is invalidated before issuing a read
 526                          * to the PCIe device
 527                          */
 528                         mb();
 529                         memcpy_fromio(buf, addr, count);
 530                 }
 531
 532         }
 533
 534         return count;
 535 #else
 536         return 0;
 537 #endif
 538 }
 539
 540 /**
 541  * amdgpu_device_vram_access - read/write a buffer in vram
 542  *
 543  * @adev: amdgpu_device pointer
 544  * @pos: offset of the buffer in vram
 545  * @buf: virtual address of the buffer in system memory
 546  * @size: read/write size, sizeof(@buf) must > @size
 547  * @write: true - write to vram, otherwise - read from vram
 548  */
 549 void amdgpu_device_vram_access(struct amdgpu_device *adev, loff_t pos,
 550                                void *buf, size_t size, bool write)
 551 {
 552         size_t count;
 553
 554         /* try to using vram apreature to access vram first */
 555         count = amdgpu_device_aper_access(adev, pos, buf, size, write);
 556         size -= count;
 557         if (size) {
 558                 /* using MM to access rest vram */
 559                 pos += count;
 560                 buf += count;
 561                 amdgpu_device_mm_access(adev, pos, buf, size, write);
 562         }
 563 }
 564
 565 /*
 566  * register access helper functions.
 567  */
 568
 569 /* Check if hw access should be skipped because of hotplug or device error */
 570 bool amdgpu_device_skip_hw_access(struct amdgpu_device *adev)
 571 {
 572         if (adev->no_hw_access)
 573                 return true;
 574
 575 #ifdef CONFIG_LOCKDEP
 576         /*
 577          * This is a bit complicated to understand, so worth a comment. What we assert
 578          * here is that the GPU reset is not running on another thread in parallel.
 579          *
 580          * For this we trylock the read side of the reset semaphore, if that succeeds
 581          * we know that the reset is not running in paralell.
 582          *
 583          * If the trylock fails we assert that we are either already holding the read
 584          * side of the lock or are the reset thread itself and hold the write side of
 585          * the lock.
 586          */
 587         if (in_task()) {
 588                 if (down_read_trylock(&adev->reset_domain->sem))
 589                         up_read(&adev->reset_domain->sem);
 590                 else
 591                         lockdep_assert_held(&adev->reset_domain->sem);
 592         }
 593 #endif
 594         return false;
 595 }
 596
 597 /**
 598  * amdgpu_device_rreg - read a memory mapped IO or indirect register
 599  *
 600  * @adev: amdgpu_device pointer
 601  * @reg: dword aligned register offset
 602  * @acc_flags: access flags which require special behavior
 603  *
 604  * Returns the 32 bit value from the offset specified.
 605  */
 606 uint32_t amdgpu_device_rreg(struct amdgpu_device *adev,
 607                             uint32_t reg, uint32_t acc_flags)
 608 {
 609         uint32_t ret;
 610
 611         if (amdgpu_device_skip_hw_access(adev))
 612                 return 0;
 613
 614         if ((reg * 4) < adev->rmmio_size) {
 615                 if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
 616                     amdgpu_sriov_runtime(adev) &&
 617                     down_read_trylock(&adev->reset_domain->sem)) {
 618                         ret = amdgpu_kiq_rreg(adev, reg, 0);
 619                         up_read(&adev->reset_domain->sem);
 620                 } else {
 621                         ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
 622                 }
 623         } else {
 624                 ret = adev->pcie_rreg(adev, reg * 4);
 625         }
 626
 627         trace_amdgpu_device_rreg(adev->pdev->device, reg, ret);
 628
 629         return ret;
 630 }
 631
 632 /*
 633  * MMIO register read with bytes helper functions
 634  * @offset:bytes offset from MMIO start
 635  */
 636
 637 /**
 638  * amdgpu_mm_rreg8 - read a memory mapped IO register
 639  *
 640  * @adev: amdgpu_device pointer
 641  * @offset: byte aligned register offset
 642  *
 643  * Returns the 8 bit value from the offset specified.
 644  */
 645 uint8_t amdgpu_mm_rreg8(struct amdgpu_device *adev, uint32_t offset)
 646 {
 647         if (amdgpu_device_skip_hw_access(adev))
 648                 return 0;
 649
 650         if (offset < adev->rmmio_size)
 651                 return (readb(adev->rmmio + offset));
 652         BUG();
 653 }
 654
 655
 656 /**
 657  * amdgpu_device_xcc_rreg - read a memory mapped IO or indirect register with specific XCC
 658  *
 659  * @adev: amdgpu_device pointer
 660  * @reg: dword aligned register offset
 661  * @acc_flags: access flags which require special behavior
 662  * @xcc_id: xcc accelerated compute core id
 663  *
 664  * Returns the 32 bit value from the offset specified.
 665  */
 666 uint32_t amdgpu_device_xcc_rreg(struct amdgpu_device *adev,
 667                                 uint32_t reg, uint32_t acc_flags,
 668                                 uint32_t xcc_id)
 669 {
 670         uint32_t ret, rlcg_flag;
 671
 672         if (amdgpu_device_skip_hw_access(adev))
 673                 return 0;
 674
 675         if ((reg * 4) < adev->rmmio_size) {
 676                 if (amdgpu_sriov_vf(adev) &&
 677                     !amdgpu_sriov_runtime(adev) &&
 678                     adev->gfx.rlc.rlcg_reg_access_supported &&
 679                     amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags,
 680                                                          GC_HWIP, false,
 681                                                          &rlcg_flag)) {
 682                         ret = amdgpu_virt_rlcg_reg_rw(adev, reg, 0, rlcg_flag, GET_INST(GC, xcc_id));
 683                 } else if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
 684                     amdgpu_sriov_runtime(adev) &&
 685                     down_read_trylock(&adev->reset_domain->sem)) {
 686                         ret = amdgpu_kiq_rreg(adev, reg, xcc_id);
 687                         up_read(&adev->reset_domain->sem);
 688                 } else {
 689                         ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
 690                 }
 691         } else {
 692                 ret = adev->pcie_rreg(adev, reg * 4);
 693         }
 694
 695         return ret;
 696 }
 697
 698 /*
 699  * MMIO register write with bytes helper functions
 700  * @offset:bytes offset from MMIO start
 701  * @value: the value want to be written to the register
 702  */
 703
 704 /**
 705  * amdgpu_mm_wreg8 - read a memory mapped IO register
 706  *
 707  * @adev: amdgpu_device pointer
 708  * @offset: byte aligned register offset
 709  * @value: 8 bit value to write
 710  *
 711  * Writes the value specified to the offset specified.
 712  */
 713 void amdgpu_mm_wreg8(struct amdgpu_device *adev, uint32_t offset, uint8_t value)
 714 {
 715         if (amdgpu_device_skip_hw_access(adev))
 716                 return;
 717
 718         if (offset < adev->rmmio_size)
 719                 writeb(value, adev->rmmio + offset);
 720         else
 721                 BUG();
 722 }
 723
 724 /**
 725  * amdgpu_device_wreg - write to a memory mapped IO or indirect register
 726  *
 727  * @adev: amdgpu_device pointer
 728  * @reg: dword aligned register offset
 729  * @v: 32 bit value to write to the register
 730  * @acc_flags: access flags which require special behavior
 731  *
 732  * Writes the value specified to the offset specified.
 733  */
 734 void amdgpu_device_wreg(struct amdgpu_device *adev,
 735                         uint32_t reg, uint32_t v,
 736                         uint32_t acc_flags)
 737 {
 738         if (amdgpu_device_skip_hw_access(adev))
 739                 return;
 740
 741         if ((reg * 4) < adev->rmmio_size) {
 742                 if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
 743                     amdgpu_sriov_runtime(adev) &&
 744                     down_read_trylock(&adev->reset_domain->sem)) {
 745                         amdgpu_kiq_wreg(adev, reg, v, 0);
 746                         up_read(&adev->reset_domain->sem);
 747                 } else {
 748                         writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
 749                 }
 750         } else {
 751                 adev->pcie_wreg(adev, reg * 4, v);
 752         }
 753
 754         trace_amdgpu_device_wreg(adev->pdev->device, reg, v);
 755 }
 756
 757 /**
 758  * amdgpu_mm_wreg_mmio_rlc -  write register either with direct/indirect mmio or with RLC path if in range
 759  *
 760  * @adev: amdgpu_device pointer
 761  * @reg: mmio/rlc register
 762  * @v: value to write
 763  * @xcc_id: xcc accelerated compute core id
 764  *
 765  * this function is invoked only for the debugfs register access
 766  */
 767 void amdgpu_mm_wreg_mmio_rlc(struct amdgpu_device *adev,
 768                              uint32_t reg, uint32_t v,
 769                              uint32_t xcc_id)
 770 {
 771         if (amdgpu_device_skip_hw_access(adev))
 772                 return;
 773
 774         if (amdgpu_sriov_fullaccess(adev) &&
 775             adev->gfx.rlc.funcs &&
 776             adev->gfx.rlc.funcs->is_rlcg_access_range) {
 777                 if (adev->gfx.rlc.funcs->is_rlcg_access_range(adev, reg))
 778                         return amdgpu_sriov_wreg(adev, reg, v, 0, 0, xcc_id);
 779         } else if ((reg * 4) >= adev->rmmio_size) {
 780                 adev->pcie_wreg(adev, reg * 4, v);
 781         } else {
 782                 writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
 783         }
 784 }
 785
 786 /**
 787  * amdgpu_device_xcc_wreg - write to a memory mapped IO or indirect register with specific XCC
 788  *
 789  * @adev: amdgpu_device pointer
 790  * @reg: dword aligned register offset
 791  * @v: 32 bit value to write to the register
 792  * @acc_flags: access flags which require special behavior
 793  * @xcc_id: xcc accelerated compute core id
 794  *
 795  * Writes the value specified to the offset specified.
 796  */
 797 void amdgpu_device_xcc_wreg(struct amdgpu_device *adev,
 798                         uint32_t reg, uint32_t v,
 799                         uint32_t acc_flags, uint32_t xcc_id)
 800 {
 801         uint32_t rlcg_flag;
 802
 803         if (amdgpu_device_skip_hw_access(adev))
 804                 return;
 805
 806         if ((reg * 4) < adev->rmmio_size) {
 807                 if (amdgpu_sriov_vf(adev) &&
 808                     !amdgpu_sriov_runtime(adev) &&
 809                     adev->gfx.rlc.rlcg_reg_access_supported &&
 810                     amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags,
 811                                                          GC_HWIP, true,
 812                                                          &rlcg_flag)) {
 813                         amdgpu_virt_rlcg_reg_rw(adev, reg, v, rlcg_flag, GET_INST(GC, xcc_id));
 814                 } else if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
 815                     amdgpu_sriov_runtime(adev) &&
 816                     down_read_trylock(&adev->reset_domain->sem)) {
 817                         amdgpu_kiq_wreg(adev, reg, v, xcc_id);
 818                         up_read(&adev->reset_domain->sem);
 819                 } else {
 820                         writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
 821                 }
 822         } else {
 823                 adev->pcie_wreg(adev, reg * 4, v);
 824         }
 825 }
 826
 827 /**
 828  * amdgpu_device_indirect_rreg - read an indirect register
 829  *
 830  * @adev: amdgpu_device pointer
 831  * @reg_addr: indirect register address to read from
 832  *
 833  * Returns the value of indirect register @reg_addr
 834  */
 835 u32 amdgpu_device_indirect_rreg(struct amdgpu_device *adev,
 836                                 u32 reg_addr)
 837 {
 838         unsigned long flags, pcie_index, pcie_data;
 839         void __iomem *pcie_index_offset;
 840         void __iomem *pcie_data_offset;
 841         u32 r;
 842
 843         pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
 844         pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
 845
 846         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 847         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 848         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 849
 850         writel(reg_addr, pcie_index_offset);
 851         readl(pcie_index_offset);
 852         r = readl(pcie_data_offset);
 853         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 854
 855         return r;
 856 }
 857
 858 u32 amdgpu_device_indirect_rreg_ext(struct amdgpu_device *adev,
 859                                     u64 reg_addr)
 860 {
 861         unsigned long flags, pcie_index, pcie_index_hi, pcie_data;
 862         u32 r;
 863         void __iomem *pcie_index_offset;
 864         void __iomem *pcie_index_hi_offset;
 865         void __iomem *pcie_data_offset;
 866
 867         if (unlikely(!adev->nbio.funcs)) {
 868                 pcie_index = AMDGPU_PCIE_INDEX_FALLBACK;
 869                 pcie_data = AMDGPU_PCIE_DATA_FALLBACK;
 870         } else {
 871                 pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
 872                 pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
 873         }
 874
 875         if (reg_addr >> 32) {
 876                 if (unlikely(!adev->nbio.funcs))
 877                         pcie_index_hi = AMDGPU_PCIE_INDEX_HI_FALLBACK;
 878                 else
 879                         pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
 880         } else {
 881                 pcie_index_hi = 0;
 882         }
 883
 884         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 885         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 886         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 887         if (pcie_index_hi != 0)
 888                 pcie_index_hi_offset = (void __iomem *)adev->rmmio +
 889                                 pcie_index_hi * 4;
 890
 891         writel(reg_addr, pcie_index_offset);
 892         readl(pcie_index_offset);
 893         if (pcie_index_hi != 0) {
 894                 writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
 895                 readl(pcie_index_hi_offset);
 896         }
 897         r = readl(pcie_data_offset);
 898
 899         /* clear the high bits */
 900         if (pcie_index_hi != 0) {
 901                 writel(0, pcie_index_hi_offset);
 902                 readl(pcie_index_hi_offset);
 903         }
 904
 905         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 906
 907         return r;
 908 }
 909
 910 /**
 911  * amdgpu_device_indirect_rreg64 - read a 64bits indirect register
 912  *
 913  * @adev: amdgpu_device pointer
 914  * @reg_addr: indirect register address to read from
 915  *
 916  * Returns the value of indirect register @reg_addr
 917  */
 918 u64 amdgpu_device_indirect_rreg64(struct amdgpu_device *adev,
 919                                   u32 reg_addr)
 920 {
 921         unsigned long flags, pcie_index, pcie_data;
 922         void __iomem *pcie_index_offset;
 923         void __iomem *pcie_data_offset;
 924         u64 r;
 925
 926         pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
 927         pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
 928
 929         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 930         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 931         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 932
 933         /* read low 32 bits */
 934         writel(reg_addr, pcie_index_offset);
 935         readl(pcie_index_offset);
 936         r = readl(pcie_data_offset);
 937         /* read high 32 bits */
 938         writel(reg_addr + 4, pcie_index_offset);
 939         readl(pcie_index_offset);
 940         r |= ((u64)readl(pcie_data_offset) << 32);
 941         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 942
 943         return r;
 944 }
 945
 946 u64 amdgpu_device_indirect_rreg64_ext(struct amdgpu_device *adev,
 947                                   u64 reg_addr)
 948 {
 949         unsigned long flags, pcie_index, pcie_data;
 950         unsigned long pcie_index_hi = 0;
 951         void __iomem *pcie_index_offset;
 952         void __iomem *pcie_index_hi_offset;
 953         void __iomem *pcie_data_offset;
 954         u64 r;
 955
 956         pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
 957         pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
 958         if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
 959                 pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
 960
 961         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
 962         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
 963         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
 964         if (pcie_index_hi != 0)
 965                 pcie_index_hi_offset = (void __iomem *)adev->rmmio +
 966                         pcie_index_hi * 4;
 967
 968         /* read low 32 bits */
 969         writel(reg_addr, pcie_index_offset);
 970         readl(pcie_index_offset);
 971         if (pcie_index_hi != 0) {
 972                 writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
 973                 readl(pcie_index_hi_offset);
 974         }
 975         r = readl(pcie_data_offset);
 976         /* read high 32 bits */
 977         writel(reg_addr + 4, pcie_index_offset);
 978         readl(pcie_index_offset);
 979         if (pcie_index_hi != 0) {
 980                 writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
 981                 readl(pcie_index_hi_offset);
 982         }
 983         r |= ((u64)readl(pcie_data_offset) << 32);
 984
 985         /* clear the high bits */
 986         if (pcie_index_hi != 0) {
 987                 writel(0, pcie_index_hi_offset);
 988                 readl(pcie_index_hi_offset);
 989         }
 990
 991         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
 992
 993         return r;
 994 }
 995
 996 /**
 997  * amdgpu_device_indirect_wreg - write an indirect register address
 998  *
 999  * @adev: amdgpu_device pointer
1000  * @reg_addr: indirect register offset
1001  * @reg_data: indirect register data
1002  *
1003  */
1004 void amdgpu_device_indirect_wreg(struct amdgpu_device *adev,
1005                                  u32 reg_addr, u32 reg_data)
1006 {
1007         unsigned long flags, pcie_index, pcie_data;
1008         void __iomem *pcie_index_offset;
1009         void __iomem *pcie_data_offset;
1010
1011         pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
1012         pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
1013
1014         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
1015         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
1016         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
1017
1018         writel(reg_addr, pcie_index_offset);
1019         readl(pcie_index_offset);
1020         writel(reg_data, pcie_data_offset);
1021         readl(pcie_data_offset);
1022         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
1023 }
1024
1025 void amdgpu_device_indirect_wreg_ext(struct amdgpu_device *adev,
1026                                      u64 reg_addr, u32 reg_data)
1027 {
1028         unsigned long flags, pcie_index, pcie_index_hi, pcie_data;
1029         void __iomem *pcie_index_offset;
1030         void __iomem *pcie_index_hi_offset;
1031         void __iomem *pcie_data_offset;
1032
1033         pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
1034         pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
1035         if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
1036                 pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
1037         else
1038                 pcie_index_hi = 0;
1039
1040         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
1041         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
1042         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
1043         if (pcie_index_hi != 0)
1044                 pcie_index_hi_offset = (void __iomem *)adev->rmmio +
1045                                 pcie_index_hi * 4;
1046
1047         writel(reg_addr, pcie_index_offset);
1048         readl(pcie_index_offset);
1049         if (pcie_index_hi != 0) {
1050                 writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
1051                 readl(pcie_index_hi_offset);
1052         }
1053         writel(reg_data, pcie_data_offset);
1054         readl(pcie_data_offset);
1055
1056         /* clear the high bits */
1057         if (pcie_index_hi != 0) {
1058                 writel(0, pcie_index_hi_offset);
1059                 readl(pcie_index_hi_offset);
1060         }
1061
1062         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
1063 }
1064
1065 /**
1066  * amdgpu_device_indirect_wreg64 - write a 64bits indirect register address
1067  *
1068  * @adev: amdgpu_device pointer
1069  * @reg_addr: indirect register offset
1070  * @reg_data: indirect register data
1071  *
1072  */
1073 void amdgpu_device_indirect_wreg64(struct amdgpu_device *adev,
1074                                    u32 reg_addr, u64 reg_data)
1075 {
1076         unsigned long flags, pcie_index, pcie_data;
1077         void __iomem *pcie_index_offset;
1078         void __iomem *pcie_data_offset;
1079
1080         pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
1081         pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
1082
1083         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
1084         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
1085         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
1086
1087         /* write low 32 bits */
1088         writel(reg_addr, pcie_index_offset);
1089         readl(pcie_index_offset);
1090         writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
1091         readl(pcie_data_offset);
1092         /* write high 32 bits */
1093         writel(reg_addr + 4, pcie_index_offset);
1094         readl(pcie_index_offset);
1095         writel((u32)(reg_data >> 32), pcie_data_offset);
1096         readl(pcie_data_offset);
1097         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
1098 }
1099
1100 void amdgpu_device_indirect_wreg64_ext(struct amdgpu_device *adev,
1101                                    u64 reg_addr, u64 reg_data)
1102 {
1103         unsigned long flags, pcie_index, pcie_data;
1104         unsigned long pcie_index_hi = 0;
1105         void __iomem *pcie_index_offset;
1106         void __iomem *pcie_index_hi_offset;
1107         void __iomem *pcie_data_offset;
1108
1109         pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
1110         pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
1111         if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
1112                 pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
1113
1114         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
1115         pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
1116         pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
1117         if (pcie_index_hi != 0)
1118                 pcie_index_hi_offset = (void __iomem *)adev->rmmio +
1119                                 pcie_index_hi * 4;
1120
1121         /* write low 32 bits */
1122         writel(reg_addr, pcie_index_offset);
1123         readl(pcie_index_offset);
1124         if (pcie_index_hi != 0) {
1125                 writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
1126                 readl(pcie_index_hi_offset);
1127         }
1128         writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
1129         readl(pcie_data_offset);
1130         /* write high 32 bits */
1131         writel(reg_addr + 4, pcie_index_offset);
1132         readl(pcie_index_offset);
1133         if (pcie_index_hi != 0) {
1134                 writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
1135                 readl(pcie_index_hi_offset);
1136         }
1137         writel((u32)(reg_data >> 32), pcie_data_offset);
1138         readl(pcie_data_offset);
1139
1140         /* clear the high bits */
1141         if (pcie_index_hi != 0) {
1142                 writel(0, pcie_index_hi_offset);
1143                 readl(pcie_index_hi_offset);
1144         }
1145
1146         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
1147 }
1148
1149 /**
1150  * amdgpu_device_get_rev_id - query device rev_id
1151  *
1152  * @adev: amdgpu_device pointer
1153  *
1154  * Return device rev_id
1155  */
1156 u32 amdgpu_device_get_rev_id(struct amdgpu_device *adev)
1157 {
1158         return adev->nbio.funcs->get_rev_id(adev);
1159 }
1160
1161 /**
1162  * amdgpu_invalid_rreg - dummy reg read function
1163  *
1164  * @adev: amdgpu_device pointer
1165  * @reg: offset of register
1166  *
1167  * Dummy register read function.  Used for register blocks
1168  * that certain asics don't have (all asics).
1169  * Returns the value in the register.
1170  */
1171 static uint32_t amdgpu_invalid_rreg(struct amdgpu_device *adev, uint32_t reg)
1172 {
1173         DRM_ERROR("Invalid callback to read register 0x%04X\n", reg);
1174         BUG();
1175         return 0;
1176 }
1177
1178 static uint32_t amdgpu_invalid_rreg_ext(struct amdgpu_device *adev, uint64_t reg)
1179 {
1180         DRM_ERROR("Invalid callback to read register 0x%llX\n", reg);
1181         BUG();
1182         return 0;
1183 }
1184
1185 /**
1186  * amdgpu_invalid_wreg - dummy reg write function
1187  *
1188  * @adev: amdgpu_device pointer
1189  * @reg: offset of register
1190  * @v: value to write to the register
1191  *
1192  * Dummy register read function.  Used for register blocks
1193  * that certain asics don't have (all asics).
1194  */
1195 static void amdgpu_invalid_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
1196 {
1197         DRM_ERROR("Invalid callback to write register 0x%04X with 0x%08X\n",
1198                   reg, v);
1199         BUG();
1200 }
1201
1202 static void amdgpu_invalid_wreg_ext(struct amdgpu_device *adev, uint64_t reg, uint32_t v)
1203 {
1204         DRM_ERROR("Invalid callback to write register 0x%llX with 0x%08X\n",
1205                   reg, v);
1206         BUG();
1207 }
1208
1209 /**
1210  * amdgpu_invalid_rreg64 - dummy 64 bit reg read function
1211  *
1212  * @adev: amdgpu_device pointer
1213  * @reg: offset of register
1214  *
1215  * Dummy register read function.  Used for register blocks
1216  * that certain asics don't have (all asics).
1217  * Returns the value in the register.
1218  */
1219 static uint64_t amdgpu_invalid_rreg64(struct amdgpu_device *adev, uint32_t reg)
1220 {
1221         DRM_ERROR("Invalid callback to read 64 bit register 0x%04X\n", reg);
1222         BUG();
1223         return 0;
1224 }
1225
1226 static uint64_t amdgpu_invalid_rreg64_ext(struct amdgpu_device *adev, uint64_t reg)
1227 {
1228         DRM_ERROR("Invalid callback to read register 0x%llX\n", reg);
1229         BUG();
1230         return 0;
1231 }
1232
1233 /**
1234  * amdgpu_invalid_wreg64 - dummy reg write function
1235  *
1236  * @adev: amdgpu_device pointer
1237  * @reg: offset of register
1238  * @v: value to write to the register
1239  *
1240  * Dummy register read function.  Used for register blocks
1241  * that certain asics don't have (all asics).
1242  */
1243 static void amdgpu_invalid_wreg64(struct amdgpu_device *adev, uint32_t reg, uint64_t v)
1244 {
1245         DRM_ERROR("Invalid callback to write 64 bit register 0x%04X with 0x%08llX\n",
1246                   reg, v);
1247         BUG();
1248 }
1249
1250 static void amdgpu_invalid_wreg64_ext(struct amdgpu_device *adev, uint64_t reg, uint64_t v)
1251 {
1252         DRM_ERROR("Invalid callback to write 64 bit register 0x%llX with 0x%08llX\n",
1253                   reg, v);
1254         BUG();
1255 }
1256
1257 /**
1258  * amdgpu_block_invalid_rreg - dummy reg read function
1259  *
1260  * @adev: amdgpu_device pointer
1261  * @block: offset of instance
1262  * @reg: offset of register
1263  *
1264  * Dummy register read function.  Used for register blocks
1265  * that certain asics don't have (all asics).
1266  * Returns the value in the register.
1267  */
1268 static uint32_t amdgpu_block_invalid_rreg(struct amdgpu_device *adev,
1269                                           uint32_t block, uint32_t reg)
1270 {
1271         DRM_ERROR("Invalid callback to read register 0x%04X in block 0x%04X\n",
1272                   reg, block);
1273         BUG();
1274         return 0;
1275 }
1276
1277 /**
1278  * amdgpu_block_invalid_wreg - dummy reg write function
1279  *
1280  * @adev: amdgpu_device pointer
1281  * @block: offset of instance
1282  * @reg: offset of register
1283  * @v: value to write to the register
1284  *
1285  * Dummy register read function.  Used for register blocks
1286  * that certain asics don't have (all asics).
1287  */
1288 static void amdgpu_block_invalid_wreg(struct amdgpu_device *adev,
1289                                       uint32_t block,
1290                                       uint32_t reg, uint32_t v)
1291 {
1292         DRM_ERROR("Invalid block callback to write register 0x%04X in block 0x%04X with 0x%08X\n",
1293                   reg, block, v);
1294         BUG();
1295 }
1296
1297 /**
1298  * amdgpu_device_asic_init - Wrapper for atom asic_init
1299  *
1300  * @adev: amdgpu_device pointer
1301  *
1302  * Does any asic specific work and then calls atom asic init.
1303  */
1304 static int amdgpu_device_asic_init(struct amdgpu_device *adev)
1305 {
1306         int ret;
1307
1308         amdgpu_asic_pre_asic_init(adev);
1309
1310         if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
1311             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4) ||
1312             amdgpu_ip_version(adev, GC_HWIP, 0) >= IP_VERSION(11, 0, 0)) {
1313                 amdgpu_psp_wait_for_bootloader(adev);
1314                 ret = amdgpu_atomfirmware_asic_init(adev, true);
1315                 return ret;
1316         } else {
1317                 return amdgpu_atom_asic_init(adev->mode_info.atom_context);
1318         }
1319
1320         return 0;
1321 }
1322
1323 /**
1324  * amdgpu_device_mem_scratch_init - allocate the VRAM scratch page
1325  *
1326  * @adev: amdgpu_device pointer
1327  *
1328  * Allocates a scratch page of VRAM for use by various things in the
1329  * driver.
1330  */
1331 static int amdgpu_device_mem_scratch_init(struct amdgpu_device *adev)
1332 {
1333         return amdgpu_bo_create_kernel(adev, AMDGPU_GPU_PAGE_SIZE, PAGE_SIZE,
1334                                        AMDGPU_GEM_DOMAIN_VRAM |
1335                                        AMDGPU_GEM_DOMAIN_GTT,
1336                                        &adev->mem_scratch.robj,
1337                                        &adev->mem_scratch.gpu_addr,
1338                                        (void **)&adev->mem_scratch.ptr);
1339 }
1340
1341 /**
1342  * amdgpu_device_mem_scratch_fini - Free the VRAM scratch page
1343  *
1344  * @adev: amdgpu_device pointer
1345  *
1346  * Frees the VRAM scratch page.
1347  */
1348 static void amdgpu_device_mem_scratch_fini(struct amdgpu_device *adev)
1349 {
1350         amdgpu_bo_free_kernel(&adev->mem_scratch.robj, NULL, NULL);
1351 }
1352
1353 /**
1354  * amdgpu_device_program_register_sequence - program an array of registers.
1355  *
1356  * @adev: amdgpu_device pointer
1357  * @registers: pointer to the register array
1358  * @array_size: size of the register array
1359  *
1360  * Programs an array or registers with and or masks.
1361  * This is a helper for setting golden registers.
1362  */
1363 void amdgpu_device_program_register_sequence(struct amdgpu_device *adev,
1364                                              const u32 *registers,
1365                                              const u32 array_size)
1366 {
1367         u32 tmp, reg, and_mask, or_mask;
1368         int i;
1369
1370         if (array_size % 3)
1371                 return;
1372
1373         for (i = 0; i < array_size; i += 3) {
1374                 reg = registers[i + 0];
1375                 and_mask = registers[i + 1];
1376                 or_mask = registers[i + 2];
1377
1378                 if (and_mask == 0xffffffff) {
1379                         tmp = or_mask;
1380                 } else {
1381                         tmp = RREG32(reg);
1382                         tmp &= ~and_mask;
1383                         if (adev->family >= AMDGPU_FAMILY_AI)
1384                                 tmp |= (or_mask & and_mask);
1385                         else
1386                                 tmp |= or_mask;
1387                 }
1388                 WREG32(reg, tmp);
1389         }
1390 }
1391
1392 /**
1393  * amdgpu_device_pci_config_reset - reset the GPU
1394  *
1395  * @adev: amdgpu_device pointer
1396  *
1397  * Resets the GPU using the pci config reset sequence.
1398  * Only applicable to asics prior to vega10.
1399  */
1400 void amdgpu_device_pci_config_reset(struct amdgpu_device *adev)
1401 {
1402         pci_write_config_dword(adev->pdev, 0x7c, AMDGPU_ASIC_RESET_DATA);
1403 }
1404
1405 /**
1406  * amdgpu_device_pci_reset - reset the GPU using generic PCI means
1407  *
1408  * @adev: amdgpu_device pointer
1409  *
1410  * Resets the GPU using generic pci reset interfaces (FLR, SBR, etc.).
1411  */
1412 int amdgpu_device_pci_reset(struct amdgpu_device *adev)
1413 {
1414         return pci_reset_function(adev->pdev);
1415 }
1416
1417 /*
1418  * amdgpu_device_wb_*()
1419  * Writeback is the method by which the GPU updates special pages in memory
1420  * with the status of certain GPU events (fences, ring pointers,etc.).
1421  */
1422
1423 /**
1424  * amdgpu_device_wb_fini - Disable Writeback and free memory
1425  *
1426  * @adev: amdgpu_device pointer
1427  *
1428  * Disables Writeback and frees the Writeback memory (all asics).
1429  * Used at driver shutdown.
1430  */
1431 static void amdgpu_device_wb_fini(struct amdgpu_device *adev)
1432 {
1433         if (adev->wb.wb_obj) {
1434                 amdgpu_bo_free_kernel(&adev->wb.wb_obj,
1435                                       &adev->wb.gpu_addr,
1436                                       (void **)&adev->wb.wb);
1437                 adev->wb.wb_obj = NULL;
1438         }
1439 }
1440
1441 /**
1442  * amdgpu_device_wb_init - Init Writeback driver info and allocate memory
1443  *
1444  * @adev: amdgpu_device pointer
1445  *
1446  * Initializes writeback and allocates writeback memory (all asics).
1447  * Used at driver startup.
1448  * Returns 0 on success or an -error on failure.
1449  */
1450 static int amdgpu_device_wb_init(struct amdgpu_device *adev)
1451 {
1452         int r;
1453
1454         if (adev->wb.wb_obj == NULL) {
1455                 /* AMDGPU_MAX_WB * sizeof(uint32_t) * 8 = AMDGPU_MAX_WB 256bit slots */
1456                 r = amdgpu_bo_create_kernel(adev, AMDGPU_MAX_WB * sizeof(uint32_t) * 8,
1457                                             PAGE_SIZE, AMDGPU_GEM_DOMAIN_GTT,
1458                                             &adev->wb.wb_obj, &adev->wb.gpu_addr,
1459                                             (void **)&adev->wb.wb);
1460                 if (r) {
1461                         dev_warn(adev->dev, "(%d) create WB bo failed\n", r);
1462                         return r;
1463                 }
1464
1465                 adev->wb.num_wb = AMDGPU_MAX_WB;
1466                 memset(&adev->wb.used, 0, sizeof(adev->wb.used));
1467
1468                 /* clear wb memory */
1469                 memset((char *)adev->wb.wb, 0, AMDGPU_MAX_WB * sizeof(uint32_t) * 8);
1470         }
1471
1472         return 0;
1473 }
1474
1475 /**
1476  * amdgpu_device_wb_get - Allocate a wb entry
1477  *
1478  * @adev: amdgpu_device pointer
1479  * @wb: wb index
1480  *
1481  * Allocate a wb slot for use by the driver (all asics).
1482  * Returns 0 on success or -EINVAL on failure.
1483  */
1484 int amdgpu_device_wb_get(struct amdgpu_device *adev, u32 *wb)
1485 {
1486         unsigned long flags, offset;
1487
1488         spin_lock_irqsave(&adev->wb.lock, flags);
1489         offset = find_first_zero_bit(adev->wb.used, adev->wb.num_wb);
1490         if (offset < adev->wb.num_wb) {
1491                 __set_bit(offset, adev->wb.used);
1492                 spin_unlock_irqrestore(&adev->wb.lock, flags);
1493                 *wb = offset << 3; /* convert to dw offset */
1494                 return 0;
1495         } else {
1496                 spin_unlock_irqrestore(&adev->wb.lock, flags);
1497                 return -EINVAL;
1498         }
1499 }
1500
1501 /**
1502  * amdgpu_device_wb_free - Free a wb entry
1503  *
1504  * @adev: amdgpu_device pointer
1505  * @wb: wb index
1506  *
1507  * Free a wb slot allocated for use by the driver (all asics)
1508  */
1509 void amdgpu_device_wb_free(struct amdgpu_device *adev, u32 wb)
1510 {
1511         unsigned long flags;
1512
1513         wb >>= 3;
1514         spin_lock_irqsave(&adev->wb.lock, flags);
1515         if (wb < adev->wb.num_wb)
1516                 __clear_bit(wb, adev->wb.used);
1517         spin_unlock_irqrestore(&adev->wb.lock, flags);
1518 }
1519
1520 /**
1521  * amdgpu_device_resize_fb_bar - try to resize FB BAR
1522  *
1523  * @adev: amdgpu_device pointer
1524  *
1525  * Try to resize FB BAR to make all VRAM CPU accessible. We try very hard not
1526  * to fail, but if any of the BARs is not accessible after the size we abort
1527  * driver loading by returning -ENODEV.
1528  */
1529 int amdgpu_device_resize_fb_bar(struct amdgpu_device *adev)
1530 {
1531         int rbar_size = pci_rebar_bytes_to_size(adev->gmc.real_vram_size);
1532         struct pci_bus *root;
1533         struct resource *res;
1534         unsigned int i;
1535         u16 cmd;
1536         int r;
1537
1538         if (!IS_ENABLED(CONFIG_PHYS_ADDR_T_64BIT))
1539                 return 0;
1540
1541         /* Bypass for VF */
1542         if (amdgpu_sriov_vf(adev))
1543                 return 0;
1544
1545         /* PCI_EXT_CAP_ID_VNDR extended capability is located at 0x100 */
1546         if (!pci_find_ext_capability(adev->pdev, PCI_EXT_CAP_ID_VNDR))
1547                 DRM_WARN("System can't access extended configuration space, please check!!\n");
1548
1549         /* skip if the bios has already enabled large BAR */
1550         if (adev->gmc.real_vram_size &&
1551             (pci_resource_len(adev->pdev, 0) >= adev->gmc.real_vram_size))
1552                 return 0;
1553
1554         /* Check if the root BUS has 64bit memory resources */
1555         root = adev->pdev->bus;
1556         while (root->parent)
1557                 root = root->parent;
1558
1559         pci_bus_for_each_resource(root, res, i) {
1560                 if (res && res->flags & (IORESOURCE_MEM | IORESOURCE_MEM_64) &&
1561                     res->start > 0x100000000ull)
1562                         break;
1563         }
1564
1565         /* Trying to resize is pointless without a root hub window above 4GB */
1566         if (!res)
1567                 return 0;
1568
1569         /* Limit the BAR size to what is available */
1570         rbar_size = min(fls(pci_rebar_get_possible_sizes(adev->pdev, 0)) - 1,
1571                         rbar_size);
1572
1573         /* Disable memory decoding while we change the BAR addresses and size */
1574         pci_read_config_word(adev->pdev, PCI_COMMAND, &cmd);
1575         pci_write_config_word(adev->pdev, PCI_COMMAND,
1576                               cmd & ~PCI_COMMAND_MEMORY);
1577
1578         /* Free the VRAM and doorbell BAR, we most likely need to move both. */
1579         amdgpu_doorbell_fini(adev);
1580         if (adev->asic_type >= CHIP_BONAIRE)
1581                 pci_release_resource(adev->pdev, 2);
1582
1583         pci_release_resource(adev->pdev, 0);
1584
1585         r = pci_resize_resource(adev->pdev, 0, rbar_size);
1586         if (r == -ENOSPC)
1587                 DRM_INFO("Not enough PCI address space for a large BAR.");
1588         else if (r && r != -ENOTSUPP)
1589                 DRM_ERROR("Problem resizing BAR0 (%d).", r);
1590
1591         pci_assign_unassigned_bus_resources(adev->pdev->bus);
1592
1593         /* When the doorbell or fb BAR isn't available we have no chance of
1594          * using the device.
1595          */
1596         r = amdgpu_doorbell_init(adev);
1597         if (r || (pci_resource_flags(adev->pdev, 0) & IORESOURCE_UNSET))
1598                 return -ENODEV;
1599
1600         pci_write_config_word(adev->pdev, PCI_COMMAND, cmd);
1601
1602         return 0;
1603 }
1604
1605 static bool amdgpu_device_read_bios(struct amdgpu_device *adev)
1606 {
1607         if (hweight32(adev->aid_mask) && (adev->flags & AMD_IS_APU))
1608                 return false;
1609
1610         return true;
1611 }
1612
1613 /*
1614  * GPU helpers function.
1615  */
1616 /**
1617  * amdgpu_device_need_post - check if the hw need post or not
1618  *
1619  * @adev: amdgpu_device pointer
1620  *
1621  * Check if the asic has been initialized (all asics) at driver startup
1622  * or post is needed if  hw reset is performed.
1623  * Returns true if need or false if not.
1624  */
1625 bool amdgpu_device_need_post(struct amdgpu_device *adev)
1626 {
1627         uint32_t reg;
1628
1629         if (amdgpu_sriov_vf(adev))
1630                 return false;
1631
1632         if (!amdgpu_device_read_bios(adev))
1633                 return false;
1634
1635         if (amdgpu_passthrough(adev)) {
1636                 /* for FIJI: In whole GPU pass-through virtualization case, after VM reboot
1637                  * some old smc fw still need driver do vPost otherwise gpu hang, while
1638                  * those smc fw version above 22.15 doesn't have this flaw, so we force
1639                  * vpost executed for smc version below 22.15
1640                  */
1641                 if (adev->asic_type == CHIP_FIJI) {
1642                         int err;
1643                         uint32_t fw_ver;
1644
1645                         err = request_firmware(&adev->pm.fw, "amdgpu/fiji_smc.bin", adev->dev);
1646                         /* force vPost if error occured */
1647                         if (err)
1648                                 return true;
1649
1650                         fw_ver = *((uint32_t *)adev->pm.fw->data + 69);
1651                         release_firmware(adev->pm.fw);
1652                         if (fw_ver < 0x00160e00)
1653                                 return true;
1654                 }
1655         }
1656
1657         /* Don't post if we need to reset whole hive on init */
1658         if (adev->gmc.xgmi.pending_reset)
1659                 return false;
1660
1661         if (adev->has_hw_reset) {
1662                 adev->has_hw_reset = false;
1663                 return true;
1664         }
1665
1666         /* bios scratch used on CIK+ */
1667         if (adev->asic_type >= CHIP_BONAIRE)
1668                 return amdgpu_atombios_scratch_need_asic_init(adev);
1669
1670         /* check MEM_SIZE for older asics */
1671         reg = amdgpu_asic_get_config_memsize(adev);
1672
1673         if ((reg != 0) && (reg != 0xffffffff))
1674                 return false;
1675
1676         return true;
1677 }
1678
1679 /*
1680  * Check whether seamless boot is supported.
1681  *
1682  * So far we only support seamless boot on DCE 3.0 or later.
1683  * If users report that it works on older ASICS as well, we may
1684  * loosen this.
1685  */
1686 bool amdgpu_device_seamless_boot_supported(struct amdgpu_device *adev)
1687 {
1688         switch (amdgpu_seamless) {
1689         case -1:
1690                 break;
1691         case 1:
1692                 return true;
1693         case 0:
1694                 return false;
1695         default:
1696                 DRM_ERROR("Invalid value for amdgpu.seamless: %d\n",
1697                           amdgpu_seamless);
1698                 return false;
1699         }
1700
1701         if (!(adev->flags & AMD_IS_APU))
1702                 return false;
1703
1704         if (adev->mman.keep_stolen_vga_memory)
1705                 return false;
1706
1707         return amdgpu_ip_version(adev, DCE_HWIP, 0) >= IP_VERSION(3, 0, 0);
1708 }
1709
1710 /*
1711  * Intel hosts such as Rocket Lake, Alder Lake, Raptor Lake and Sapphire Rapids
1712  * don't support dynamic speed switching. Until we have confirmation from Intel
1713  * that a specific host supports it, it's safer that we keep it disabled for all.
1714  *
1715  * https://edc.intel.com/content/www/us/en/design/products/platforms/details/raptor-lake-s/13th-generation-core-processors-datasheet-volume-1-of-2/005/pci-express-support/
1716  * https://gitlab.freedesktop.org/drm/amd/-/issues/2663
1717  */
1718 static bool amdgpu_device_pcie_dynamic_switching_supported(struct amdgpu_device *adev)
1719 {
1720 #if IS_ENABLED(CONFIG_X86)
1721         struct cpuinfo_x86 *c = &cpu_data(0);
1722
1723         /* eGPU change speeds based on USB4 fabric conditions */
1724         if (dev_is_removable(adev->dev))
1725                 return true;
1726
1727         if (c->x86_vendor == X86_VENDOR_INTEL)
1728                 return false;
1729 #endif
1730         return true;
1731 }
1732
1733 /**
1734  * amdgpu_device_should_use_aspm - check if the device should program ASPM
1735  *
1736  * @adev: amdgpu_device pointer
1737  *
1738  * Confirm whether the module parameter and pcie bridge agree that ASPM should
1739  * be set for this device.
1740  *
1741  * Returns true if it should be used or false if not.
1742  */
1743 bool amdgpu_device_should_use_aspm(struct amdgpu_device *adev)
1744 {
1745         switch (amdgpu_aspm) {
1746         case -1:
1747                 break;
1748         case 0:
1749                 return false;
1750         case 1:
1751                 return true;
1752         default:
1753                 return false;
1754         }
1755         if (adev->flags & AMD_IS_APU)
1756                 return false;
1757         if (!(adev->pm.pp_feature & PP_PCIE_DPM_MASK))
1758                 return false;
1759         return pcie_aspm_enabled(adev->pdev);
1760 }
1761
1762 /* if we get transitioned to only one device, take VGA back */
1763 /**
1764  * amdgpu_device_vga_set_decode - enable/disable vga decode
1765  *
1766  * @pdev: PCI device pointer
1767  * @state: enable/disable vga decode
1768  *
1769  * Enable/disable vga decode (all asics).
1770  * Returns VGA resource flags.
1771  */
1772 static unsigned int amdgpu_device_vga_set_decode(struct pci_dev *pdev,
1773                 bool state)
1774 {
1775         struct amdgpu_device *adev = drm_to_adev(pci_get_drvdata(pdev));
1776
1777         amdgpu_asic_set_vga_state(adev, state);
1778         if (state)
1779                 return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
1780                        VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1781         else
1782                 return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1783 }
1784
1785 /**
1786  * amdgpu_device_check_block_size - validate the vm block size
1787  *
1788  * @adev: amdgpu_device pointer
1789  *
1790  * Validates the vm block size specified via module parameter.
1791  * The vm block size defines number of bits in page table versus page directory,
1792  * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
1793  * page table and the remaining bits are in the page directory.
1794  */
1795 static void amdgpu_device_check_block_size(struct amdgpu_device *adev)
1796 {
1797         /* defines number of bits in page table versus page directory,
1798          * a page is 4KB so we have 12 bits offset, minimum 9 bits in the
1799          * page table and the remaining bits are in the page directory
1800          */
1801         if (amdgpu_vm_block_size == -1)
1802                 return;
1803
1804         if (amdgpu_vm_block_size < 9) {
1805                 dev_warn(adev->dev, "VM page table size (%d) too small\n",
1806                          amdgpu_vm_block_size);
1807                 amdgpu_vm_block_size = -1;
1808         }
1809 }
1810
1811 /**
1812  * amdgpu_device_check_vm_size - validate the vm size
1813  *
1814  * @adev: amdgpu_device pointer
1815  *
1816  * Validates the vm size in GB specified via module parameter.
1817  * The VM size is the size of the GPU virtual memory space in GB.
1818  */
1819 static void amdgpu_device_check_vm_size(struct amdgpu_device *adev)
1820 {
1821         /* no need to check the default value */
1822         if (amdgpu_vm_size == -1)
1823                 return;
1824
1825         if (amdgpu_vm_size < 1) {
1826                 dev_warn(adev->dev, "VM size (%d) too small, min is 1GB\n",
1827                          amdgpu_vm_size);
1828                 amdgpu_vm_size = -1;
1829         }
1830 }
1831
1832 static void amdgpu_device_check_smu_prv_buffer_size(struct amdgpu_device *adev)
1833 {
1834         struct sysinfo si;
1835         bool is_os_64 = (sizeof(void *) == 8);
1836         uint64_t total_memory;
1837         uint64_t dram_size_seven_GB = 0x1B8000000;
1838         uint64_t dram_size_three_GB = 0xB8000000;
1839
1840         if (amdgpu_smu_memory_pool_size == 0)
1841                 return;
1842
1843         if (!is_os_64) {
1844                 DRM_WARN("Not 64-bit OS, feature not supported\n");
1845                 goto def_value;
1846         }
1847         si_meminfo(&si);
1848         total_memory = (uint64_t)si.totalram * si.mem_unit;
1849
1850         if ((amdgpu_smu_memory_pool_size == 1) ||
1851                 (amdgpu_smu_memory_pool_size == 2)) {
1852                 if (total_memory < dram_size_three_GB)
1853                         goto def_value1;
1854         } else if ((amdgpu_smu_memory_pool_size == 4) ||
1855                 (amdgpu_smu_memory_pool_size == 8)) {
1856                 if (total_memory < dram_size_seven_GB)
1857                         goto def_value1;
1858         } else {
1859                 DRM_WARN("Smu memory pool size not supported\n");
1860                 goto def_value;
1861         }
1862         adev->pm.smu_prv_buffer_size = amdgpu_smu_memory_pool_size << 28;
1863
1864         return;
1865
1866 def_value1:
1867         DRM_WARN("No enough system memory\n");
1868 def_value:
1869         adev->pm.smu_prv_buffer_size = 0;
1870 }
1871
1872 static int amdgpu_device_init_apu_flags(struct amdgpu_device *adev)
1873 {
1874         if (!(adev->flags & AMD_IS_APU) ||
1875             adev->asic_type < CHIP_RAVEN)
1876                 return 0;
1877
1878         switch (adev->asic_type) {
1879         case CHIP_RAVEN:
1880                 if (adev->pdev->device == 0x15dd)
1881                         adev->apu_flags |= AMD_APU_IS_RAVEN;
1882                 if (adev->pdev->device == 0x15d8)
1883                         adev->apu_flags |= AMD_APU_IS_PICASSO;
1884                 break;
1885         case CHIP_RENOIR:
1886                 if ((adev->pdev->device == 0x1636) ||
1887                     (adev->pdev->device == 0x164c))
1888                         adev->apu_flags |= AMD_APU_IS_RENOIR;
1889                 else
1890                         adev->apu_flags |= AMD_APU_IS_GREEN_SARDINE;
1891                 break;
1892         case CHIP_VANGOGH:
1893                 adev->apu_flags |= AMD_APU_IS_VANGOGH;
1894                 break;
1895         case CHIP_YELLOW_CARP:
1896                 break;
1897         case CHIP_CYAN_SKILLFISH:
1898                 if ((adev->pdev->device == 0x13FE) ||
1899                     (adev->pdev->device == 0x143F))
1900                         adev->apu_flags |= AMD_APU_IS_CYAN_SKILLFISH2;
1901                 break;
1902         default:
1903                 break;
1904         }
1905
1906         return 0;
1907 }
1908
1909 /**
1910  * amdgpu_device_check_arguments - validate module params
1911  *
1912  * @adev: amdgpu_device pointer
1913  *
1914  * Validates certain module parameters and updates
1915  * the associated values used by the driver (all asics).
1916  */
1917 static int amdgpu_device_check_arguments(struct amdgpu_device *adev)
1918 {
1919         int i;
1920
1921         if (amdgpu_sched_jobs < 4) {
1922                 dev_warn(adev->dev, "sched jobs (%d) must be at least 4\n",
1923                          amdgpu_sched_jobs);
1924                 amdgpu_sched_jobs = 4;
1925         } else if (!is_power_of_2(amdgpu_sched_jobs)) {
1926                 dev_warn(adev->dev, "sched jobs (%d) must be a power of 2\n",
1927                          amdgpu_sched_jobs);
1928                 amdgpu_sched_jobs = roundup_pow_of_two(amdgpu_sched_jobs);
1929         }
1930
1931         if (amdgpu_gart_size != -1 && amdgpu_gart_size < 32) {
1932                 /* gart size must be greater or equal to 32M */
1933                 dev_warn(adev->dev, "gart size (%d) too small\n",
1934                          amdgpu_gart_size);
1935                 amdgpu_gart_size = -1;
1936         }
1937
1938         if (amdgpu_gtt_size != -1 && amdgpu_gtt_size < 32) {
1939                 /* gtt size must be greater or equal to 32M */
1940                 dev_warn(adev->dev, "gtt size (%d) too small\n",
1941                                  amdgpu_gtt_size);
1942                 amdgpu_gtt_size = -1;
1943         }
1944
1945         /* valid range is between 4 and 9 inclusive */
1946         if (amdgpu_vm_fragment_size != -1 &&
1947             (amdgpu_vm_fragment_size > 9 || amdgpu_vm_fragment_size < 4)) {
1948                 dev_warn(adev->dev, "valid range is between 4 and 9\n");
1949                 amdgpu_vm_fragment_size = -1;
1950         }
1951
1952         if (amdgpu_sched_hw_submission < 2) {
1953                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be at least 2\n",
1954                          amdgpu_sched_hw_submission);
1955                 amdgpu_sched_hw_submission = 2;
1956         } else if (!is_power_of_2(amdgpu_sched_hw_submission)) {
1957                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be a power of 2\n",
1958                          amdgpu_sched_hw_submission);
1959                 amdgpu_sched_hw_submission = roundup_pow_of_two(amdgpu_sched_hw_submission);
1960         }
1961
1962         if (amdgpu_reset_method < -1 || amdgpu_reset_method > 4) {
1963                 dev_warn(adev->dev, "invalid option for reset method, reverting to default\n");
1964                 amdgpu_reset_method = -1;
1965         }
1966
1967         amdgpu_device_check_smu_prv_buffer_size(adev);
1968
1969         amdgpu_device_check_vm_size(adev);
1970
1971         amdgpu_device_check_block_size(adev);
1972
1973         adev->firmware.load_type = amdgpu_ucode_get_load_type(adev, amdgpu_fw_load_type);
1974
1975         for (i = 0; i < MAX_XCP; i++)
1976                 adev->enforce_isolation[i] = !!enforce_isolation;
1977
1978         return 0;
1979 }
1980
1981 /**
1982  * amdgpu_switcheroo_set_state - set switcheroo state
1983  *
1984  * @pdev: pci dev pointer
1985  * @state: vga_switcheroo state
1986  *
1987  * Callback for the switcheroo driver.  Suspends or resumes
1988  * the asics before or after it is powered up using ACPI methods.
1989  */
1990 static void amdgpu_switcheroo_set_state(struct pci_dev *pdev,
1991                                         enum vga_switcheroo_state state)
1992 {
1993         struct drm_device *dev = pci_get_drvdata(pdev);
1994         int r;
1995
1996         if (amdgpu_device_supports_px(dev) && state == VGA_SWITCHEROO_OFF)
1997                 return;
1998
1999         if (state == VGA_SWITCHEROO_ON) {
2000                 pr_info("switched on\n");
2001                 /* don't suspend or resume card normally */
2002                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
2003
2004                 pci_set_power_state(pdev, PCI_D0);
2005                 amdgpu_device_load_pci_state(pdev);
2006                 r = pci_enable_device(pdev);
2007                 if (r)
2008                         DRM_WARN("pci_enable_device failed (%d)\n", r);
2009                 amdgpu_device_resume(dev, true);
2010
2011                 dev->switch_power_state = DRM_SWITCH_POWER_ON;
2012         } else {
2013                 pr_info("switched off\n");
2014                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
2015                 amdgpu_device_prepare(dev);
2016                 amdgpu_device_suspend(dev, true);
2017                 amdgpu_device_cache_pci_state(pdev);
2018                 /* Shut down the device */
2019                 pci_disable_device(pdev);
2020                 pci_set_power_state(pdev, PCI_D3cold);
2021                 dev->switch_power_state = DRM_SWITCH_POWER_OFF;
2022         }
2023 }
2024
2025 /**
2026  * amdgpu_switcheroo_can_switch - see if switcheroo state can change
2027  *
2028  * @pdev: pci dev pointer
2029  *
2030  * Callback for the switcheroo driver.  Check of the switcheroo
2031  * state can be changed.
2032  * Returns true if the state can be changed, false if not.
2033  */
2034 static bool amdgpu_switcheroo_can_switch(struct pci_dev *pdev)
2035 {
2036         struct drm_device *dev = pci_get_drvdata(pdev);
2037
2038        /*
2039         * FIXME: open_count is protected by drm_global_mutex but that would lead to
2040         * locking inversion with the driver load path. And the access here is
2041         * completely racy anyway. So don't bother with locking for now.
2042         */
2043         return atomic_read(&dev->open_count) == 0;
2044 }
2045
2046 static const struct vga_switcheroo_client_ops amdgpu_switcheroo_ops = {
2047         .set_gpu_state = amdgpu_switcheroo_set_state,
2048         .reprobe = NULL,
2049         .can_switch = amdgpu_switcheroo_can_switch,
2050 };
2051
2052 /**
2053  * amdgpu_device_ip_set_clockgating_state - set the CG state
2054  *
2055  * @dev: amdgpu_device pointer
2056  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2057  * @state: clockgating state (gate or ungate)
2058  *
2059  * Sets the requested clockgating state for all instances of
2060  * the hardware IP specified.
2061  * Returns the error code from the last instance.
2062  */
2063 int amdgpu_device_ip_set_clockgating_state(void *dev,
2064                                            enum amd_ip_block_type block_type,
2065                                            enum amd_clockgating_state state)
2066 {
2067         struct amdgpu_device *adev = dev;
2068         int i, r = 0;
2069
2070         for (i = 0; i < adev->num_ip_blocks; i++) {
2071                 if (!adev->ip_blocks[i].status.valid)
2072                         continue;
2073                 if (adev->ip_blocks[i].version->type != block_type)
2074                         continue;
2075                 if (!adev->ip_blocks[i].version->funcs->set_clockgating_state)
2076                         continue;
2077                 r = adev->ip_blocks[i].version->funcs->set_clockgating_state(
2078                         (void *)adev, state);
2079                 if (r)
2080                         DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
2081                                   adev->ip_blocks[i].version->funcs->name, r);
2082         }
2083         return r;
2084 }
2085
2086 /**
2087  * amdgpu_device_ip_set_powergating_state - set the PG state
2088  *
2089  * @dev: amdgpu_device pointer
2090  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2091  * @state: powergating state (gate or ungate)
2092  *
2093  * Sets the requested powergating state for all instances of
2094  * the hardware IP specified.
2095  * Returns the error code from the last instance.
2096  */
2097 int amdgpu_device_ip_set_powergating_state(void *dev,
2098                                            enum amd_ip_block_type block_type,
2099                                            enum amd_powergating_state state)
2100 {
2101         struct amdgpu_device *adev = dev;
2102         int i, r = 0;
2103
2104         for (i = 0; i < adev->num_ip_blocks; i++) {
2105                 if (!adev->ip_blocks[i].status.valid)
2106                         continue;
2107                 if (adev->ip_blocks[i].version->type != block_type)
2108                         continue;
2109                 if (!adev->ip_blocks[i].version->funcs->set_powergating_state)
2110                         continue;
2111                 r = adev->ip_blocks[i].version->funcs->set_powergating_state(
2112                         (void *)adev, state);
2113                 if (r)
2114                         DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
2115                                   adev->ip_blocks[i].version->funcs->name, r);
2116         }
2117         return r;
2118 }
2119
2120 /**
2121  * amdgpu_device_ip_get_clockgating_state - get the CG state
2122  *
2123  * @adev: amdgpu_device pointer
2124  * @flags: clockgating feature flags
2125  *
2126  * Walks the list of IPs on the device and updates the clockgating
2127  * flags for each IP.
2128  * Updates @flags with the feature flags for each hardware IP where
2129  * clockgating is enabled.
2130  */
2131 void amdgpu_device_ip_get_clockgating_state(struct amdgpu_device *adev,
2132                                             u64 *flags)
2133 {
2134         int i;
2135
2136         for (i = 0; i < adev->num_ip_blocks; i++) {
2137                 if (!adev->ip_blocks[i].status.valid)
2138                         continue;
2139                 if (adev->ip_blocks[i].version->funcs->get_clockgating_state)
2140                         adev->ip_blocks[i].version->funcs->get_clockgating_state((void *)adev, flags);
2141         }
2142 }
2143
2144 /**
2145  * amdgpu_device_ip_wait_for_idle - wait for idle
2146  *
2147  * @adev: amdgpu_device pointer
2148  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2149  *
2150  * Waits for the request hardware IP to be idle.
2151  * Returns 0 for success or a negative error code on failure.
2152  */
2153 int amdgpu_device_ip_wait_for_idle(struct amdgpu_device *adev,
2154                                    enum amd_ip_block_type block_type)
2155 {
2156         int i, r;
2157
2158         for (i = 0; i < adev->num_ip_blocks; i++) {
2159                 if (!adev->ip_blocks[i].status.valid)
2160                         continue;
2161                 if (adev->ip_blocks[i].version->type == block_type) {
2162                         r = adev->ip_blocks[i].version->funcs->wait_for_idle((void *)adev);
2163                         if (r)
2164                                 return r;
2165                         break;
2166                 }
2167         }
2168         return 0;
2169
2170 }
2171
2172 /**
2173  * amdgpu_device_ip_is_idle - is the hardware IP idle
2174  *
2175  * @adev: amdgpu_device pointer
2176  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2177  *
2178  * Check if the hardware IP is idle or not.
2179  * Returns true if it the IP is idle, false if not.
2180  */
2181 bool amdgpu_device_ip_is_idle(struct amdgpu_device *adev,
2182                               enum amd_ip_block_type block_type)
2183 {
2184         int i;
2185
2186         for (i = 0; i < adev->num_ip_blocks; i++) {
2187                 if (!adev->ip_blocks[i].status.valid)
2188                         continue;
2189                 if (adev->ip_blocks[i].version->type == block_type)
2190                         return adev->ip_blocks[i].version->funcs->is_idle((void *)adev);
2191         }
2192         return true;
2193
2194 }
2195
2196 /**
2197  * amdgpu_device_ip_get_ip_block - get a hw IP pointer
2198  *
2199  * @adev: amdgpu_device pointer
2200  * @type: Type of hardware IP (SMU, GFX, UVD, etc.)
2201  *
2202  * Returns a pointer to the hardware IP block structure
2203  * if it exists for the asic, otherwise NULL.
2204  */
2205 struct amdgpu_ip_block *
2206 amdgpu_device_ip_get_ip_block(struct amdgpu_device *adev,
2207                               enum amd_ip_block_type type)
2208 {
2209         int i;
2210
2211         for (i = 0; i < adev->num_ip_blocks; i++)
2212                 if (adev->ip_blocks[i].version->type == type)
2213                         return &adev->ip_blocks[i];
2214
2215         return NULL;
2216 }
2217
2218 /**
2219  * amdgpu_device_ip_block_version_cmp
2220  *
2221  * @adev: amdgpu_device pointer
2222  * @type: enum amd_ip_block_type
2223  * @major: major version
2224  * @minor: minor version
2225  *
2226  * return 0 if equal or greater
2227  * return 1 if smaller or the ip_block doesn't exist
2228  */
2229 int amdgpu_device_ip_block_version_cmp(struct amdgpu_device *adev,
2230                                        enum amd_ip_block_type type,
2231                                        u32 major, u32 minor)
2232 {
2233         struct amdgpu_ip_block *ip_block = amdgpu_device_ip_get_ip_block(adev, type);
2234
2235         if (ip_block && ((ip_block->version->major > major) ||
2236                         ((ip_block->version->major == major) &&
2237                         (ip_block->version->minor >= minor))))
2238                 return 0;
2239
2240         return 1;
2241 }
2242
2243 /**
2244  * amdgpu_device_ip_block_add
2245  *
2246  * @adev: amdgpu_device pointer
2247  * @ip_block_version: pointer to the IP to add
2248  *
2249  * Adds the IP block driver information to the collection of IPs
2250  * on the asic.
2251  */
2252 int amdgpu_device_ip_block_add(struct amdgpu_device *adev,
2253                                const struct amdgpu_ip_block_version *ip_block_version)
2254 {
2255         if (!ip_block_version)
2256                 return -EINVAL;
2257
2258         switch (ip_block_version->type) {
2259         case AMD_IP_BLOCK_TYPE_VCN:
2260                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_VCN_MASK)
2261                         return 0;
2262                 break;
2263         case AMD_IP_BLOCK_TYPE_JPEG:
2264                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_JPEG_MASK)
2265                         return 0;
2266                 break;
2267         default:
2268                 break;
2269         }
2270
2271         DRM_INFO("add ip block number %d <%s>\n", adev->num_ip_blocks,
2272                   ip_block_version->funcs->name);
2273
2274         adev->ip_blocks[adev->num_ip_blocks++].version = ip_block_version;
2275
2276         return 0;
2277 }
2278
2279 /**
2280  * amdgpu_device_enable_virtual_display - enable virtual display feature
2281  *
2282  * @adev: amdgpu_device pointer
2283  *
2284  * Enabled the virtual display feature if the user has enabled it via
2285  * the module parameter virtual_display.  This feature provides a virtual
2286  * display hardware on headless boards or in virtualized environments.
2287  * This function parses and validates the configuration string specified by
2288  * the user and configues the virtual display configuration (number of
2289  * virtual connectors, crtcs, etc.) specified.
2290  */
2291 static void amdgpu_device_enable_virtual_display(struct amdgpu_device *adev)
2292 {
2293         adev->enable_virtual_display = false;
2294
2295         if (amdgpu_virtual_display) {
2296                 const char *pci_address_name = pci_name(adev->pdev);
2297                 char *pciaddstr, *pciaddstr_tmp, *pciaddname_tmp, *pciaddname;
2298
2299                 pciaddstr = kstrdup(amdgpu_virtual_display, GFP_KERNEL);
2300                 pciaddstr_tmp = pciaddstr;
2301                 while ((pciaddname_tmp = strsep(&pciaddstr_tmp, ";"))) {
2302                         pciaddname = strsep(&pciaddname_tmp, ",");
2303                         if (!strcmp("all", pciaddname)
2304                             || !strcmp(pci_address_name, pciaddname)) {
2305                                 long num_crtc;
2306                                 int res = -1;
2307
2308                                 adev->enable_virtual_display = true;
2309
2310                                 if (pciaddname_tmp)
2311                                         res = kstrtol(pciaddname_tmp, 10,
2312                                                       &num_crtc);
2313
2314                                 if (!res) {
2315                                         if (num_crtc < 1)
2316                                                 num_crtc = 1;
2317                                         if (num_crtc > 6)
2318                                                 num_crtc = 6;
2319                                         adev->mode_info.num_crtc = num_crtc;
2320                                 } else {
2321                                         adev->mode_info.num_crtc = 1;
2322                                 }
2323                                 break;
2324                         }
2325                 }
2326
2327                 DRM_INFO("virtual display string:%s, %s:virtual_display:%d, num_crtc:%d\n",
2328                          amdgpu_virtual_display, pci_address_name,
2329                          adev->enable_virtual_display, adev->mode_info.num_crtc);
2330
2331                 kfree(pciaddstr);
2332         }
2333 }
2334
2335 void amdgpu_device_set_sriov_virtual_display(struct amdgpu_device *adev)
2336 {
2337         if (amdgpu_sriov_vf(adev) && !adev->enable_virtual_display) {
2338                 adev->mode_info.num_crtc = 1;
2339                 adev->enable_virtual_display = true;
2340                 DRM_INFO("virtual_display:%d, num_crtc:%d\n",
2341                          adev->enable_virtual_display, adev->mode_info.num_crtc);
2342         }
2343 }
2344
2345 /**
2346  * amdgpu_device_parse_gpu_info_fw - parse gpu info firmware
2347  *
2348  * @adev: amdgpu_device pointer
2349  *
2350  * Parses the asic configuration parameters specified in the gpu info
2351  * firmware and makes them availale to the driver for use in configuring
2352  * the asic.
2353  * Returns 0 on success, -EINVAL on failure.
2354  */
2355 static int amdgpu_device_parse_gpu_info_fw(struct amdgpu_device *adev)
2356 {
2357         const char *chip_name;
2358         int err;
2359         const struct gpu_info_firmware_header_v1_0 *hdr;
2360
2361         adev->firmware.gpu_info_fw = NULL;
2362
2363         if (adev->mman.discovery_bin)
2364                 return 0;
2365
2366         switch (adev->asic_type) {
2367         default:
2368                 return 0;
2369         case CHIP_VEGA10:
2370                 chip_name = "vega10";
2371                 break;
2372         case CHIP_VEGA12:
2373                 chip_name = "vega12";
2374                 break;
2375         case CHIP_RAVEN:
2376                 if (adev->apu_flags & AMD_APU_IS_RAVEN2)
2377                         chip_name = "raven2";
2378                 else if (adev->apu_flags & AMD_APU_IS_PICASSO)
2379                         chip_name = "picasso";
2380                 else
2381                         chip_name = "raven";
2382                 break;
2383         case CHIP_ARCTURUS:
2384                 chip_name = "arcturus";
2385                 break;
2386         case CHIP_NAVI12:
2387                 chip_name = "navi12";
2388                 break;
2389         }
2390
2391         err = amdgpu_ucode_request(adev, &adev->firmware.gpu_info_fw,
2392                                    "amdgpu/%s_gpu_info.bin", chip_name);
2393         if (err) {
2394                 dev_err(adev->dev,
2395                         "Failed to get gpu_info firmware \"%s_gpu_info.bin\"\n",
2396                         chip_name);
2397                 goto out;
2398         }
2399
2400         hdr = (const struct gpu_info_firmware_header_v1_0 *)adev->firmware.gpu_info_fw->data;
2401         amdgpu_ucode_print_gpu_info_hdr(&hdr->header);
2402
2403         switch (hdr->version_major) {
2404         case 1:
2405         {
2406                 const struct gpu_info_firmware_v1_0 *gpu_info_fw =
2407                         (const struct gpu_info_firmware_v1_0 *)(adev->firmware.gpu_info_fw->data +
2408                                                                 le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2409
2410                 /*
2411                  * Should be droped when DAL no longer needs it.
2412                  */
2413                 if (adev->asic_type == CHIP_NAVI12)
2414                         goto parse_soc_bounding_box;
2415
2416                 adev->gfx.config.max_shader_engines = le32_to_cpu(gpu_info_fw->gc_num_se);
2417                 adev->gfx.config.max_cu_per_sh = le32_to_cpu(gpu_info_fw->gc_num_cu_per_sh);
2418                 adev->gfx.config.max_sh_per_se = le32_to_cpu(gpu_info_fw->gc_num_sh_per_se);
2419                 adev->gfx.config.max_backends_per_se = le32_to_cpu(gpu_info_fw->gc_num_rb_per_se);
2420                 adev->gfx.config.max_texture_channel_caches =
2421                         le32_to_cpu(gpu_info_fw->gc_num_tccs);
2422                 adev->gfx.config.max_gprs = le32_to_cpu(gpu_info_fw->gc_num_gprs);
2423                 adev->gfx.config.max_gs_threads = le32_to_cpu(gpu_info_fw->gc_num_max_gs_thds);
2424                 adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gpu_info_fw->gc_gs_table_depth);
2425                 adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gpu_info_fw->gc_gsprim_buff_depth);
2426                 adev->gfx.config.double_offchip_lds_buf =
2427                         le32_to_cpu(gpu_info_fw->gc_double_offchip_lds_buffer);
2428                 adev->gfx.cu_info.wave_front_size = le32_to_cpu(gpu_info_fw->gc_wave_size);
2429                 adev->gfx.cu_info.max_waves_per_simd =
2430                         le32_to_cpu(gpu_info_fw->gc_max_waves_per_simd);
2431                 adev->gfx.cu_info.max_scratch_slots_per_cu =
2432                         le32_to_cpu(gpu_info_fw->gc_max_scratch_slots_per_cu);
2433                 adev->gfx.cu_info.lds_size = le32_to_cpu(gpu_info_fw->gc_lds_size);
2434                 if (hdr->version_minor >= 1) {
2435                         const struct gpu_info_firmware_v1_1 *gpu_info_fw =
2436                                 (const struct gpu_info_firmware_v1_1 *)(adev->firmware.gpu_info_fw->data +
2437                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2438                         adev->gfx.config.num_sc_per_sh =
2439                                 le32_to_cpu(gpu_info_fw->num_sc_per_sh);
2440                         adev->gfx.config.num_packer_per_sc =
2441                                 le32_to_cpu(gpu_info_fw->num_packer_per_sc);
2442                 }
2443
2444 parse_soc_bounding_box:
2445                 /*
2446                  * soc bounding box info is not integrated in disocovery table,
2447                  * we always need to parse it from gpu info firmware if needed.
2448                  */
2449                 if (hdr->version_minor == 2) {
2450                         const struct gpu_info_firmware_v1_2 *gpu_info_fw =
2451                                 (const struct gpu_info_firmware_v1_2 *)(adev->firmware.gpu_info_fw->data +
2452                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2453                         adev->dm.soc_bounding_box = &gpu_info_fw->soc_bounding_box;
2454                 }
2455                 break;
2456         }
2457         default:
2458                 dev_err(adev->dev,
2459                         "Unsupported gpu_info table %d\n", hdr->header.ucode_version);
2460                 err = -EINVAL;
2461                 goto out;
2462         }
2463 out:
2464         return err;
2465 }
2466
2467 /**
2468  * amdgpu_device_ip_early_init - run early init for hardware IPs
2469  *
2470  * @adev: amdgpu_device pointer
2471  *
2472  * Early initialization pass for hardware IPs.  The hardware IPs that make
2473  * up each asic are discovered each IP's early_init callback is run.  This
2474  * is the first stage in initializing the asic.
2475  * Returns 0 on success, negative error code on failure.
2476  */
2477 static int amdgpu_device_ip_early_init(struct amdgpu_device *adev)
2478 {
2479         struct amdgpu_ip_block *ip_block;
2480         struct pci_dev *parent;
2481         int i, r;
2482         bool total;
2483
2484         amdgpu_device_enable_virtual_display(adev);
2485
2486         if (amdgpu_sriov_vf(adev)) {
2487                 r = amdgpu_virt_request_full_gpu(adev, true);
2488                 if (r)
2489                         return r;
2490         }
2491
2492         switch (adev->asic_type) {
2493 #ifdef CONFIG_DRM_AMDGPU_SI
2494         case CHIP_VERDE:
2495         case CHIP_TAHITI:
2496         case CHIP_PITCAIRN:
2497         case CHIP_OLAND:
2498         case CHIP_HAINAN:
2499                 adev->family = AMDGPU_FAMILY_SI;
2500                 r = si_set_ip_blocks(adev);
2501                 if (r)
2502                         return r;
2503                 break;
2504 #endif
2505 #ifdef CONFIG_DRM_AMDGPU_CIK
2506         case CHIP_BONAIRE:
2507         case CHIP_HAWAII:
2508         case CHIP_KAVERI:
2509         case CHIP_KABINI:
2510         case CHIP_MULLINS:
2511                 if (adev->flags & AMD_IS_APU)
2512                         adev->family = AMDGPU_FAMILY_KV;
2513                 else
2514                         adev->family = AMDGPU_FAMILY_CI;
2515
2516                 r = cik_set_ip_blocks(adev);
2517                 if (r)
2518                         return r;
2519                 break;
2520 #endif
2521         case CHIP_TOPAZ:
2522         case CHIP_TONGA:
2523         case CHIP_FIJI:
2524         case CHIP_POLARIS10:
2525         case CHIP_POLARIS11:
2526         case CHIP_POLARIS12:
2527         case CHIP_VEGAM:
2528         case CHIP_CARRIZO:
2529         case CHIP_STONEY:
2530                 if (adev->flags & AMD_IS_APU)
2531                         adev->family = AMDGPU_FAMILY_CZ;
2532                 else
2533                         adev->family = AMDGPU_FAMILY_VI;
2534
2535                 r = vi_set_ip_blocks(adev);
2536                 if (r)
2537                         return r;
2538                 break;
2539         default:
2540                 r = amdgpu_discovery_set_ip_blocks(adev);
2541                 if (r)
2542                         return r;
2543                 break;
2544         }
2545
2546         if (amdgpu_has_atpx() &&
2547             (amdgpu_is_atpx_hybrid() ||
2548              amdgpu_has_atpx_dgpu_power_cntl()) &&
2549             ((adev->flags & AMD_IS_APU) == 0) &&
2550             !dev_is_removable(&adev->pdev->dev))
2551                 adev->flags |= AMD_IS_PX;
2552
2553         if (!(adev->flags & AMD_IS_APU)) {
2554                 parent = pcie_find_root_port(adev->pdev);
2555                 adev->has_pr3 = parent ? pci_pr3_present(parent) : false;
2556         }
2557
2558
2559         adev->pm.pp_feature = amdgpu_pp_feature_mask;
2560         if (amdgpu_sriov_vf(adev) || sched_policy == KFD_SCHED_POLICY_NO_HWS)
2561                 adev->pm.pp_feature &= ~PP_GFXOFF_MASK;
2562         if (amdgpu_sriov_vf(adev) && adev->asic_type == CHIP_SIENNA_CICHLID)
2563                 adev->pm.pp_feature &= ~PP_OVERDRIVE_MASK;
2564         if (!amdgpu_device_pcie_dynamic_switching_supported(adev))
2565                 adev->pm.pp_feature &= ~PP_PCIE_DPM_MASK;
2566
2567         total = true;
2568         for (i = 0; i < adev->num_ip_blocks; i++) {
2569                 if ((amdgpu_ip_block_mask & (1 << i)) == 0) {
2570                         DRM_WARN("disabled ip block: %d <%s>\n",
2571                                   i, adev->ip_blocks[i].version->funcs->name);
2572                         adev->ip_blocks[i].status.valid = false;
2573                 } else {
2574                         if (adev->ip_blocks[i].version->funcs->early_init) {
2575                                 r = adev->ip_blocks[i].version->funcs->early_init((void *)adev);
2576                                 if (r == -ENOENT) {
2577                                         adev->ip_blocks[i].status.valid = false;
2578                                 } else if (r) {
2579                                         DRM_ERROR("early_init of IP block <%s> failed %d\n",
2580                                                   adev->ip_blocks[i].version->funcs->name, r);
2581                                         total = false;
2582                                 } else {
2583                                         adev->ip_blocks[i].status.valid = true;
2584                                 }
2585                         } else {
2586                                 adev->ip_blocks[i].status.valid = true;
2587                         }
2588                 }
2589                 /* get the vbios after the asic_funcs are set up */
2590                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2591                         r = amdgpu_device_parse_gpu_info_fw(adev);
2592                         if (r)
2593                                 return r;
2594
2595                         /* Read BIOS */
2596                         if (amdgpu_device_read_bios(adev)) {
2597                                 if (!amdgpu_get_bios(adev))
2598                                         return -EINVAL;
2599
2600                                 r = amdgpu_atombios_init(adev);
2601                                 if (r) {
2602                                         dev_err(adev->dev, "amdgpu_atombios_init failed\n");
2603                                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_INIT_FAIL, 0, 0);
2604                                         return r;
2605                                 }
2606                         }
2607
2608                         /*get pf2vf msg info at it's earliest time*/
2609                         if (amdgpu_sriov_vf(adev))
2610                                 amdgpu_virt_init_data_exchange(adev);
2611
2612                 }
2613         }
2614         if (!total)
2615                 return -ENODEV;
2616
2617         ip_block = amdgpu_device_ip_get_ip_block(adev, AMD_IP_BLOCK_TYPE_GFX);
2618         if (ip_block->status.valid != false)
2619                 amdgpu_amdkfd_device_probe(adev);
2620
2621         adev->cg_flags &= amdgpu_cg_mask;
2622         adev->pg_flags &= amdgpu_pg_mask;
2623
2624         return 0;
2625 }
2626
2627 static int amdgpu_device_ip_hw_init_phase1(struct amdgpu_device *adev)
2628 {
2629         int i, r;
2630
2631         for (i = 0; i < adev->num_ip_blocks; i++) {
2632                 if (!adev->ip_blocks[i].status.sw)
2633                         continue;
2634                 if (adev->ip_blocks[i].status.hw)
2635                         continue;
2636                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
2637                     (amdgpu_sriov_vf(adev) && (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)) ||
2638                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH) {
2639                         r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2640                         if (r) {
2641                                 DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2642                                           adev->ip_blocks[i].version->funcs->name, r);
2643                                 return r;
2644                         }
2645                         adev->ip_blocks[i].status.hw = true;
2646                 }
2647         }
2648
2649         return 0;
2650 }
2651
2652 static int amdgpu_device_ip_hw_init_phase2(struct amdgpu_device *adev)
2653 {
2654         int i, r;
2655
2656         for (i = 0; i < adev->num_ip_blocks; i++) {
2657                 if (!adev->ip_blocks[i].status.sw)
2658                         continue;
2659                 if (adev->ip_blocks[i].status.hw)
2660                         continue;
2661                 r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2662                 if (r) {
2663                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2664                                   adev->ip_blocks[i].version->funcs->name, r);
2665                         return r;
2666                 }
2667                 adev->ip_blocks[i].status.hw = true;
2668         }
2669
2670         return 0;
2671 }
2672
2673 static int amdgpu_device_fw_loading(struct amdgpu_device *adev)
2674 {
2675         int r = 0;
2676         int i;
2677         uint32_t smu_version;
2678
2679         if (adev->asic_type >= CHIP_VEGA10) {
2680                 for (i = 0; i < adev->num_ip_blocks; i++) {
2681                         if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_PSP)
2682                                 continue;
2683
2684                         if (!adev->ip_blocks[i].status.sw)
2685                                 continue;
2686
2687                         /* no need to do the fw loading again if already done*/
2688                         if (adev->ip_blocks[i].status.hw == true)
2689                                 break;
2690
2691                         if (amdgpu_in_reset(adev) || adev->in_suspend) {
2692                                 r = adev->ip_blocks[i].version->funcs->resume(adev);
2693                                 if (r) {
2694                                         DRM_ERROR("resume of IP block <%s> failed %d\n",
2695                                                           adev->ip_blocks[i].version->funcs->name, r);
2696                                         return r;
2697                                 }
2698                         } else {
2699                                 r = adev->ip_blocks[i].version->funcs->hw_init(adev);
2700                                 if (r) {
2701                                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2702                                                           adev->ip_blocks[i].version->funcs->name, r);
2703                                         return r;
2704                                 }
2705                         }
2706
2707                         adev->ip_blocks[i].status.hw = true;
2708                         break;
2709                 }
2710         }
2711
2712         if (!amdgpu_sriov_vf(adev) || adev->asic_type == CHIP_TONGA)
2713                 r = amdgpu_pm_load_smu_firmware(adev, &smu_version);
2714
2715         return r;
2716 }
2717
2718 static int amdgpu_device_init_schedulers(struct amdgpu_device *adev)
2719 {
2720         long timeout;
2721         int r, i;
2722
2723         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2724                 struct amdgpu_ring *ring = adev->rings[i];
2725
2726                 /* No need to setup the GPU scheduler for rings that don't need it */
2727                 if (!ring || ring->no_scheduler)
2728                         continue;
2729
2730                 switch (ring->funcs->type) {
2731                 case AMDGPU_RING_TYPE_GFX:
2732                         timeout = adev->gfx_timeout;
2733                         break;
2734                 case AMDGPU_RING_TYPE_COMPUTE:
2735                         timeout = adev->compute_timeout;
2736                         break;
2737                 case AMDGPU_RING_TYPE_SDMA:
2738                         timeout = adev->sdma_timeout;
2739                         break;
2740                 default:
2741                         timeout = adev->video_timeout;
2742                         break;
2743                 }
2744
2745                 r = drm_sched_init(&ring->sched, &amdgpu_sched_ops, NULL,
2746                                    DRM_SCHED_PRIORITY_COUNT,
2747                                    ring->num_hw_submission, 0,
2748                                    timeout, adev->reset_domain->wq,
2749                                    ring->sched_score, ring->name,
2750                                    adev->dev);
2751                 if (r) {
2752                         DRM_ERROR("Failed to create scheduler on ring %s.\n",
2753                                   ring->name);
2754                         return r;
2755                 }
2756                 r = amdgpu_uvd_entity_init(adev, ring);
2757                 if (r) {
2758                         DRM_ERROR("Failed to create UVD scheduling entity on ring %s.\n",
2759                                   ring->name);
2760                         return r;
2761                 }
2762                 r = amdgpu_vce_entity_init(adev, ring);
2763                 if (r) {
2764                         DRM_ERROR("Failed to create VCE scheduling entity on ring %s.\n",
2765                                   ring->name);
2766                         return r;
2767                 }
2768         }
2769
2770         amdgpu_xcp_update_partition_sched_list(adev);
2771
2772         return 0;
2773 }
2774
2775
2776 /**
2777  * amdgpu_device_ip_init - run init for hardware IPs
2778  *
2779  * @adev: amdgpu_device pointer
2780  *
2781  * Main initialization pass for hardware IPs.  The list of all the hardware
2782  * IPs that make up the asic is walked and the sw_init and hw_init callbacks
2783  * are run.  sw_init initializes the software state associated with each IP
2784  * and hw_init initializes the hardware associated with each IP.
2785  * Returns 0 on success, negative error code on failure.
2786  */
2787 static int amdgpu_device_ip_init(struct amdgpu_device *adev)
2788 {
2789         int i, r;
2790
2791         r = amdgpu_ras_init(adev);
2792         if (r)
2793                 return r;
2794
2795         for (i = 0; i < adev->num_ip_blocks; i++) {
2796                 if (!adev->ip_blocks[i].status.valid)
2797                         continue;
2798                 r = adev->ip_blocks[i].version->funcs->sw_init((void *)adev);
2799                 if (r) {
2800                         DRM_ERROR("sw_init of IP block <%s> failed %d\n",
2801                                   adev->ip_blocks[i].version->funcs->name, r);
2802                         goto init_failed;
2803                 }
2804                 adev->ip_blocks[i].status.sw = true;
2805
2806                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2807                         /* need to do common hw init early so everything is set up for gmc */
2808                         r = adev->ip_blocks[i].version->funcs->hw_init((void *)adev);
2809                         if (r) {
2810                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2811                                 goto init_failed;
2812                         }
2813                         adev->ip_blocks[i].status.hw = true;
2814                 } else if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2815                         /* need to do gmc hw init early so we can allocate gpu mem */
2816                         /* Try to reserve bad pages early */
2817                         if (amdgpu_sriov_vf(adev))
2818                                 amdgpu_virt_exchange_data(adev);
2819
2820                         r = amdgpu_device_mem_scratch_init(adev);
2821                         if (r) {
2822                                 DRM_ERROR("amdgpu_mem_scratch_init failed %d\n", r);
2823                                 goto init_failed;
2824                         }
2825                         r = adev->ip_blocks[i].version->funcs->hw_init((void *)adev);
2826                         if (r) {
2827                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2828                                 goto init_failed;
2829                         }
2830                         r = amdgpu_device_wb_init(adev);
2831                         if (r) {
2832                                 DRM_ERROR("amdgpu_device_wb_init failed %d\n", r);
2833                                 goto init_failed;
2834                         }
2835                         adev->ip_blocks[i].status.hw = true;
2836
2837                         /* right after GMC hw init, we create CSA */
2838                         if (adev->gfx.mcbp) {
2839                                 r = amdgpu_allocate_static_csa(adev, &adev->virt.csa_obj,
2840                                                                AMDGPU_GEM_DOMAIN_VRAM |
2841                                                                AMDGPU_GEM_DOMAIN_GTT,
2842                                                                AMDGPU_CSA_SIZE);
2843                                 if (r) {
2844                                         DRM_ERROR("allocate CSA failed %d\n", r);
2845                                         goto init_failed;
2846                                 }
2847                         }
2848
2849                         r = amdgpu_seq64_init(adev);
2850                         if (r) {
2851                                 DRM_ERROR("allocate seq64 failed %d\n", r);
2852                                 goto init_failed;
2853                         }
2854                 }
2855         }
2856
2857         if (amdgpu_sriov_vf(adev))
2858                 amdgpu_virt_init_data_exchange(adev);
2859
2860         r = amdgpu_ib_pool_init(adev);
2861         if (r) {
2862                 dev_err(adev->dev, "IB initialization failed (%d).\n", r);
2863                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_IB_INIT_FAIL, 0, r);
2864                 goto init_failed;
2865         }
2866
2867         r = amdgpu_ucode_create_bo(adev); /* create ucode bo when sw_init complete*/
2868         if (r)
2869                 goto init_failed;
2870
2871         r = amdgpu_device_ip_hw_init_phase1(adev);
2872         if (r)
2873                 goto init_failed;
2874
2875         r = amdgpu_device_fw_loading(adev);
2876         if (r)
2877                 goto init_failed;
2878
2879         r = amdgpu_device_ip_hw_init_phase2(adev);
2880         if (r)
2881                 goto init_failed;
2882
2883         /*
2884          * retired pages will be loaded from eeprom and reserved here,
2885          * it should be called after amdgpu_device_ip_hw_init_phase2  since
2886          * for some ASICs the RAS EEPROM code relies on SMU fully functioning
2887          * for I2C communication which only true at this point.
2888          *
2889          * amdgpu_ras_recovery_init may fail, but the upper only cares the
2890          * failure from bad gpu situation and stop amdgpu init process
2891          * accordingly. For other failed cases, it will still release all
2892          * the resource and print error message, rather than returning one
2893          * negative value to upper level.
2894          *
2895          * Note: theoretically, this should be called before all vram allocations
2896          * to protect retired page from abusing
2897          */
2898         r = amdgpu_ras_recovery_init(adev);
2899         if (r)
2900                 goto init_failed;
2901
2902         /**
2903          * In case of XGMI grab extra reference for reset domain for this device
2904          */
2905         if (adev->gmc.xgmi.num_physical_nodes > 1) {
2906                 if (amdgpu_xgmi_add_device(adev) == 0) {
2907                         if (!amdgpu_sriov_vf(adev)) {
2908                                 struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
2909
2910                                 if (WARN_ON(!hive)) {
2911                                         r = -ENOENT;
2912                                         goto init_failed;
2913                                 }
2914
2915                                 if (!hive->reset_domain ||
2916                                     !amdgpu_reset_get_reset_domain(hive->reset_domain)) {
2917                                         r = -ENOENT;
2918                                         amdgpu_put_xgmi_hive(hive);
2919                                         goto init_failed;
2920                                 }
2921
2922                                 /* Drop the early temporary reset domain we created for device */
2923                                 amdgpu_reset_put_reset_domain(adev->reset_domain);
2924                                 adev->reset_domain = hive->reset_domain;
2925                                 amdgpu_put_xgmi_hive(hive);
2926                         }
2927                 }
2928         }
2929
2930         r = amdgpu_device_init_schedulers(adev);
2931         if (r)
2932                 goto init_failed;
2933
2934         if (adev->mman.buffer_funcs_ring->sched.ready)
2935                 amdgpu_ttm_set_buffer_funcs_status(adev, true);
2936
2937         /* Don't init kfd if whole hive need to be reset during init */
2938         if (!adev->gmc.xgmi.pending_reset) {
2939                 kgd2kfd_init_zone_device(adev);
2940                 amdgpu_amdkfd_device_init(adev);
2941         }
2942
2943         amdgpu_fru_get_product_info(adev);
2944
2945 init_failed:
2946
2947         return r;
2948 }
2949
2950 /**
2951  * amdgpu_device_fill_reset_magic - writes reset magic to gart pointer
2952  *
2953  * @adev: amdgpu_device pointer
2954  *
2955  * Writes a reset magic value to the gart pointer in VRAM.  The driver calls
2956  * this function before a GPU reset.  If the value is retained after a
2957  * GPU reset, VRAM has not been lost.  Some GPU resets may destry VRAM contents.
2958  */
2959 static void amdgpu_device_fill_reset_magic(struct amdgpu_device *adev)
2960 {
2961         memcpy(adev->reset_magic, adev->gart.ptr, AMDGPU_RESET_MAGIC_NUM);
2962 }
2963
2964 /**
2965  * amdgpu_device_check_vram_lost - check if vram is valid
2966  *
2967  * @adev: amdgpu_device pointer
2968  *
2969  * Checks the reset magic value written to the gart pointer in VRAM.
2970  * The driver calls this after a GPU reset to see if the contents of
2971  * VRAM is lost or now.
2972  * returns true if vram is lost, false if not.
2973  */
2974 static bool amdgpu_device_check_vram_lost(struct amdgpu_device *adev)
2975 {
2976         if (memcmp(adev->gart.ptr, adev->reset_magic,
2977                         AMDGPU_RESET_MAGIC_NUM))
2978                 return true;
2979
2980         if (!amdgpu_in_reset(adev))
2981                 return false;
2982
2983         /*
2984          * For all ASICs with baco/mode1 reset, the VRAM is
2985          * always assumed to be lost.
2986          */
2987         switch (amdgpu_asic_reset_method(adev)) {
2988         case AMD_RESET_METHOD_BACO:
2989         case AMD_RESET_METHOD_MODE1:
2990                 return true;
2991         default:
2992                 return false;
2993         }
2994 }
2995
2996 /**
2997  * amdgpu_device_set_cg_state - set clockgating for amdgpu device
2998  *
2999  * @adev: amdgpu_device pointer
3000  * @state: clockgating state (gate or ungate)
3001  *
3002  * The list of all the hardware IPs that make up the asic is walked and the
3003  * set_clockgating_state callbacks are run.
3004  * Late initialization pass enabling clockgating for hardware IPs.
3005  * Fini or suspend, pass disabling clockgating for hardware IPs.
3006  * Returns 0 on success, negative error code on failure.
3007  */
3008
3009 int amdgpu_device_set_cg_state(struct amdgpu_device *adev,
3010                                enum amd_clockgating_state state)
3011 {
3012         int i, j, r;
3013
3014         if (amdgpu_emu_mode == 1)
3015                 return 0;
3016
3017         for (j = 0; j < adev->num_ip_blocks; j++) {
3018                 i = state == AMD_CG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
3019                 if (!adev->ip_blocks[i].status.late_initialized)
3020                         continue;
3021                 /* skip CG for GFX, SDMA on S0ix */
3022                 if (adev->in_s0ix &&
3023                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3024                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SDMA))
3025                         continue;
3026                 /* skip CG for VCE/UVD, it's handled specially */
3027                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
3028                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
3029                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
3030                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
3031                     adev->ip_blocks[i].version->funcs->set_clockgating_state) {
3032                         /* enable clockgating to save power */
3033                         r = adev->ip_blocks[i].version->funcs->set_clockgating_state((void *)adev,
3034                                                                                      state);
3035                         if (r) {
3036                                 DRM_ERROR("set_clockgating_state(gate) of IP block <%s> failed %d\n",
3037                                           adev->ip_blocks[i].version->funcs->name, r);
3038                                 return r;
3039                         }
3040                 }
3041         }
3042
3043         return 0;
3044 }
3045
3046 int amdgpu_device_set_pg_state(struct amdgpu_device *adev,
3047                                enum amd_powergating_state state)
3048 {
3049         int i, j, r;
3050
3051         if (amdgpu_emu_mode == 1)
3052                 return 0;
3053
3054         for (j = 0; j < adev->num_ip_blocks; j++) {
3055                 i = state == AMD_PG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
3056                 if (!adev->ip_blocks[i].status.late_initialized)
3057                         continue;
3058                 /* skip PG for GFX, SDMA on S0ix */
3059                 if (adev->in_s0ix &&
3060                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3061                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SDMA))
3062                         continue;
3063                 /* skip CG for VCE/UVD, it's handled specially */
3064                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
3065                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
3066                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
3067                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
3068                     adev->ip_blocks[i].version->funcs->set_powergating_state) {
3069                         /* enable powergating to save power */
3070                         r = adev->ip_blocks[i].version->funcs->set_powergating_state((void *)adev,
3071                                                                                         state);
3072                         if (r) {
3073                                 DRM_ERROR("set_powergating_state(gate) of IP block <%s> failed %d\n",
3074                                           adev->ip_blocks[i].version->funcs->name, r);
3075                                 return r;
3076                         }
3077                 }
3078         }
3079         return 0;
3080 }
3081
3082 static int amdgpu_device_enable_mgpu_fan_boost(void)
3083 {
3084         struct amdgpu_gpu_instance *gpu_ins;
3085         struct amdgpu_device *adev;
3086         int i, ret = 0;
3087
3088         mutex_lock(&mgpu_info.mutex);
3089
3090         /*
3091          * MGPU fan boost feature should be enabled
3092          * only when there are two or more dGPUs in
3093          * the system
3094          */
3095         if (mgpu_info.num_dgpu < 2)
3096                 goto out;
3097
3098         for (i = 0; i < mgpu_info.num_dgpu; i++) {
3099                 gpu_ins = &(mgpu_info.gpu_ins[i]);
3100                 adev = gpu_ins->adev;
3101                 if (!(adev->flags & AMD_IS_APU) &&
3102                     !gpu_ins->mgpu_fan_enabled) {
3103                         ret = amdgpu_dpm_enable_mgpu_fan_boost(adev);
3104                         if (ret)
3105                                 break;
3106
3107                         gpu_ins->mgpu_fan_enabled = 1;
3108                 }
3109         }
3110
3111 out:
3112         mutex_unlock(&mgpu_info.mutex);
3113
3114         return ret;
3115 }
3116
3117 /**
3118  * amdgpu_device_ip_late_init - run late init for hardware IPs
3119  *
3120  * @adev: amdgpu_device pointer
3121  *
3122  * Late initialization pass for hardware IPs.  The list of all the hardware
3123  * IPs that make up the asic is walked and the late_init callbacks are run.
3124  * late_init covers any special initialization that an IP requires
3125  * after all of the have been initialized or something that needs to happen
3126  * late in the init process.
3127  * Returns 0 on success, negative error code on failure.
3128  */
3129 static int amdgpu_device_ip_late_init(struct amdgpu_device *adev)
3130 {
3131         struct amdgpu_gpu_instance *gpu_instance;
3132         int i = 0, r;
3133
3134         for (i = 0; i < adev->num_ip_blocks; i++) {
3135                 if (!adev->ip_blocks[i].status.hw)
3136                         continue;
3137                 if (adev->ip_blocks[i].version->funcs->late_init) {
3138                         r = adev->ip_blocks[i].version->funcs->late_init((void *)adev);
3139                         if (r) {
3140                                 DRM_ERROR("late_init of IP block <%s> failed %d\n",
3141                                           adev->ip_blocks[i].version->funcs->name, r);
3142                                 return r;
3143                         }
3144                 }
3145                 adev->ip_blocks[i].status.late_initialized = true;
3146         }
3147
3148         r = amdgpu_ras_late_init(adev);
3149         if (r) {
3150                 DRM_ERROR("amdgpu_ras_late_init failed %d", r);
3151                 return r;
3152         }
3153
3154         if (!amdgpu_in_reset(adev))
3155                 amdgpu_ras_set_error_query_ready(adev, true);
3156
3157         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_GATE);
3158         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_GATE);
3159
3160         amdgpu_device_fill_reset_magic(adev);
3161
3162         r = amdgpu_device_enable_mgpu_fan_boost();
3163         if (r)
3164                 DRM_ERROR("enable mgpu fan boost failed (%d).\n", r);
3165
3166         /* For passthrough configuration on arcturus and aldebaran, enable special handling SBR */
3167         if (amdgpu_passthrough(adev) &&
3168             ((adev->asic_type == CHIP_ARCTURUS && adev->gmc.xgmi.num_physical_nodes > 1) ||
3169              adev->asic_type == CHIP_ALDEBARAN))
3170                 amdgpu_dpm_handle_passthrough_sbr(adev, true);
3171
3172         if (adev->gmc.xgmi.num_physical_nodes > 1) {
3173                 mutex_lock(&mgpu_info.mutex);
3174
3175                 /*
3176                  * Reset device p-state to low as this was booted with high.
3177                  *
3178                  * This should be performed only after all devices from the same
3179                  * hive get initialized.
3180                  *
3181                  * However, it's unknown how many device in the hive in advance.
3182                  * As this is counted one by one during devices initializations.
3183                  *
3184                  * So, we wait for all XGMI interlinked devices initialized.
3185                  * This may bring some delays as those devices may come from
3186                  * different hives. But that should be OK.
3187                  */
3188                 if (mgpu_info.num_dgpu == adev->gmc.xgmi.num_physical_nodes) {
3189                         for (i = 0; i < mgpu_info.num_gpu; i++) {
3190                                 gpu_instance = &(mgpu_info.gpu_ins[i]);
3191                                 if (gpu_instance->adev->flags & AMD_IS_APU)
3192                                         continue;
3193
3194                                 r = amdgpu_xgmi_set_pstate(gpu_instance->adev,
3195                                                 AMDGPU_XGMI_PSTATE_MIN);
3196                                 if (r) {
3197                                         DRM_ERROR("pstate setting failed (%d).\n", r);
3198                                         break;
3199                                 }
3200                         }
3201                 }
3202
3203                 mutex_unlock(&mgpu_info.mutex);
3204         }
3205
3206         return 0;
3207 }
3208
3209 /**
3210  * amdgpu_device_smu_fini_early - smu hw_fini wrapper
3211  *
3212  * @adev: amdgpu_device pointer
3213  *
3214  * For ASICs need to disable SMC first
3215  */
3216 static void amdgpu_device_smu_fini_early(struct amdgpu_device *adev)
3217 {
3218         int i, r;
3219
3220         if (amdgpu_ip_version(adev, GC_HWIP, 0) > IP_VERSION(9, 0, 0))
3221                 return;
3222
3223         for (i = 0; i < adev->num_ip_blocks; i++) {
3224                 if (!adev->ip_blocks[i].status.hw)
3225                         continue;
3226                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3227                         r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
3228                         /* XXX handle errors */
3229                         if (r) {
3230                                 DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
3231                                           adev->ip_blocks[i].version->funcs->name, r);
3232                         }
3233                         adev->ip_blocks[i].status.hw = false;
3234                         break;
3235                 }
3236         }
3237 }
3238
3239 static int amdgpu_device_ip_fini_early(struct amdgpu_device *adev)
3240 {
3241         int i, r;
3242
3243         for (i = 0; i < adev->num_ip_blocks; i++) {
3244                 if (!adev->ip_blocks[i].version->funcs->early_fini)
3245                         continue;
3246
3247                 r = adev->ip_blocks[i].version->funcs->early_fini((void *)adev);
3248                 if (r) {
3249                         DRM_DEBUG("early_fini of IP block <%s> failed %d\n",
3250                                   adev->ip_blocks[i].version->funcs->name, r);
3251                 }
3252         }
3253
3254         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
3255         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
3256
3257         amdgpu_amdkfd_suspend(adev, false);
3258
3259         /* Workaroud for ASICs need to disable SMC first */
3260         amdgpu_device_smu_fini_early(adev);
3261
3262         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3263                 if (!adev->ip_blocks[i].status.hw)
3264                         continue;
3265
3266                 r = adev->ip_blocks[i].version->funcs->hw_fini((void *)adev);
3267                 /* XXX handle errors */
3268                 if (r) {
3269                         DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
3270                                   adev->ip_blocks[i].version->funcs->name, r);
3271                 }
3272
3273                 adev->ip_blocks[i].status.hw = false;
3274         }
3275
3276         if (amdgpu_sriov_vf(adev)) {
3277                 if (amdgpu_virt_release_full_gpu(adev, false))
3278                         DRM_ERROR("failed to release exclusive mode on fini\n");
3279         }
3280
3281         return 0;
3282 }
3283
3284 /**
3285  * amdgpu_device_ip_fini - run fini for hardware IPs
3286  *
3287  * @adev: amdgpu_device pointer
3288  *
3289  * Main teardown pass for hardware IPs.  The list of all the hardware
3290  * IPs that make up the asic is walked and the hw_fini and sw_fini callbacks
3291  * are run.  hw_fini tears down the hardware associated with each IP
3292  * and sw_fini tears down any software state associated with each IP.
3293  * Returns 0 on success, negative error code on failure.
3294  */
3295 static int amdgpu_device_ip_fini(struct amdgpu_device *adev)
3296 {
3297         int i, r;
3298
3299         if (amdgpu_sriov_vf(adev) && adev->virt.ras_init_done)
3300                 amdgpu_virt_release_ras_err_handler_data(adev);
3301
3302         if (adev->gmc.xgmi.num_physical_nodes > 1)
3303                 amdgpu_xgmi_remove_device(adev);
3304
3305         amdgpu_amdkfd_device_fini_sw(adev);
3306
3307         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3308                 if (!adev->ip_blocks[i].status.sw)
3309                         continue;
3310
3311                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
3312                         amdgpu_ucode_free_bo(adev);
3313                         amdgpu_free_static_csa(&adev->virt.csa_obj);
3314                         amdgpu_device_wb_fini(adev);
3315                         amdgpu_device_mem_scratch_fini(adev);
3316                         amdgpu_ib_pool_fini(adev);
3317                         amdgpu_seq64_fini(adev);
3318                 }
3319
3320                 r = adev->ip_blocks[i].version->funcs->sw_fini((void *)adev);
3321                 /* XXX handle errors */
3322                 if (r) {
3323                         DRM_DEBUG("sw_fini of IP block <%s> failed %d\n",
3324                                   adev->ip_blocks[i].version->funcs->name, r);
3325                 }
3326                 adev->ip_blocks[i].status.sw = false;
3327                 adev->ip_blocks[i].status.valid = false;
3328         }
3329
3330         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3331                 if (!adev->ip_blocks[i].status.late_initialized)
3332                         continue;
3333                 if (adev->ip_blocks[i].version->funcs->late_fini)
3334                         adev->ip_blocks[i].version->funcs->late_fini((void *)adev);
3335                 adev->ip_blocks[i].status.late_initialized = false;
3336         }
3337
3338         amdgpu_ras_fini(adev);
3339
3340         return 0;
3341 }
3342
3343 /**
3344  * amdgpu_device_delayed_init_work_handler - work handler for IB tests
3345  *
3346  * @work: work_struct.
3347  */
3348 static void amdgpu_device_delayed_init_work_handler(struct work_struct *work)
3349 {
3350         struct amdgpu_device *adev =
3351                 container_of(work, struct amdgpu_device, delayed_init_work.work);
3352         int r;
3353
3354         r = amdgpu_ib_ring_tests(adev);
3355         if (r)
3356                 DRM_ERROR("ib ring test failed (%d).\n", r);
3357 }
3358
3359 static void amdgpu_device_delay_enable_gfx_off(struct work_struct *work)
3360 {
3361         struct amdgpu_device *adev =
3362                 container_of(work, struct amdgpu_device, gfx.gfx_off_delay_work.work);
3363
3364         WARN_ON_ONCE(adev->gfx.gfx_off_state);
3365         WARN_ON_ONCE(adev->gfx.gfx_off_req_count);
3366
3367         if (!amdgpu_dpm_set_powergating_by_smu(adev, AMD_IP_BLOCK_TYPE_GFX, true))
3368                 adev->gfx.gfx_off_state = true;
3369 }
3370
3371 /**
3372  * amdgpu_device_ip_suspend_phase1 - run suspend for hardware IPs (phase 1)
3373  *
3374  * @adev: amdgpu_device pointer
3375  *
3376  * Main suspend function for hardware IPs.  The list of all the hardware
3377  * IPs that make up the asic is walked, clockgating is disabled and the
3378  * suspend callbacks are run.  suspend puts the hardware and software state
3379  * in each IP into a state suitable for suspend.
3380  * Returns 0 on success, negative error code on failure.
3381  */
3382 static int amdgpu_device_ip_suspend_phase1(struct amdgpu_device *adev)
3383 {
3384         int i, r;
3385
3386         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
3387         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
3388
3389         /*
3390          * Per PMFW team's suggestion, driver needs to handle gfxoff
3391          * and df cstate features disablement for gpu reset(e.g. Mode1Reset)
3392          * scenario. Add the missing df cstate disablement here.
3393          */
3394         if (amdgpu_dpm_set_df_cstate(adev, DF_CSTATE_DISALLOW))
3395                 dev_warn(adev->dev, "Failed to disallow df cstate");
3396
3397         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3398                 if (!adev->ip_blocks[i].status.valid)
3399                         continue;
3400
3401                 /* displays are handled separately */
3402                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_DCE)
3403                         continue;
3404
3405                 /* XXX handle errors */
3406                 r = adev->ip_blocks[i].version->funcs->suspend(adev);
3407                 /* XXX handle errors */
3408                 if (r) {
3409                         DRM_ERROR("suspend of IP block <%s> failed %d\n",
3410                                   adev->ip_blocks[i].version->funcs->name, r);
3411                         return r;
3412                 }
3413
3414                 adev->ip_blocks[i].status.hw = false;
3415         }
3416
3417         return 0;
3418 }
3419
3420 /**
3421  * amdgpu_device_ip_suspend_phase2 - run suspend for hardware IPs (phase 2)
3422  *
3423  * @adev: amdgpu_device pointer
3424  *
3425  * Main suspend function for hardware IPs.  The list of all the hardware
3426  * IPs that make up the asic is walked, clockgating is disabled and the
3427  * suspend callbacks are run.  suspend puts the hardware and software state
3428  * in each IP into a state suitable for suspend.
3429  * Returns 0 on success, negative error code on failure.
3430  */
3431 static int amdgpu_device_ip_suspend_phase2(struct amdgpu_device *adev)
3432 {
3433         int i, r;
3434
3435         if (adev->in_s0ix)
3436                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D3Entry);
3437
3438         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3439                 if (!adev->ip_blocks[i].status.valid)
3440                         continue;
3441                 /* displays are handled in phase1 */
3442                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE)
3443                         continue;
3444                 /* PSP lost connection when err_event_athub occurs */
3445                 if (amdgpu_ras_intr_triggered() &&
3446                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
3447                         adev->ip_blocks[i].status.hw = false;
3448                         continue;
3449                 }
3450
3451                 /* skip unnecessary suspend if we do not initialize them yet */
3452                 if (adev->gmc.xgmi.pending_reset &&
3453                     !(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3454                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC ||
3455                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3456                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH)) {
3457                         adev->ip_blocks[i].status.hw = false;
3458                         continue;
3459                 }
3460
3461                 /* skip suspend of gfx/mes and psp for S0ix
3462                  * gfx is in gfxoff state, so on resume it will exit gfxoff just
3463                  * like at runtime. PSP is also part of the always on hardware
3464                  * so no need to suspend it.
3465                  */
3466                 if (adev->in_s0ix &&
3467                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP ||
3468                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3469                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_MES))
3470                         continue;
3471
3472                 /* SDMA 5.x+ is part of GFX power domain so it's covered by GFXOFF */
3473                 if (adev->in_s0ix &&
3474                     (amdgpu_ip_version(adev, SDMA0_HWIP, 0) >=
3475                      IP_VERSION(5, 0, 0)) &&
3476                     (adev->ip_blocks[i].version->type ==
3477                      AMD_IP_BLOCK_TYPE_SDMA))
3478                         continue;
3479
3480                 /* Once swPSP provides the IMU, RLC FW binaries to TOS during cold-boot.
3481                  * These are in TMR, hence are expected to be reused by PSP-TOS to reload
3482                  * from this location and RLC Autoload automatically also gets loaded
3483                  * from here based on PMFW -> PSP message during re-init sequence.
3484                  * Therefore, the psp suspend & resume should be skipped to avoid destroy
3485                  * the TMR and reload FWs again for IMU enabled APU ASICs.
3486                  */
3487                 if (amdgpu_in_reset(adev) &&
3488                     (adev->flags & AMD_IS_APU) && adev->gfx.imu.funcs &&
3489                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3490                         continue;
3491
3492                 /* XXX handle errors */
3493                 r = adev->ip_blocks[i].version->funcs->suspend(adev);
3494                 /* XXX handle errors */
3495                 if (r) {
3496                         DRM_ERROR("suspend of IP block <%s> failed %d\n",
3497                                   adev->ip_blocks[i].version->funcs->name, r);
3498                 }
3499                 adev->ip_blocks[i].status.hw = false;
3500                 /* handle putting the SMC in the appropriate state */
3501                 if (!amdgpu_sriov_vf(adev)) {
3502                         if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3503                                 r = amdgpu_dpm_set_mp1_state(adev, adev->mp1_state);
3504                                 if (r) {
3505                                         DRM_ERROR("SMC failed to set mp1 state %d, %d\n",
3506                                                         adev->mp1_state, r);
3507                                         return r;
3508                                 }
3509                         }
3510                 }
3511         }
3512
3513         return 0;
3514 }
3515
3516 /**
3517  * amdgpu_device_ip_suspend - run suspend for hardware IPs
3518  *
3519  * @adev: amdgpu_device pointer
3520  *
3521  * Main suspend function for hardware IPs.  The list of all the hardware
3522  * IPs that make up the asic is walked, clockgating is disabled and the
3523  * suspend callbacks are run.  suspend puts the hardware and software state
3524  * in each IP into a state suitable for suspend.
3525  * Returns 0 on success, negative error code on failure.
3526  */
3527 int amdgpu_device_ip_suspend(struct amdgpu_device *adev)
3528 {
3529         int r;
3530
3531         if (amdgpu_sriov_vf(adev)) {
3532                 amdgpu_virt_fini_data_exchange(adev);
3533                 amdgpu_virt_request_full_gpu(adev, false);
3534         }
3535
3536         amdgpu_ttm_set_buffer_funcs_status(adev, false);
3537
3538         r = amdgpu_device_ip_suspend_phase1(adev);
3539         if (r)
3540                 return r;
3541         r = amdgpu_device_ip_suspend_phase2(adev);
3542
3543         if (amdgpu_sriov_vf(adev))
3544                 amdgpu_virt_release_full_gpu(adev, false);
3545
3546         return r;
3547 }
3548
3549 static int amdgpu_device_ip_reinit_early_sriov(struct amdgpu_device *adev)
3550 {
3551         int i, r;
3552
3553         static enum amd_ip_block_type ip_order[] = {
3554                 AMD_IP_BLOCK_TYPE_COMMON,
3555                 AMD_IP_BLOCK_TYPE_GMC,
3556                 AMD_IP_BLOCK_TYPE_PSP,
3557                 AMD_IP_BLOCK_TYPE_IH,
3558         };
3559
3560         for (i = 0; i < adev->num_ip_blocks; i++) {
3561                 int j;
3562                 struct amdgpu_ip_block *block;
3563
3564                 block = &adev->ip_blocks[i];
3565                 block->status.hw = false;
3566
3567                 for (j = 0; j < ARRAY_SIZE(ip_order); j++) {
3568
3569                         if (block->version->type != ip_order[j] ||
3570                                 !block->status.valid)
3571                                 continue;
3572
3573                         r = block->version->funcs->hw_init(adev);
3574                         DRM_INFO("RE-INIT-early: %s %s\n", block->version->funcs->name, r?"failed":"succeeded");
3575                         if (r)
3576                                 return r;
3577                         block->status.hw = true;
3578                 }
3579         }
3580
3581         return 0;
3582 }
3583
3584 static int amdgpu_device_ip_reinit_late_sriov(struct amdgpu_device *adev)
3585 {
3586         int i, r;
3587
3588         static enum amd_ip_block_type ip_order[] = {
3589                 AMD_IP_BLOCK_TYPE_SMC,
3590                 AMD_IP_BLOCK_TYPE_DCE,
3591                 AMD_IP_BLOCK_TYPE_GFX,
3592                 AMD_IP_BLOCK_TYPE_SDMA,
3593                 AMD_IP_BLOCK_TYPE_MES,
3594                 AMD_IP_BLOCK_TYPE_UVD,
3595                 AMD_IP_BLOCK_TYPE_VCE,
3596                 AMD_IP_BLOCK_TYPE_VCN,
3597                 AMD_IP_BLOCK_TYPE_JPEG
3598         };
3599
3600         for (i = 0; i < ARRAY_SIZE(ip_order); i++) {
3601                 int j;
3602                 struct amdgpu_ip_block *block;
3603
3604                 for (j = 0; j < adev->num_ip_blocks; j++) {
3605                         block = &adev->ip_blocks[j];
3606
3607                         if (block->version->type != ip_order[i] ||
3608                                 !block->status.valid ||
3609                                 block->status.hw)
3610                                 continue;
3611
3612                         if (block->version->type == AMD_IP_BLOCK_TYPE_SMC)
3613                                 r = block->version->funcs->resume(adev);
3614                         else
3615                                 r = block->version->funcs->hw_init(adev);
3616
3617                         DRM_INFO("RE-INIT-late: %s %s\n", block->version->funcs->name, r?"failed":"succeeded");
3618                         if (r)
3619                                 return r;
3620                         block->status.hw = true;
3621                 }
3622         }
3623
3624         return 0;
3625 }
3626
3627 /**
3628  * amdgpu_device_ip_resume_phase1 - run resume for hardware IPs
3629  *
3630  * @adev: amdgpu_device pointer
3631  *
3632  * First resume function for hardware IPs.  The list of all the hardware
3633  * IPs that make up the asic is walked and the resume callbacks are run for
3634  * COMMON, GMC, and IH.  resume puts the hardware into a functional state
3635  * after a suspend and updates the software state as necessary.  This
3636  * function is also used for restoring the GPU after a GPU reset.
3637  * Returns 0 on success, negative error code on failure.
3638  */
3639 static int amdgpu_device_ip_resume_phase1(struct amdgpu_device *adev)
3640 {
3641         int i, r;
3642
3643         for (i = 0; i < adev->num_ip_blocks; i++) {
3644                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3645                         continue;
3646                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3647                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3648                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3649                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP && amdgpu_sriov_vf(adev))) {
3650
3651                         r = adev->ip_blocks[i].version->funcs->resume(adev);
3652                         if (r) {
3653                                 DRM_ERROR("resume of IP block <%s> failed %d\n",
3654                                           adev->ip_blocks[i].version->funcs->name, r);
3655                                 return r;
3656                         }
3657                         adev->ip_blocks[i].status.hw = true;
3658                 }
3659         }
3660
3661         return 0;
3662 }
3663
3664 /**
3665  * amdgpu_device_ip_resume_phase2 - run resume for hardware IPs
3666  *
3667  * @adev: amdgpu_device pointer
3668  *
3669  * First resume function for hardware IPs.  The list of all the hardware
3670  * IPs that make up the asic is walked and the resume callbacks are run for
3671  * all blocks except COMMON, GMC, and IH.  resume puts the hardware into a
3672  * functional state after a suspend and updates the software state as
3673  * necessary.  This function is also used for restoring the GPU after a GPU
3674  * reset.
3675  * Returns 0 on success, negative error code on failure.
3676  */
3677 static int amdgpu_device_ip_resume_phase2(struct amdgpu_device *adev)
3678 {
3679         int i, r;
3680
3681         for (i = 0; i < adev->num_ip_blocks; i++) {
3682                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3683                         continue;
3684                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3685                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3686                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3687                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3688                         continue;
3689                 r = adev->ip_blocks[i].version->funcs->resume(adev);
3690                 if (r) {
3691                         DRM_ERROR("resume of IP block <%s> failed %d\n",
3692                                   adev->ip_blocks[i].version->funcs->name, r);
3693                         return r;
3694                 }
3695                 adev->ip_blocks[i].status.hw = true;
3696         }
3697
3698         return 0;
3699 }
3700
3701 /**
3702  * amdgpu_device_ip_resume - run resume for hardware IPs
3703  *
3704  * @adev: amdgpu_device pointer
3705  *
3706  * Main resume function for hardware IPs.  The hardware IPs
3707  * are split into two resume functions because they are
3708  * also used in recovering from a GPU reset and some additional
3709  * steps need to be take between them.  In this case (S3/S4) they are
3710  * run sequentially.
3711  * Returns 0 on success, negative error code on failure.
3712  */
3713 static int amdgpu_device_ip_resume(struct amdgpu_device *adev)
3714 {
3715         int r;
3716
3717         r = amdgpu_device_ip_resume_phase1(adev);
3718         if (r)
3719                 return r;
3720
3721         r = amdgpu_device_fw_loading(adev);
3722         if (r)
3723                 return r;
3724
3725         r = amdgpu_device_ip_resume_phase2(adev);
3726
3727         if (adev->mman.buffer_funcs_ring->sched.ready)
3728                 amdgpu_ttm_set_buffer_funcs_status(adev, true);
3729
3730         return r;
3731 }
3732
3733 /**
3734  * amdgpu_device_detect_sriov_bios - determine if the board supports SR-IOV
3735  *
3736  * @adev: amdgpu_device pointer
3737  *
3738  * Query the VBIOS data tables to determine if the board supports SR-IOV.
3739  */
3740 static void amdgpu_device_detect_sriov_bios(struct amdgpu_device *adev)
3741 {
3742         if (amdgpu_sriov_vf(adev)) {
3743                 if (adev->is_atom_fw) {
3744                         if (amdgpu_atomfirmware_gpu_virtualization_supported(adev))
3745                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3746                 } else {
3747                         if (amdgpu_atombios_has_gpu_virtualization_table(adev))
3748                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3749                 }
3750
3751                 if (!(adev->virt.caps & AMDGPU_SRIOV_CAPS_SRIOV_VBIOS))
3752                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_NO_VBIOS, 0, 0);
3753         }
3754 }
3755
3756 /**
3757  * amdgpu_device_asic_has_dc_support - determine if DC supports the asic
3758  *
3759  * @asic_type: AMD asic type
3760  *
3761  * Check if there is DC (new modesetting infrastructre) support for an asic.
3762  * returns true if DC has support, false if not.
3763  */
3764 bool amdgpu_device_asic_has_dc_support(enum amd_asic_type asic_type)
3765 {
3766         switch (asic_type) {
3767 #ifdef CONFIG_DRM_AMDGPU_SI
3768         case CHIP_HAINAN:
3769 #endif
3770         case CHIP_TOPAZ:
3771                 /* chips with no display hardware */
3772                 return false;
3773 #if defined(CONFIG_DRM_AMD_DC)
3774         case CHIP_TAHITI:
3775         case CHIP_PITCAIRN:
3776         case CHIP_VERDE:
3777         case CHIP_OLAND:
3778                 /*
3779                  * We have systems in the wild with these ASICs that require
3780                  * LVDS and VGA support which is not supported with DC.
3781                  *
3782                  * Fallback to the non-DC driver here by default so as not to
3783                  * cause regressions.
3784                  */
3785 #if defined(CONFIG_DRM_AMD_DC_SI)
3786                 return amdgpu_dc > 0;
3787 #else
3788                 return false;
3789 #endif
3790         case CHIP_BONAIRE:
3791         case CHIP_KAVERI:
3792         case CHIP_KABINI:
3793         case CHIP_MULLINS:
3794                 /*
3795                  * We have systems in the wild with these ASICs that require
3796                  * VGA support which is not supported with DC.
3797                  *
3798                  * Fallback to the non-DC driver here by default so as not to
3799                  * cause regressions.
3800                  */
3801                 return amdgpu_dc > 0;
3802         default:
3803                 return amdgpu_dc != 0;
3804 #else
3805         default:
3806                 if (amdgpu_dc > 0)
3807                         DRM_INFO_ONCE("Display Core has been requested via kernel parameter but isn't supported by ASIC, ignoring\n");
3808                 return false;
3809 #endif
3810         }
3811 }
3812
3813 /**
3814  * amdgpu_device_has_dc_support - check if dc is supported
3815  *
3816  * @adev: amdgpu_device pointer
3817  *
3818  * Returns true for supported, false for not supported
3819  */
3820 bool amdgpu_device_has_dc_support(struct amdgpu_device *adev)
3821 {
3822         if (adev->enable_virtual_display ||
3823             (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
3824                 return false;
3825
3826         return amdgpu_device_asic_has_dc_support(adev->asic_type);
3827 }
3828
3829 static void amdgpu_device_xgmi_reset_func(struct work_struct *__work)
3830 {
3831         struct amdgpu_device *adev =
3832                 container_of(__work, struct amdgpu_device, xgmi_reset_work);
3833         struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3834
3835         /* It's a bug to not have a hive within this function */
3836         if (WARN_ON(!hive))
3837                 return;
3838
3839         /*
3840          * Use task barrier to synchronize all xgmi reset works across the
3841          * hive. task_barrier_enter and task_barrier_exit will block
3842          * until all the threads running the xgmi reset works reach
3843          * those points. task_barrier_full will do both blocks.
3844          */
3845         if (amdgpu_asic_reset_method(adev) == AMD_RESET_METHOD_BACO) {
3846
3847                 task_barrier_enter(&hive->tb);
3848                 adev->asic_reset_res = amdgpu_device_baco_enter(adev_to_drm(adev));
3849
3850                 if (adev->asic_reset_res)
3851                         goto fail;
3852
3853                 task_barrier_exit(&hive->tb);
3854                 adev->asic_reset_res = amdgpu_device_baco_exit(adev_to_drm(adev));
3855
3856                 if (adev->asic_reset_res)
3857                         goto fail;
3858
3859                 amdgpu_ras_reset_error_count(adev, AMDGPU_RAS_BLOCK__MMHUB);
3860         } else {
3861
3862                 task_barrier_full(&hive->tb);
3863                 adev->asic_reset_res =  amdgpu_asic_reset(adev);
3864         }
3865
3866 fail:
3867         if (adev->asic_reset_res)
3868                 DRM_WARN("ASIC reset failed with error, %d for drm dev, %s",
3869                          adev->asic_reset_res, adev_to_drm(adev)->unique);
3870         amdgpu_put_xgmi_hive(hive);
3871 }
3872
3873 static int amdgpu_device_get_job_timeout_settings(struct amdgpu_device *adev)
3874 {
3875         char *input = amdgpu_lockup_timeout;
3876         char *timeout_setting = NULL;
3877         int index = 0;
3878         long timeout;
3879         int ret = 0;
3880
3881         /*
3882          * By default timeout for non compute jobs is 10000
3883          * and 60000 for compute jobs.
3884          * In SR-IOV or passthrough mode, timeout for compute
3885          * jobs are 60000 by default.
3886          */
3887         adev->gfx_timeout = msecs_to_jiffies(10000);
3888         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3889         if (amdgpu_sriov_vf(adev))
3890                 adev->compute_timeout = amdgpu_sriov_is_pp_one_vf(adev) ?
3891                                         msecs_to_jiffies(60000) : msecs_to_jiffies(10000);
3892         else
3893                 adev->compute_timeout =  msecs_to_jiffies(60000);
3894
3895         if (strnlen(input, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3896                 while ((timeout_setting = strsep(&input, ",")) &&
3897                                 strnlen(timeout_setting, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
3898                         ret = kstrtol(timeout_setting, 0, &timeout);
3899                         if (ret)
3900                                 return ret;
3901
3902                         if (timeout == 0) {
3903                                 index++;
3904                                 continue;
3905                         } else if (timeout < 0) {
3906                                 timeout = MAX_SCHEDULE_TIMEOUT;
3907                                 dev_warn(adev->dev, "lockup timeout disabled");
3908                                 add_taint(TAINT_SOFTLOCKUP, LOCKDEP_STILL_OK);
3909                         } else {
3910                                 timeout = msecs_to_jiffies(timeout);
3911                         }
3912
3913                         switch (index++) {
3914                         case 0:
3915                                 adev->gfx_timeout = timeout;
3916                                 break;
3917                         case 1:
3918                                 adev->compute_timeout = timeout;
3919                                 break;
3920                         case 2:
3921                                 adev->sdma_timeout = timeout;
3922                                 break;
3923                         case 3:
3924                                 adev->video_timeout = timeout;
3925                                 break;
3926                         default:
3927                                 break;
3928                         }
3929                 }
3930                 /*
3931                  * There is only one value specified and
3932                  * it should apply to all non-compute jobs.
3933                  */
3934                 if (index == 1) {
3935                         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
3936                         if (amdgpu_sriov_vf(adev) || amdgpu_passthrough(adev))
3937                                 adev->compute_timeout = adev->gfx_timeout;
3938                 }
3939         }
3940
3941         return ret;
3942 }
3943
3944 /**
3945  * amdgpu_device_check_iommu_direct_map - check if RAM direct mapped to GPU
3946  *
3947  * @adev: amdgpu_device pointer
3948  *
3949  * RAM direct mapped to GPU if IOMMU is not enabled or is pass through mode
3950  */
3951 static void amdgpu_device_check_iommu_direct_map(struct amdgpu_device *adev)
3952 {
3953         struct iommu_domain *domain;
3954
3955         domain = iommu_get_domain_for_dev(adev->dev);
3956         if (!domain || domain->type == IOMMU_DOMAIN_IDENTITY)
3957                 adev->ram_is_direct_mapped = true;
3958 }
3959
3960 #if defined(CONFIG_HSA_AMD_P2P)
3961 /**
3962  * amdgpu_device_check_iommu_remap - Check if DMA remapping is enabled.
3963  *
3964  * @adev: amdgpu_device pointer
3965  *
3966  * return if IOMMU remapping bar address
3967  */
3968 static bool amdgpu_device_check_iommu_remap(struct amdgpu_device *adev)
3969 {
3970         struct iommu_domain *domain;
3971
3972         domain = iommu_get_domain_for_dev(adev->dev);
3973         if (domain && (domain->type == IOMMU_DOMAIN_DMA ||
3974                 domain->type == IOMMU_DOMAIN_DMA_FQ))
3975                 return true;
3976
3977         return false;
3978 }
3979 #endif
3980
3981 static const struct attribute *amdgpu_dev_attributes[] = {
3982         &dev_attr_pcie_replay_count.attr,
3983         NULL
3984 };
3985
3986 static void amdgpu_device_set_mcbp(struct amdgpu_device *adev)
3987 {
3988         if (amdgpu_mcbp == 1)
3989                 adev->gfx.mcbp = true;
3990         else if (amdgpu_mcbp == 0)
3991                 adev->gfx.mcbp = false;
3992
3993         if (amdgpu_sriov_vf(adev))
3994                 adev->gfx.mcbp = true;
3995
3996         if (adev->gfx.mcbp)
3997                 DRM_INFO("MCBP is enabled\n");
3998 }
3999
4000 /**
4001  * amdgpu_device_init - initialize the driver
4002  *
4003  * @adev: amdgpu_device pointer
4004  * @flags: driver flags
4005  *
4006  * Initializes the driver info and hw (all asics).
4007  * Returns 0 for success or an error on failure.
4008  * Called at driver startup.
4009  */
4010 int amdgpu_device_init(struct amdgpu_device *adev,
4011                        uint32_t flags)
4012 {
4013         struct drm_device *ddev = adev_to_drm(adev);
4014         struct pci_dev *pdev = adev->pdev;
4015         int r, i;
4016         bool px = false;
4017         u32 max_MBps;
4018         int tmp;
4019
4020         adev->shutdown = false;
4021         adev->flags = flags;
4022
4023         if (amdgpu_force_asic_type >= 0 && amdgpu_force_asic_type < CHIP_LAST)
4024                 adev->asic_type = amdgpu_force_asic_type;
4025         else
4026                 adev->asic_type = flags & AMD_ASIC_MASK;
4027
4028         adev->usec_timeout = AMDGPU_MAX_USEC_TIMEOUT;
4029         if (amdgpu_emu_mode == 1)
4030                 adev->usec_timeout *= 10;
4031         adev->gmc.gart_size = 512 * 1024 * 1024;
4032         adev->accel_working = false;
4033         adev->num_rings = 0;
4034         RCU_INIT_POINTER(adev->gang_submit, dma_fence_get_stub());
4035         adev->mman.buffer_funcs = NULL;
4036         adev->mman.buffer_funcs_ring = NULL;
4037         adev->vm_manager.vm_pte_funcs = NULL;
4038         adev->vm_manager.vm_pte_num_scheds = 0;
4039         adev->gmc.gmc_funcs = NULL;
4040         adev->harvest_ip_mask = 0x0;
4041         adev->fence_context = dma_fence_context_alloc(AMDGPU_MAX_RINGS);
4042         bitmap_zero(adev->gfx.pipe_reserve_bitmap, AMDGPU_MAX_COMPUTE_QUEUES);
4043
4044         adev->smc_rreg = &amdgpu_invalid_rreg;
4045         adev->smc_wreg = &amdgpu_invalid_wreg;
4046         adev->pcie_rreg = &amdgpu_invalid_rreg;
4047         adev->pcie_wreg = &amdgpu_invalid_wreg;
4048         adev->pcie_rreg_ext = &amdgpu_invalid_rreg_ext;
4049         adev->pcie_wreg_ext = &amdgpu_invalid_wreg_ext;
4050         adev->pciep_rreg = &amdgpu_invalid_rreg;
4051         adev->pciep_wreg = &amdgpu_invalid_wreg;
4052         adev->pcie_rreg64 = &amdgpu_invalid_rreg64;
4053         adev->pcie_wreg64 = &amdgpu_invalid_wreg64;
4054         adev->pcie_rreg64_ext = &amdgpu_invalid_rreg64_ext;
4055         adev->pcie_wreg64_ext = &amdgpu_invalid_wreg64_ext;
4056         adev->uvd_ctx_rreg = &amdgpu_invalid_rreg;
4057         adev->uvd_ctx_wreg = &amdgpu_invalid_wreg;
4058         adev->didt_rreg = &amdgpu_invalid_rreg;
4059         adev->didt_wreg = &amdgpu_invalid_wreg;
4060         adev->gc_cac_rreg = &amdgpu_invalid_rreg;
4061         adev->gc_cac_wreg = &amdgpu_invalid_wreg;
4062         adev->audio_endpt_rreg = &amdgpu_block_invalid_rreg;
4063         adev->audio_endpt_wreg = &amdgpu_block_invalid_wreg;
4064
4065         DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
4066                  amdgpu_asic_name[adev->asic_type], pdev->vendor, pdev->device,
4067                  pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
4068
4069         /* mutex initialization are all done here so we
4070          * can recall function without having locking issues
4071          */
4072         mutex_init(&adev->firmware.mutex);
4073         mutex_init(&adev->pm.mutex);
4074         mutex_init(&adev->gfx.gpu_clock_mutex);
4075         mutex_init(&adev->srbm_mutex);
4076         mutex_init(&adev->gfx.pipe_reserve_mutex);
4077         mutex_init(&adev->gfx.gfx_off_mutex);
4078         mutex_init(&adev->gfx.partition_mutex);
4079         mutex_init(&adev->grbm_idx_mutex);
4080         mutex_init(&adev->mn_lock);
4081         mutex_init(&adev->virt.vf_errors.lock);
4082         mutex_init(&adev->virt.rlcg_reg_lock);
4083         hash_init(adev->mn_hash);
4084         mutex_init(&adev->psp.mutex);
4085         mutex_init(&adev->notifier_lock);
4086         mutex_init(&adev->pm.stable_pstate_ctx_lock);
4087         mutex_init(&adev->benchmark_mutex);
4088         mutex_init(&adev->gfx.reset_sem_mutex);
4089         /* Initialize the mutex for cleaner shader isolation between GFX and compute processes */
4090         mutex_init(&adev->enforce_isolation_mutex);
4091         mutex_init(&adev->gfx.kfd_sch_mutex);
4092
4093         amdgpu_device_init_apu_flags(adev);
4094
4095         r = amdgpu_device_check_arguments(adev);
4096         if (r)
4097                 return r;
4098
4099         spin_lock_init(&adev->mmio_idx_lock);
4100         spin_lock_init(&adev->smc_idx_lock);
4101         spin_lock_init(&adev->pcie_idx_lock);
4102         spin_lock_init(&adev->uvd_ctx_idx_lock);
4103         spin_lock_init(&adev->didt_idx_lock);
4104         spin_lock_init(&adev->gc_cac_idx_lock);
4105         spin_lock_init(&adev->se_cac_idx_lock);
4106         spin_lock_init(&adev->audio_endpt_idx_lock);
4107         spin_lock_init(&adev->mm_stats.lock);
4108         spin_lock_init(&adev->wb.lock);
4109
4110         INIT_LIST_HEAD(&adev->shadow_list);
4111         mutex_init(&adev->shadow_list_lock);
4112
4113         INIT_LIST_HEAD(&adev->reset_list);
4114
4115         INIT_LIST_HEAD(&adev->ras_list);
4116
4117         INIT_LIST_HEAD(&adev->pm.od_kobj_list);
4118
4119         INIT_DELAYED_WORK(&adev->delayed_init_work,
4120                           amdgpu_device_delayed_init_work_handler);
4121         INIT_DELAYED_WORK(&adev->gfx.gfx_off_delay_work,
4122                           amdgpu_device_delay_enable_gfx_off);
4123         /*
4124          * Initialize the enforce_isolation work structures for each XCP
4125          * partition.  This work handler is responsible for enforcing shader
4126          * isolation on AMD GPUs.  It counts the number of emitted fences for
4127          * each GFX and compute ring.  If there are any fences, it schedules
4128          * the `enforce_isolation_work` to be run after a delay.  If there are
4129          * no fences, it signals the Kernel Fusion Driver (KFD) to resume the
4130          * runqueue.
4131          */
4132         for (i = 0; i < MAX_XCP; i++) {
4133                 INIT_DELAYED_WORK(&adev->gfx.enforce_isolation[i].work,
4134                                   amdgpu_gfx_enforce_isolation_handler);
4135                 adev->gfx.enforce_isolation[i].adev = adev;
4136                 adev->gfx.enforce_isolation[i].xcp_id = i;
4137         }
4138
4139         INIT_WORK(&adev->xgmi_reset_work, amdgpu_device_xgmi_reset_func);
4140
4141         adev->gfx.gfx_off_req_count = 1;
4142         adev->gfx.gfx_off_residency = 0;
4143         adev->gfx.gfx_off_entrycount = 0;
4144         adev->pm.ac_power = power_supply_is_system_supplied() > 0;
4145
4146         atomic_set(&adev->throttling_logging_enabled, 1);
4147         /*
4148          * If throttling continues, logging will be performed every minute
4149          * to avoid log flooding. "-1" is subtracted since the thermal
4150          * throttling interrupt comes every second. Thus, the total logging
4151          * interval is 59 seconds(retelimited printk interval) + 1(waiting
4152          * for throttling interrupt) = 60 seconds.
4153          */
4154         ratelimit_state_init(&adev->throttling_logging_rs, (60 - 1) * HZ, 1);
4155         ratelimit_set_flags(&adev->throttling_logging_rs, RATELIMIT_MSG_ON_RELEASE);
4156
4157         /* Registers mapping */
4158         /* TODO: block userspace mapping of io register */
4159         if (adev->asic_type >= CHIP_BONAIRE) {
4160                 adev->rmmio_base = pci_resource_start(adev->pdev, 5);
4161                 adev->rmmio_size = pci_resource_len(adev->pdev, 5);
4162         } else {
4163                 adev->rmmio_base = pci_resource_start(adev->pdev, 2);
4164                 adev->rmmio_size = pci_resource_len(adev->pdev, 2);
4165         }
4166
4167         for (i = 0; i < AMD_IP_BLOCK_TYPE_NUM; i++)
4168                 atomic_set(&adev->pm.pwr_state[i], POWER_STATE_UNKNOWN);
4169
4170         adev->rmmio = ioremap(adev->rmmio_base, adev->rmmio_size);
4171         if (!adev->rmmio)
4172                 return -ENOMEM;
4173
4174         DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)adev->rmmio_base);
4175         DRM_INFO("register mmio size: %u\n", (unsigned int)adev->rmmio_size);
4176
4177         /*
4178          * Reset domain needs to be present early, before XGMI hive discovered
4179          * (if any) and intitialized to use reset sem and in_gpu reset flag
4180          * early on during init and before calling to RREG32.
4181          */
4182         adev->reset_domain = amdgpu_reset_create_reset_domain(SINGLE_DEVICE, "amdgpu-reset-dev");
4183         if (!adev->reset_domain)
4184                 return -ENOMEM;
4185
4186         /* detect hw virtualization here */
4187         amdgpu_detect_virtualization(adev);
4188
4189         amdgpu_device_get_pcie_info(adev);
4190
4191         r = amdgpu_device_get_job_timeout_settings(adev);
4192         if (r) {
4193                 dev_err(adev->dev, "invalid lockup_timeout parameter syntax\n");
4194                 return r;
4195         }
4196
4197         amdgpu_device_set_mcbp(adev);
4198
4199         /* early init functions */
4200         r = amdgpu_device_ip_early_init(adev);
4201         if (r)
4202                 return r;
4203
4204         /* Get rid of things like offb */
4205         r = drm_aperture_remove_conflicting_pci_framebuffers(adev->pdev, &amdgpu_kms_driver);
4206         if (r)
4207                 return r;
4208
4209         /* Enable TMZ based on IP_VERSION */
4210         amdgpu_gmc_tmz_set(adev);
4211
4212         if (amdgpu_sriov_vf(adev) &&
4213             amdgpu_ip_version(adev, GC_HWIP, 0) >= IP_VERSION(10, 3, 0))
4214                 /* VF MMIO access (except mailbox range) from CPU
4215                  * will be blocked during sriov runtime
4216                  */
4217                 adev->virt.caps |= AMDGPU_VF_MMIO_ACCESS_PROTECT;
4218
4219         amdgpu_gmc_noretry_set(adev);
4220         /* Need to get xgmi info early to decide the reset behavior*/
4221         if (adev->gmc.xgmi.supported) {
4222                 r = adev->gfxhub.funcs->get_xgmi_info(adev);
4223                 if (r)
4224                         return r;
4225         }
4226
4227         /* enable PCIE atomic ops */
4228         if (amdgpu_sriov_vf(adev)) {
4229                 if (adev->virt.fw_reserve.p_pf2vf)
4230                         adev->have_atomics_support = ((struct amd_sriov_msg_pf2vf_info *)
4231                                                       adev->virt.fw_reserve.p_pf2vf)->pcie_atomic_ops_support_flags ==
4232                                 (PCI_EXP_DEVCAP2_ATOMIC_COMP32 | PCI_EXP_DEVCAP2_ATOMIC_COMP64);
4233         /* APUs w/ gfx9 onwards doesn't reply on PCIe atomics, rather it is a
4234          * internal path natively support atomics, set have_atomics_support to true.
4235          */
4236         } else if ((adev->flags & AMD_IS_APU) &&
4237                    (amdgpu_ip_version(adev, GC_HWIP, 0) >
4238                     IP_VERSION(9, 0, 0))) {
4239                 adev->have_atomics_support = true;
4240         } else {
4241                 adev->have_atomics_support =
4242                         !pci_enable_atomic_ops_to_root(adev->pdev,
4243                                           PCI_EXP_DEVCAP2_ATOMIC_COMP32 |
4244                                           PCI_EXP_DEVCAP2_ATOMIC_COMP64);
4245         }
4246
4247         if (!adev->have_atomics_support)
4248                 dev_info(adev->dev, "PCIE atomic ops is not supported\n");
4249
4250         /* doorbell bar mapping and doorbell index init*/
4251         amdgpu_doorbell_init(adev);
4252
4253         if (amdgpu_emu_mode == 1) {
4254                 /* post the asic on emulation mode */
4255                 emu_soc_asic_init(adev);
4256                 goto fence_driver_init;
4257         }
4258
4259         amdgpu_reset_init(adev);
4260
4261         /* detect if we are with an SRIOV vbios */
4262         if (adev->bios)
4263                 amdgpu_device_detect_sriov_bios(adev);
4264
4265         /* check if we need to reset the asic
4266          *  E.g., driver was not cleanly unloaded previously, etc.
4267          */
4268         if (!amdgpu_sriov_vf(adev) && amdgpu_asic_need_reset_on_init(adev)) {
4269                 if (adev->gmc.xgmi.num_physical_nodes) {
4270                         dev_info(adev->dev, "Pending hive reset.\n");
4271                         adev->gmc.xgmi.pending_reset = true;
4272                         /* Only need to init necessary block for SMU to handle the reset */
4273                         for (i = 0; i < adev->num_ip_blocks; i++) {
4274                                 if (!adev->ip_blocks[i].status.valid)
4275                                         continue;
4276                                 if (!(adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
4277                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
4278                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
4279                                       adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC)) {
4280                                         DRM_DEBUG("IP %s disabled for hw_init.\n",
4281                                                 adev->ip_blocks[i].version->funcs->name);
4282                                         adev->ip_blocks[i].status.hw = true;
4283                                 }
4284                         }
4285                 } else if (amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(13, 0, 10) &&
4286                                    !amdgpu_device_has_display_hardware(adev)) {
4287                                         r = psp_gpu_reset(adev);
4288                 } else {
4289                                 tmp = amdgpu_reset_method;
4290                                 /* It should do a default reset when loading or reloading the driver,
4291                                  * regardless of the module parameter reset_method.
4292                                  */
4293                                 amdgpu_reset_method = AMD_RESET_METHOD_NONE;
4294                                 r = amdgpu_asic_reset(adev);
4295                                 amdgpu_reset_method = tmp;
4296                 }
4297
4298                 if (r) {
4299                   dev_err(adev->dev, "asic reset on init failed\n");
4300                   goto failed;
4301                 }
4302         }
4303
4304         /* Post card if necessary */
4305         if (amdgpu_device_need_post(adev)) {
4306                 if (!adev->bios) {
4307                         dev_err(adev->dev, "no vBIOS found\n");
4308                         r = -EINVAL;
4309                         goto failed;
4310                 }
4311                 DRM_INFO("GPU posting now...\n");
4312                 r = amdgpu_device_asic_init(adev);
4313                 if (r) {
4314                         dev_err(adev->dev, "gpu post error!\n");
4315                         goto failed;
4316                 }
4317         }
4318
4319         if (adev->bios) {
4320                 if (adev->is_atom_fw) {
4321                         /* Initialize clocks */
4322                         r = amdgpu_atomfirmware_get_clock_info(adev);
4323                         if (r) {
4324                                 dev_err(adev->dev, "amdgpu_atomfirmware_get_clock_info failed\n");
4325                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
4326                                 goto failed;
4327                         }
4328                 } else {
4329                         /* Initialize clocks */
4330                         r = amdgpu_atombios_get_clock_info(adev);
4331                         if (r) {
4332                                 dev_err(adev->dev, "amdgpu_atombios_get_clock_info failed\n");
4333                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
4334                                 goto failed;
4335                         }
4336                         /* init i2c buses */
4337                         if (!amdgpu_device_has_dc_support(adev))
4338                                 amdgpu_atombios_i2c_init(adev);
4339                 }
4340         }
4341
4342 fence_driver_init:
4343         /* Fence driver */
4344         r = amdgpu_fence_driver_sw_init(adev);
4345         if (r) {
4346                 dev_err(adev->dev, "amdgpu_fence_driver_sw_init failed\n");
4347                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_FENCE_INIT_FAIL, 0, 0);
4348                 goto failed;
4349         }
4350
4351         /* init the mode config */
4352         drm_mode_config_init(adev_to_drm(adev));
4353
4354         r = amdgpu_device_ip_init(adev);
4355         if (r) {
4356                 dev_err(adev->dev, "amdgpu_device_ip_init failed\n");
4357                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_INIT_FAIL, 0, 0);
4358                 goto release_ras_con;
4359         }
4360
4361         amdgpu_fence_driver_hw_init(adev);
4362
4363         dev_info(adev->dev,
4364                 "SE %d, SH per SE %d, CU per SH %d, active_cu_number %d\n",
4365                         adev->gfx.config.max_shader_engines,
4366                         adev->gfx.config.max_sh_per_se,
4367                         adev->gfx.config.max_cu_per_sh,
4368                         adev->gfx.cu_info.number);
4369
4370         adev->accel_working = true;
4371
4372         amdgpu_vm_check_compute_bug(adev);
4373
4374         /* Initialize the buffer migration limit. */
4375         if (amdgpu_moverate >= 0)
4376                 max_MBps = amdgpu_moverate;
4377         else
4378                 max_MBps = 8; /* Allow 8 MB/s. */
4379         /* Get a log2 for easy divisions. */
4380         adev->mm_stats.log2_max_MBps = ilog2(max(1u, max_MBps));
4381
4382         /*
4383          * Register gpu instance before amdgpu_device_enable_mgpu_fan_boost.
4384          * Otherwise the mgpu fan boost feature will be skipped due to the
4385          * gpu instance is counted less.
4386          */
4387         amdgpu_register_gpu_instance(adev);
4388
4389         /* enable clockgating, etc. after ib tests, etc. since some blocks require
4390          * explicit gating rather than handling it automatically.
4391          */
4392         if (!adev->gmc.xgmi.pending_reset) {
4393                 r = amdgpu_device_ip_late_init(adev);
4394                 if (r) {
4395                         dev_err(adev->dev, "amdgpu_device_ip_late_init failed\n");
4396                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_LATE_INIT_FAIL, 0, r);
4397                         goto release_ras_con;
4398                 }
4399                 /* must succeed. */
4400                 amdgpu_ras_resume(adev);
4401                 queue_delayed_work(system_wq, &adev->delayed_init_work,
4402                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
4403         }
4404
4405         if (amdgpu_sriov_vf(adev)) {
4406                 amdgpu_virt_release_full_gpu(adev, true);
4407                 flush_delayed_work(&adev->delayed_init_work);
4408         }
4409
4410         /*
4411          * Place those sysfs registering after `late_init`. As some of those
4412          * operations performed in `late_init` might affect the sysfs
4413          * interfaces creating.
4414          */
4415         r = amdgpu_atombios_sysfs_init(adev);
4416         if (r)
4417                 drm_err(&adev->ddev,
4418                         "registering atombios sysfs failed (%d).\n", r);
4419
4420         r = amdgpu_pm_sysfs_init(adev);
4421         if (r)
4422                 DRM_ERROR("registering pm sysfs failed (%d).\n", r);
4423
4424         r = amdgpu_ucode_sysfs_init(adev);
4425         if (r) {
4426                 adev->ucode_sysfs_en = false;
4427                 DRM_ERROR("Creating firmware sysfs failed (%d).\n", r);
4428         } else
4429                 adev->ucode_sysfs_en = true;
4430
4431         r = sysfs_create_files(&adev->dev->kobj, amdgpu_dev_attributes);
4432         if (r)
4433                 dev_err(adev->dev, "Could not create amdgpu device attr\n");
4434
4435         r = devm_device_add_group(adev->dev, &amdgpu_board_attrs_group);
4436         if (r)
4437                 dev_err(adev->dev,
4438                         "Could not create amdgpu board attributes\n");
4439
4440         amdgpu_fru_sysfs_init(adev);
4441         amdgpu_reg_state_sysfs_init(adev);
4442
4443         if (IS_ENABLED(CONFIG_PERF_EVENTS))
4444                 r = amdgpu_pmu_init(adev);
4445         if (r)
4446                 dev_err(adev->dev, "amdgpu_pmu_init failed\n");
4447
4448         /* Have stored pci confspace at hand for restore in sudden PCI error */
4449         if (amdgpu_device_cache_pci_state(adev->pdev))
4450                 pci_restore_state(pdev);
4451
4452         /* if we have > 1 VGA cards, then disable the amdgpu VGA resources */
4453         /* this will fail for cards that aren't VGA class devices, just
4454          * ignore it
4455          */
4456         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4457                 vga_client_register(adev->pdev, amdgpu_device_vga_set_decode);
4458
4459         px = amdgpu_device_supports_px(ddev);
4460
4461         if (px || (!dev_is_removable(&adev->pdev->dev) &&
4462                                 apple_gmux_detect(NULL, NULL)))
4463                 vga_switcheroo_register_client(adev->pdev,
4464                                                &amdgpu_switcheroo_ops, px);
4465
4466         if (px)
4467                 vga_switcheroo_init_domain_pm_ops(adev->dev, &adev->vga_pm_domain);
4468
4469         if (adev->gmc.xgmi.pending_reset)
4470                 queue_delayed_work(system_wq, &mgpu_info.delayed_reset_work,
4471                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
4472
4473         amdgpu_device_check_iommu_direct_map(adev);
4474
4475         return 0;
4476
4477 release_ras_con:
4478         if (amdgpu_sriov_vf(adev))
4479                 amdgpu_virt_release_full_gpu(adev, true);
4480
4481         /* failed in exclusive mode due to timeout */
4482         if (amdgpu_sriov_vf(adev) &&
4483                 !amdgpu_sriov_runtime(adev) &&
4484                 amdgpu_virt_mmio_blocked(adev) &&
4485                 !amdgpu_virt_wait_reset(adev)) {
4486                 dev_err(adev->dev, "VF exclusive mode timeout\n");
4487                 /* Don't send request since VF is inactive. */
4488                 adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
4489                 adev->virt.ops = NULL;
4490                 r = -EAGAIN;
4491         }
4492         amdgpu_release_ras_context(adev);
4493
4494 failed:
4495         amdgpu_vf_error_trans_all(adev);
4496
4497         return r;
4498 }
4499
4500 static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
4501 {
4502
4503         /* Clear all CPU mappings pointing to this device */
4504         unmap_mapping_range(adev->ddev.anon_inode->i_mapping, 0, 0, 1);
4505
4506         /* Unmap all mapped bars - Doorbell, registers and VRAM */
4507         amdgpu_doorbell_fini(adev);
4508
4509         iounmap(adev->rmmio);
4510         adev->rmmio = NULL;
4511         if (adev->mman.aper_base_kaddr)
4512                 iounmap(adev->mman.aper_base_kaddr);
4513         adev->mman.aper_base_kaddr = NULL;
4514
4515         /* Memory manager related */
4516         if (!adev->gmc.xgmi.connected_to_cpu && !adev->gmc.is_app_apu) {
4517                 arch_phys_wc_del(adev->gmc.vram_mtrr);
4518                 arch_io_free_memtype_wc(adev->gmc.aper_base, adev->gmc.aper_size);
4519         }
4520 }
4521
4522 /**
4523  * amdgpu_device_fini_hw - tear down the driver
4524  *
4525  * @adev: amdgpu_device pointer
4526  *
4527  * Tear down the driver info (all asics).
4528  * Called at driver shutdown.
4529  */
4530 void amdgpu_device_fini_hw(struct amdgpu_device *adev)
4531 {
4532         dev_info(adev->dev, "amdgpu: finishing device.\n");
4533         flush_delayed_work(&adev->delayed_init_work);
4534
4535         if (adev->mman.initialized)
4536                 drain_workqueue(adev->mman.bdev.wq);
4537         adev->shutdown = true;
4538
4539         /* make sure IB test finished before entering exclusive mode
4540          * to avoid preemption on IB test
4541          */
4542         if (amdgpu_sriov_vf(adev)) {
4543                 amdgpu_virt_request_full_gpu(adev, false);
4544                 amdgpu_virt_fini_data_exchange(adev);
4545         }
4546
4547         /* disable all interrupts */
4548         amdgpu_irq_disable_all(adev);
4549         if (adev->mode_info.mode_config_initialized) {
4550                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(adev)))
4551                         drm_helper_force_disable_all(adev_to_drm(adev));
4552                 else
4553                         drm_atomic_helper_shutdown(adev_to_drm(adev));
4554         }
4555         amdgpu_fence_driver_hw_fini(adev);
4556
4557         if (adev->pm.sysfs_initialized)
4558                 amdgpu_pm_sysfs_fini(adev);
4559         if (adev->ucode_sysfs_en)
4560                 amdgpu_ucode_sysfs_fini(adev);
4561         sysfs_remove_files(&adev->dev->kobj, amdgpu_dev_attributes);
4562         amdgpu_fru_sysfs_fini(adev);
4563
4564         amdgpu_reg_state_sysfs_fini(adev);
4565
4566         /* disable ras feature must before hw fini */
4567         amdgpu_ras_pre_fini(adev);
4568
4569         amdgpu_ttm_set_buffer_funcs_status(adev, false);
4570
4571         amdgpu_device_ip_fini_early(adev);
4572
4573         amdgpu_irq_fini_hw(adev);
4574
4575         if (adev->mman.initialized)
4576                 ttm_device_clear_dma_mappings(&adev->mman.bdev);
4577
4578         amdgpu_gart_dummy_page_fini(adev);
4579
4580         if (drm_dev_is_unplugged(adev_to_drm(adev)))
4581                 amdgpu_device_unmap_mmio(adev);
4582
4583 }
4584
4585 void amdgpu_device_fini_sw(struct amdgpu_device *adev)
4586 {
4587         int idx;
4588         bool px;
4589
4590         amdgpu_fence_driver_sw_fini(adev);
4591         amdgpu_device_ip_fini(adev);
4592         amdgpu_ucode_release(&adev->firmware.gpu_info_fw);
4593         adev->accel_working = false;
4594         dma_fence_put(rcu_dereference_protected(adev->gang_submit, true));
4595
4596         amdgpu_reset_fini(adev);
4597
4598         /* free i2c buses */
4599         if (!amdgpu_device_has_dc_support(adev))
4600                 amdgpu_i2c_fini(adev);
4601
4602         if (amdgpu_emu_mode != 1)
4603                 amdgpu_atombios_fini(adev);
4604
4605         kfree(adev->bios);
4606         adev->bios = NULL;
4607
4608         kfree(adev->fru_info);
4609         adev->fru_info = NULL;
4610
4611         px = amdgpu_device_supports_px(adev_to_drm(adev));
4612
4613         if (px || (!dev_is_removable(&adev->pdev->dev) &&
4614                                 apple_gmux_detect(NULL, NULL)))
4615                 vga_switcheroo_unregister_client(adev->pdev);
4616
4617         if (px)
4618                 vga_switcheroo_fini_domain_pm_ops(adev->dev);
4619
4620         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4621                 vga_client_unregister(adev->pdev);
4622
4623         if (drm_dev_enter(adev_to_drm(adev), &idx)) {
4624
4625                 iounmap(adev->rmmio);
4626                 adev->rmmio = NULL;
4627                 amdgpu_doorbell_fini(adev);
4628                 drm_dev_exit(idx);
4629         }
4630
4631         if (IS_ENABLED(CONFIG_PERF_EVENTS))
4632                 amdgpu_pmu_fini(adev);
4633         if (adev->mman.discovery_bin)
4634                 amdgpu_discovery_fini(adev);
4635
4636         amdgpu_reset_put_reset_domain(adev->reset_domain);
4637         adev->reset_domain = NULL;
4638
4639         kfree(adev->pci_state);
4640
4641 }
4642
4643 /**
4644  * amdgpu_device_evict_resources - evict device resources
4645  * @adev: amdgpu device object
4646  *
4647  * Evicts all ttm device resources(vram BOs, gart table) from the lru list
4648  * of the vram memory type. Mainly used for evicting device resources
4649  * at suspend time.
4650  *
4651  */
4652 static int amdgpu_device_evict_resources(struct amdgpu_device *adev)
4653 {
4654         int ret;
4655
4656         /* No need to evict vram on APUs for suspend to ram or s2idle */
4657         if ((adev->in_s3 || adev->in_s0ix) && (adev->flags & AMD_IS_APU))
4658                 return 0;
4659
4660         ret = amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM);
4661         if (ret)
4662                 DRM_WARN("evicting device resources failed\n");
4663         return ret;
4664 }
4665
4666 /*
4667  * Suspend & resume.
4668  */
4669 /**
4670  * amdgpu_device_prepare - prepare for device suspend
4671  *
4672  * @dev: drm dev pointer
4673  *
4674  * Prepare to put the hw in the suspend state (all asics).
4675  * Returns 0 for success or an error on failure.
4676  * Called at driver suspend.
4677  */
4678 int amdgpu_device_prepare(struct drm_device *dev)
4679 {
4680         struct amdgpu_device *adev = drm_to_adev(dev);
4681         int i, r;
4682
4683         amdgpu_choose_low_power_state(adev);
4684
4685         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4686                 return 0;
4687
4688         /* Evict the majority of BOs before starting suspend sequence */
4689         r = amdgpu_device_evict_resources(adev);
4690         if (r)
4691                 goto unprepare;
4692
4693         flush_delayed_work(&adev->gfx.gfx_off_delay_work);
4694
4695         for (i = 0; i < adev->num_ip_blocks; i++) {
4696                 if (!adev->ip_blocks[i].status.valid)
4697                         continue;
4698                 if (!adev->ip_blocks[i].version->funcs->prepare_suspend)
4699                         continue;
4700                 r = adev->ip_blocks[i].version->funcs->prepare_suspend((void *)adev);
4701                 if (r)
4702                         goto unprepare;
4703         }
4704
4705         return 0;
4706
4707 unprepare:
4708         adev->in_s0ix = adev->in_s3 = false;
4709
4710         return r;
4711 }
4712
4713 /**
4714  * amdgpu_device_suspend - initiate device suspend
4715  *
4716  * @dev: drm dev pointer
4717  * @fbcon : notify the fbdev of suspend
4718  *
4719  * Puts the hw in the suspend state (all asics).
4720  * Returns 0 for success or an error on failure.
4721  * Called at driver suspend.
4722  */
4723 int amdgpu_device_suspend(struct drm_device *dev, bool fbcon)
4724 {
4725         struct amdgpu_device *adev = drm_to_adev(dev);
4726         int r = 0;
4727
4728         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4729                 return 0;
4730
4731         adev->in_suspend = true;
4732
4733         if (amdgpu_sriov_vf(adev)) {
4734                 amdgpu_virt_fini_data_exchange(adev);
4735                 r = amdgpu_virt_request_full_gpu(adev, false);
4736                 if (r)
4737                         return r;
4738         }
4739
4740         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D3))
4741                 DRM_WARN("smart shift update failed\n");
4742
4743         if (fbcon)
4744                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, true);
4745
4746         cancel_delayed_work_sync(&adev->delayed_init_work);
4747
4748         amdgpu_ras_suspend(adev);
4749
4750         amdgpu_device_ip_suspend_phase1(adev);
4751
4752         if (!adev->in_s0ix)
4753                 amdgpu_amdkfd_suspend(adev, adev->in_runpm);
4754
4755         r = amdgpu_device_evict_resources(adev);
4756         if (r)
4757                 return r;
4758
4759         amdgpu_ttm_set_buffer_funcs_status(adev, false);
4760
4761         amdgpu_fence_driver_hw_fini(adev);
4762
4763         amdgpu_device_ip_suspend_phase2(adev);
4764
4765         if (amdgpu_sriov_vf(adev))
4766                 amdgpu_virt_release_full_gpu(adev, false);
4767
4768         r = amdgpu_dpm_notify_rlc_state(adev, false);
4769         if (r)
4770                 return r;
4771
4772         return 0;
4773 }
4774
4775 /**
4776  * amdgpu_device_resume - initiate device resume
4777  *
4778  * @dev: drm dev pointer
4779  * @fbcon : notify the fbdev of resume
4780  *
4781  * Bring the hw back to operating state (all asics).
4782  * Returns 0 for success or an error on failure.
4783  * Called at driver resume.
4784  */
4785 int amdgpu_device_resume(struct drm_device *dev, bool fbcon)
4786 {
4787         struct amdgpu_device *adev = drm_to_adev(dev);
4788         int r = 0;
4789
4790         if (amdgpu_sriov_vf(adev)) {
4791                 r = amdgpu_virt_request_full_gpu(adev, true);
4792                 if (r)
4793                         return r;
4794         }
4795
4796         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4797                 return 0;
4798
4799         if (adev->in_s0ix)
4800                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D0Entry);
4801
4802         /* post card */
4803         if (amdgpu_device_need_post(adev)) {
4804                 r = amdgpu_device_asic_init(adev);
4805                 if (r)
4806                         dev_err(adev->dev, "amdgpu asic init failed\n");
4807         }
4808
4809         r = amdgpu_device_ip_resume(adev);
4810
4811         if (r) {
4812                 dev_err(adev->dev, "amdgpu_device_ip_resume failed (%d).\n", r);
4813                 goto exit;
4814         }
4815         amdgpu_fence_driver_hw_init(adev);
4816
4817         if (!adev->in_s0ix) {
4818                 r = amdgpu_amdkfd_resume(adev, adev->in_runpm);
4819                 if (r)
4820                         goto exit;
4821         }
4822
4823         r = amdgpu_device_ip_late_init(adev);
4824         if (r)
4825                 goto exit;
4826
4827         queue_delayed_work(system_wq, &adev->delayed_init_work,
4828                            msecs_to_jiffies(AMDGPU_RESUME_MS));
4829 exit:
4830         if (amdgpu_sriov_vf(adev)) {
4831                 amdgpu_virt_init_data_exchange(adev);
4832                 amdgpu_virt_release_full_gpu(adev, true);
4833         }
4834
4835         if (r)
4836                 return r;
4837
4838         /* Make sure IB tests flushed */
4839         flush_delayed_work(&adev->delayed_init_work);
4840
4841         if (fbcon)
4842                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(adev)->fb_helper, false);
4843
4844         amdgpu_ras_resume(adev);
4845
4846         if (adev->mode_info.num_crtc) {
4847                 /*
4848                  * Most of the connector probing functions try to acquire runtime pm
4849                  * refs to ensure that the GPU is powered on when connector polling is
4850                  * performed. Since we're calling this from a runtime PM callback,
4851                  * trying to acquire rpm refs will cause us to deadlock.
4852                  *
4853                  * Since we're guaranteed to be holding the rpm lock, it's safe to
4854                  * temporarily disable the rpm helpers so this doesn't deadlock us.
4855                  */
4856 #ifdef CONFIG_PM
4857                 dev->dev->power.disable_depth++;
4858 #endif
4859                 if (!adev->dc_enabled)
4860                         drm_helper_hpd_irq_event(dev);
4861                 else
4862                         drm_kms_helper_hotplug_event(dev);
4863 #ifdef CONFIG_PM
4864                 dev->dev->power.disable_depth--;
4865 #endif
4866         }
4867         adev->in_suspend = false;
4868
4869         if (adev->enable_mes)
4870                 amdgpu_mes_self_test(adev);
4871
4872         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D0))
4873                 DRM_WARN("smart shift update failed\n");
4874
4875         return 0;
4876 }
4877
4878 /**
4879  * amdgpu_device_ip_check_soft_reset - did soft reset succeed
4880  *
4881  * @adev: amdgpu_device pointer
4882  *
4883  * The list of all the hardware IPs that make up the asic is walked and
4884  * the check_soft_reset callbacks are run.  check_soft_reset determines
4885  * if the asic is still hung or not.
4886  * Returns true if any of the IPs are still in a hung state, false if not.
4887  */
4888 static bool amdgpu_device_ip_check_soft_reset(struct amdgpu_device *adev)
4889 {
4890         int i;
4891         bool asic_hang = false;
4892
4893         if (amdgpu_sriov_vf(adev))
4894                 return true;
4895
4896         if (amdgpu_asic_need_full_reset(adev))
4897                 return true;
4898
4899         for (i = 0; i < adev->num_ip_blocks; i++) {
4900                 if (!adev->ip_blocks[i].status.valid)
4901                         continue;
4902                 if (adev->ip_blocks[i].version->funcs->check_soft_reset)
4903                         adev->ip_blocks[i].status.hang =
4904                                 adev->ip_blocks[i].version->funcs->check_soft_reset(adev);
4905                 if (adev->ip_blocks[i].status.hang) {
4906                         dev_info(adev->dev, "IP block:%s is hung!\n", adev->ip_blocks[i].version->funcs->name);
4907                         asic_hang = true;
4908                 }
4909         }
4910         return asic_hang;
4911 }
4912
4913 /**
4914  * amdgpu_device_ip_pre_soft_reset - prepare for soft reset
4915  *
4916  * @adev: amdgpu_device pointer
4917  *
4918  * The list of all the hardware IPs that make up the asic is walked and the
4919  * pre_soft_reset callbacks are run if the block is hung.  pre_soft_reset
4920  * handles any IP specific hardware or software state changes that are
4921  * necessary for a soft reset to succeed.
4922  * Returns 0 on success, negative error code on failure.
4923  */
4924 static int amdgpu_device_ip_pre_soft_reset(struct amdgpu_device *adev)
4925 {
4926         int i, r = 0;
4927
4928         for (i = 0; i < adev->num_ip_blocks; i++) {
4929                 if (!adev->ip_blocks[i].status.valid)
4930                         continue;
4931                 if (adev->ip_blocks[i].status.hang &&
4932                     adev->ip_blocks[i].version->funcs->pre_soft_reset) {
4933                         r = adev->ip_blocks[i].version->funcs->pre_soft_reset(adev);
4934                         if (r)
4935                                 return r;
4936                 }
4937         }
4938
4939         return 0;
4940 }
4941
4942 /**
4943  * amdgpu_device_ip_need_full_reset - check if a full asic reset is needed
4944  *
4945  * @adev: amdgpu_device pointer
4946  *
4947  * Some hardware IPs cannot be soft reset.  If they are hung, a full gpu
4948  * reset is necessary to recover.
4949  * Returns true if a full asic reset is required, false if not.
4950  */
4951 static bool amdgpu_device_ip_need_full_reset(struct amdgpu_device *adev)
4952 {
4953         int i;
4954
4955         if (amdgpu_asic_need_full_reset(adev))
4956                 return true;
4957
4958         for (i = 0; i < adev->num_ip_blocks; i++) {
4959                 if (!adev->ip_blocks[i].status.valid)
4960                         continue;
4961                 if ((adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) ||
4962                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) ||
4963                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_ACP) ||
4964                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) ||
4965                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
4966                         if (adev->ip_blocks[i].status.hang) {
4967                                 dev_info(adev->dev, "Some block need full reset!\n");
4968                                 return true;
4969                         }
4970                 }
4971         }
4972         return false;
4973 }
4974
4975 /**
4976  * amdgpu_device_ip_soft_reset - do a soft reset
4977  *
4978  * @adev: amdgpu_device pointer
4979  *
4980  * The list of all the hardware IPs that make up the asic is walked and the
4981  * soft_reset callbacks are run if the block is hung.  soft_reset handles any
4982  * IP specific hardware or software state changes that are necessary to soft
4983  * reset the IP.
4984  * Returns 0 on success, negative error code on failure.
4985  */
4986 static int amdgpu_device_ip_soft_reset(struct amdgpu_device *adev)
4987 {
4988         int i, r = 0;
4989
4990         for (i = 0; i < adev->num_ip_blocks; i++) {
4991                 if (!adev->ip_blocks[i].status.valid)
4992                         continue;
4993                 if (adev->ip_blocks[i].status.hang &&
4994                     adev->ip_blocks[i].version->funcs->soft_reset) {
4995                         r = adev->ip_blocks[i].version->funcs->soft_reset(adev);
4996                         if (r)
4997                                 return r;
4998                 }
4999         }
5000
5001         return 0;
5002 }
5003
5004 /**
5005  * amdgpu_device_ip_post_soft_reset - clean up from soft reset
5006  *
5007  * @adev: amdgpu_device pointer
5008  *
5009  * The list of all the hardware IPs that make up the asic is walked and the
5010  * post_soft_reset callbacks are run if the asic was hung.  post_soft_reset
5011  * handles any IP specific hardware or software state changes that are
5012  * necessary after the IP has been soft reset.
5013  * Returns 0 on success, negative error code on failure.
5014  */
5015 static int amdgpu_device_ip_post_soft_reset(struct amdgpu_device *adev)
5016 {
5017         int i, r = 0;
5018
5019         for (i = 0; i < adev->num_ip_blocks; i++) {
5020                 if (!adev->ip_blocks[i].status.valid)
5021                         continue;
5022                 if (adev->ip_blocks[i].status.hang &&
5023                     adev->ip_blocks[i].version->funcs->post_soft_reset)
5024                         r = adev->ip_blocks[i].version->funcs->post_soft_reset(adev);
5025                 if (r)
5026                         return r;
5027         }
5028
5029         return 0;
5030 }
5031
5032 /**
5033  * amdgpu_device_recover_vram - Recover some VRAM contents
5034  *
5035  * @adev: amdgpu_device pointer
5036  *
5037  * Restores the contents of VRAM buffers from the shadows in GTT.  Used to
5038  * restore things like GPUVM page tables after a GPU reset where
5039  * the contents of VRAM might be lost.
5040  *
5041  * Returns:
5042  * 0 on success, negative error code on failure.
5043  */
5044 static int amdgpu_device_recover_vram(struct amdgpu_device *adev)
5045 {
5046         struct dma_fence *fence = NULL, *next = NULL;
5047         struct amdgpu_bo *shadow;
5048         struct amdgpu_bo_vm *vmbo;
5049         long r = 1, tmo;
5050
5051         if (amdgpu_sriov_runtime(adev))
5052                 tmo = msecs_to_jiffies(8000);
5053         else
5054                 tmo = msecs_to_jiffies(100);
5055
5056         dev_info(adev->dev, "recover vram bo from shadow start\n");
5057         mutex_lock(&adev->shadow_list_lock);
5058         list_for_each_entry(vmbo, &adev->shadow_list, shadow_list) {
5059                 /* If vm is compute context or adev is APU, shadow will be NULL */
5060                 if (!vmbo->shadow)
5061                         continue;
5062                 shadow = vmbo->shadow;
5063
5064                 /* No need to recover an evicted BO */
5065                 if (!shadow->tbo.resource ||
5066                     shadow->tbo.resource->mem_type != TTM_PL_TT ||
5067                     shadow->tbo.resource->start == AMDGPU_BO_INVALID_OFFSET ||
5068                     shadow->parent->tbo.resource->mem_type != TTM_PL_VRAM)
5069                         continue;
5070
5071                 r = amdgpu_bo_restore_shadow(shadow, &next);
5072                 if (r)
5073                         break;
5074
5075                 if (fence) {
5076                         tmo = dma_fence_wait_timeout(fence, false, tmo);
5077                         dma_fence_put(fence);
5078                         fence = next;
5079                         if (tmo == 0) {
5080                                 r = -ETIMEDOUT;
5081                                 break;
5082                         } else if (tmo < 0) {
5083                                 r = tmo;
5084                                 break;
5085                         }
5086                 } else {
5087                         fence = next;
5088                 }
5089         }
5090         mutex_unlock(&adev->shadow_list_lock);
5091
5092         if (fence)
5093                 tmo = dma_fence_wait_timeout(fence, false, tmo);
5094         dma_fence_put(fence);
5095
5096         if (r < 0 || tmo <= 0) {
5097                 dev_err(adev->dev, "recover vram bo from shadow failed, r is %ld, tmo is %ld\n", r, tmo);
5098                 return -EIO;
5099         }
5100
5101         dev_info(adev->dev, "recover vram bo from shadow done\n");
5102         return 0;
5103 }
5104
5105
5106 /**
5107  * amdgpu_device_reset_sriov - reset ASIC for SR-IOV vf
5108  *
5109  * @adev: amdgpu_device pointer
5110  * @reset_context: amdgpu reset context pointer
5111  *
5112  * do VF FLR and reinitialize Asic
5113  * return 0 means succeeded otherwise failed
5114  */
5115 static int amdgpu_device_reset_sriov(struct amdgpu_device *adev,
5116                                      struct amdgpu_reset_context *reset_context)
5117 {
5118         int r;
5119         struct amdgpu_hive_info *hive = NULL;
5120
5121         if (test_bit(AMDGPU_HOST_FLR, &reset_context->flags)) {
5122                 if (!amdgpu_ras_get_fed_status(adev))
5123                         amdgpu_virt_ready_to_reset(adev);
5124                 amdgpu_virt_wait_reset(adev);
5125                 clear_bit(AMDGPU_HOST_FLR, &reset_context->flags);
5126                 r = amdgpu_virt_request_full_gpu(adev, true);
5127         } else {
5128                 r = amdgpu_virt_reset_gpu(adev);
5129         }
5130         if (r)
5131                 return r;
5132
5133         amdgpu_ras_set_fed(adev, false);
5134         amdgpu_irq_gpu_reset_resume_helper(adev);
5135
5136         /* some sw clean up VF needs to do before recover */
5137         amdgpu_virt_post_reset(adev);
5138
5139         /* Resume IP prior to SMC */
5140         r = amdgpu_device_ip_reinit_early_sriov(adev);
5141         if (r)
5142                 return r;
5143
5144         amdgpu_virt_init_data_exchange(adev);
5145
5146         r = amdgpu_device_fw_loading(adev);
5147         if (r)
5148                 return r;
5149
5150         /* now we are okay to resume SMC/CP/SDMA */
5151         r = amdgpu_device_ip_reinit_late_sriov(adev);
5152         if (r)
5153                 return r;
5154
5155         hive = amdgpu_get_xgmi_hive(adev);
5156         /* Update PSP FW topology after reset */
5157         if (hive && adev->gmc.xgmi.num_physical_nodes > 1)
5158                 r = amdgpu_xgmi_update_topology(hive, adev);
5159         if (hive)
5160                 amdgpu_put_xgmi_hive(hive);
5161         if (r)
5162                 return r;
5163
5164         r = amdgpu_ib_ring_tests(adev);
5165         if (r)
5166                 return r;
5167
5168         if (adev->virt.gim_feature & AMDGIM_FEATURE_GIM_FLR_VRAMLOST) {
5169                 amdgpu_inc_vram_lost(adev);
5170                 r = amdgpu_device_recover_vram(adev);
5171         }
5172         if (r)
5173                 return r;
5174
5175         /* need to be called during full access so we can't do it later like
5176          * bare-metal does.
5177          */
5178         amdgpu_amdkfd_post_reset(adev);
5179         amdgpu_virt_release_full_gpu(adev, true);
5180
5181         /* Aldebaran and gfx_11_0_3 support ras in SRIOV, so need resume ras during reset */
5182         if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 2) ||
5183             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
5184             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4) ||
5185             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(11, 0, 3))
5186                 amdgpu_ras_resume(adev);
5187         return 0;
5188 }
5189
5190 /**
5191  * amdgpu_device_has_job_running - check if there is any job in mirror list
5192  *
5193  * @adev: amdgpu_device pointer
5194  *
5195  * check if there is any job in mirror list
5196  */
5197 bool amdgpu_device_has_job_running(struct amdgpu_device *adev)
5198 {
5199         int i;
5200         struct drm_sched_job *job;
5201
5202         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5203                 struct amdgpu_ring *ring = adev->rings[i];
5204
5205                 if (!amdgpu_ring_sched_ready(ring))
5206                         continue;
5207
5208                 spin_lock(&ring->sched.job_list_lock);
5209                 job = list_first_entry_or_null(&ring->sched.pending_list,
5210                                                struct drm_sched_job, list);
5211                 spin_unlock(&ring->sched.job_list_lock);
5212                 if (job)
5213                         return true;
5214         }
5215         return false;
5216 }
5217
5218 /**
5219  * amdgpu_device_should_recover_gpu - check if we should try GPU recovery
5220  *
5221  * @adev: amdgpu_device pointer
5222  *
5223  * Check amdgpu_gpu_recovery and SRIOV status to see if we should try to recover
5224  * a hung GPU.
5225  */
5226 bool amdgpu_device_should_recover_gpu(struct amdgpu_device *adev)
5227 {
5228
5229         if (amdgpu_gpu_recovery == 0)
5230                 goto disabled;
5231
5232         /* Skip soft reset check in fatal error mode */
5233         if (!amdgpu_ras_is_poison_mode_supported(adev))
5234                 return true;
5235
5236         if (amdgpu_sriov_vf(adev))
5237                 return true;
5238
5239         if (amdgpu_gpu_recovery == -1) {
5240                 switch (adev->asic_type) {
5241 #ifdef CONFIG_DRM_AMDGPU_SI
5242                 case CHIP_VERDE:
5243                 case CHIP_TAHITI:
5244                 case CHIP_PITCAIRN:
5245                 case CHIP_OLAND:
5246                 case CHIP_HAINAN:
5247 #endif
5248 #ifdef CONFIG_DRM_AMDGPU_CIK
5249                 case CHIP_KAVERI:
5250                 case CHIP_KABINI:
5251                 case CHIP_MULLINS:
5252 #endif
5253                 case CHIP_CARRIZO:
5254                 case CHIP_STONEY:
5255                 case CHIP_CYAN_SKILLFISH:
5256                         goto disabled;
5257                 default:
5258                         break;
5259                 }
5260         }
5261
5262         return true;
5263
5264 disabled:
5265                 dev_info(adev->dev, "GPU recovery disabled.\n");
5266                 return false;
5267 }
5268
5269 int amdgpu_device_mode1_reset(struct amdgpu_device *adev)
5270 {
5271         u32 i;
5272         int ret = 0;
5273
5274         amdgpu_atombios_scratch_regs_engine_hung(adev, true);
5275
5276         dev_info(adev->dev, "GPU mode1 reset\n");
5277
5278         /* Cache the state before bus master disable. The saved config space
5279          * values are used in other cases like restore after mode-2 reset.
5280          */
5281         amdgpu_device_cache_pci_state(adev->pdev);
5282
5283         /* disable BM */
5284         pci_clear_master(adev->pdev);
5285
5286         if (amdgpu_dpm_is_mode1_reset_supported(adev)) {
5287                 dev_info(adev->dev, "GPU smu mode1 reset\n");
5288                 ret = amdgpu_dpm_mode1_reset(adev);
5289         } else {
5290                 dev_info(adev->dev, "GPU psp mode1 reset\n");
5291                 ret = psp_gpu_reset(adev);
5292         }
5293
5294         if (ret)
5295                 goto mode1_reset_failed;
5296
5297         amdgpu_device_load_pci_state(adev->pdev);
5298         ret = amdgpu_psp_wait_for_bootloader(adev);
5299         if (ret)
5300                 goto mode1_reset_failed;
5301
5302         /* wait for asic to come out of reset */
5303         for (i = 0; i < adev->usec_timeout; i++) {
5304                 u32 memsize = adev->nbio.funcs->get_memsize(adev);
5305
5306                 if (memsize != 0xffffffff)
5307                         break;
5308                 udelay(1);
5309         }
5310
5311         if (i >= adev->usec_timeout) {
5312                 ret = -ETIMEDOUT;
5313                 goto mode1_reset_failed;
5314         }
5315
5316         amdgpu_atombios_scratch_regs_engine_hung(adev, false);
5317
5318         return 0;
5319
5320 mode1_reset_failed:
5321         dev_err(adev->dev, "GPU mode1 reset failed\n");
5322         return ret;
5323 }
5324
5325 int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev,
5326                                  struct amdgpu_reset_context *reset_context)
5327 {
5328         int i, r = 0;
5329         struct amdgpu_job *job = NULL;
5330         struct amdgpu_device *tmp_adev = reset_context->reset_req_dev;
5331         bool need_full_reset =
5332                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5333
5334         if (reset_context->reset_req_dev == adev)
5335                 job = reset_context->job;
5336
5337         if (amdgpu_sriov_vf(adev))
5338                 amdgpu_virt_pre_reset(adev);
5339
5340         amdgpu_fence_driver_isr_toggle(adev, true);
5341
5342         /* block all schedulers and reset given job's ring */
5343         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5344                 struct amdgpu_ring *ring = adev->rings[i];
5345
5346                 if (!amdgpu_ring_sched_ready(ring))
5347                         continue;
5348
5349                 /* Clear job fence from fence drv to avoid force_completion
5350                  * leave NULL and vm flush fence in fence drv
5351                  */
5352                 amdgpu_fence_driver_clear_job_fences(ring);
5353
5354                 /* after all hw jobs are reset, hw fence is meaningless, so force_completion */
5355                 amdgpu_fence_driver_force_completion(ring);
5356         }
5357
5358         amdgpu_fence_driver_isr_toggle(adev, false);
5359
5360         if (job && job->vm)
5361                 drm_sched_increase_karma(&job->base);
5362
5363         r = amdgpu_reset_prepare_hwcontext(adev, reset_context);
5364         /* If reset handler not implemented, continue; otherwise return */
5365         if (r == -EOPNOTSUPP)
5366                 r = 0;
5367         else
5368                 return r;
5369
5370         /* Don't suspend on bare metal if we are not going to HW reset the ASIC */
5371         if (!amdgpu_sriov_vf(adev)) {
5372
5373                 if (!need_full_reset)
5374                         need_full_reset = amdgpu_device_ip_need_full_reset(adev);
5375
5376                 if (!need_full_reset && amdgpu_gpu_recovery &&
5377                     amdgpu_device_ip_check_soft_reset(adev)) {
5378                         amdgpu_device_ip_pre_soft_reset(adev);
5379                         r = amdgpu_device_ip_soft_reset(adev);
5380                         amdgpu_device_ip_post_soft_reset(adev);
5381                         if (r || amdgpu_device_ip_check_soft_reset(adev)) {
5382                                 dev_info(adev->dev, "soft reset failed, will fallback to full reset!\n");
5383                                 need_full_reset = true;
5384                         }
5385                 }
5386
5387                 if (!test_bit(AMDGPU_SKIP_COREDUMP, &reset_context->flags)) {
5388                         dev_info(tmp_adev->dev, "Dumping IP State\n");
5389                         /* Trigger ip dump before we reset the asic */
5390                         for (i = 0; i < tmp_adev->num_ip_blocks; i++)
5391                                 if (tmp_adev->ip_blocks[i].version->funcs->dump_ip_state)
5392                                         tmp_adev->ip_blocks[i].version->funcs
5393                                                 ->dump_ip_state((void *)tmp_adev);
5394                         dev_info(tmp_adev->dev, "Dumping IP State Completed\n");
5395                 }
5396
5397                 if (need_full_reset)
5398                         r = amdgpu_device_ip_suspend(adev);
5399                 if (need_full_reset)
5400                         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5401                 else
5402                         clear_bit(AMDGPU_NEED_FULL_RESET,
5403                                   &reset_context->flags);
5404         }
5405
5406         return r;
5407 }
5408
5409 int amdgpu_do_asic_reset(struct list_head *device_list_handle,
5410                          struct amdgpu_reset_context *reset_context)
5411 {
5412         struct amdgpu_device *tmp_adev = NULL;
5413         bool need_full_reset, skip_hw_reset, vram_lost = false;
5414         int r = 0;
5415
5416         /* Try reset handler method first */
5417         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5418                                     reset_list);
5419
5420         reset_context->reset_device_list = device_list_handle;
5421         r = amdgpu_reset_perform_reset(tmp_adev, reset_context);
5422         /* If reset handler not implemented, continue; otherwise return */
5423         if (r == -EOPNOTSUPP)
5424                 r = 0;
5425         else
5426                 return r;
5427
5428         /* Reset handler not implemented, use the default method */
5429         need_full_reset =
5430                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5431         skip_hw_reset = test_bit(AMDGPU_SKIP_HW_RESET, &reset_context->flags);
5432
5433         /*
5434          * ASIC reset has to be done on all XGMI hive nodes ASAP
5435          * to allow proper links negotiation in FW (within 1 sec)
5436          */
5437         if (!skip_hw_reset && need_full_reset) {
5438                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5439                         /* For XGMI run all resets in parallel to speed up the process */
5440                         if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
5441                                 tmp_adev->gmc.xgmi.pending_reset = false;
5442                                 if (!queue_work(system_unbound_wq, &tmp_adev->xgmi_reset_work))
5443                                         r = -EALREADY;
5444                         } else
5445                                 r = amdgpu_asic_reset(tmp_adev);
5446
5447                         if (r) {
5448                                 dev_err(tmp_adev->dev, "ASIC reset failed with error, %d for drm dev, %s",
5449                                          r, adev_to_drm(tmp_adev)->unique);
5450                                 goto out;
5451                         }
5452                 }
5453
5454                 /* For XGMI wait for all resets to complete before proceed */
5455                 if (!r) {
5456                         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5457                                 if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
5458                                         flush_work(&tmp_adev->xgmi_reset_work);
5459                                         r = tmp_adev->asic_reset_res;
5460                                         if (r)
5461                                                 break;
5462                                 }
5463                         }
5464                 }
5465         }
5466
5467         if (!r && amdgpu_ras_intr_triggered()) {
5468                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5469                         amdgpu_ras_reset_error_count(tmp_adev, AMDGPU_RAS_BLOCK__MMHUB);
5470                 }
5471
5472                 amdgpu_ras_intr_cleared();
5473         }
5474
5475         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5476                 if (need_full_reset) {
5477                         /* post card */
5478                         amdgpu_ras_set_fed(tmp_adev, false);
5479                         r = amdgpu_device_asic_init(tmp_adev);
5480                         if (r) {
5481                                 dev_warn(tmp_adev->dev, "asic atom init failed!");
5482                         } else {
5483                                 dev_info(tmp_adev->dev, "GPU reset succeeded, trying to resume\n");
5484
5485                                 r = amdgpu_device_ip_resume_phase1(tmp_adev);
5486                                 if (r)
5487                                         goto out;
5488
5489                                 vram_lost = amdgpu_device_check_vram_lost(tmp_adev);
5490
5491                                 if (!test_bit(AMDGPU_SKIP_COREDUMP, &reset_context->flags))
5492                                         amdgpu_coredump(tmp_adev, false, vram_lost, reset_context->job);
5493
5494                                 if (vram_lost) {
5495                                         DRM_INFO("VRAM is lost due to GPU reset!\n");
5496                                         amdgpu_inc_vram_lost(tmp_adev);
5497                                 }
5498
5499                                 r = amdgpu_device_fw_loading(tmp_adev);
5500                                 if (r)
5501                                         return r;
5502
5503                                 r = amdgpu_xcp_restore_partition_mode(
5504                                         tmp_adev->xcp_mgr);
5505                                 if (r)
5506                                         goto out;
5507
5508                                 r = amdgpu_device_ip_resume_phase2(tmp_adev);
5509                                 if (r)
5510                                         goto out;
5511
5512                                 if (tmp_adev->mman.buffer_funcs_ring->sched.ready)
5513                                         amdgpu_ttm_set_buffer_funcs_status(tmp_adev, true);
5514
5515                                 if (vram_lost)
5516                                         amdgpu_device_fill_reset_magic(tmp_adev);
5517
5518                                 /*
5519                                  * Add this ASIC as tracked as reset was already
5520                                  * complete successfully.
5521                                  */
5522                                 amdgpu_register_gpu_instance(tmp_adev);
5523
5524                                 if (!reset_context->hive &&
5525                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
5526                                         amdgpu_xgmi_add_device(tmp_adev);
5527
5528                                 r = amdgpu_device_ip_late_init(tmp_adev);
5529                                 if (r)
5530                                         goto out;
5531
5532                                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, false);
5533
5534                                 /*
5535                                  * The GPU enters bad state once faulty pages
5536                                  * by ECC has reached the threshold, and ras
5537                                  * recovery is scheduled next. So add one check
5538                                  * here to break recovery if it indeed exceeds
5539                                  * bad page threshold, and remind user to
5540                                  * retire this GPU or setting one bigger
5541                                  * bad_page_threshold value to fix this once
5542                                  * probing driver again.
5543                                  */
5544                                 if (!amdgpu_ras_is_rma(tmp_adev)) {
5545                                         /* must succeed. */
5546                                         amdgpu_ras_resume(tmp_adev);
5547                                 } else {
5548                                         r = -EINVAL;
5549                                         goto out;
5550                                 }
5551
5552                                 /* Update PSP FW topology after reset */
5553                                 if (reset_context->hive &&
5554                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
5555                                         r = amdgpu_xgmi_update_topology(
5556                                                 reset_context->hive, tmp_adev);
5557                         }
5558                 }
5559
5560 out:
5561                 if (!r) {
5562                         amdgpu_irq_gpu_reset_resume_helper(tmp_adev);
5563                         r = amdgpu_ib_ring_tests(tmp_adev);
5564                         if (r) {
5565                                 dev_err(tmp_adev->dev, "ib ring test failed (%d).\n", r);
5566                                 need_full_reset = true;
5567                                 r = -EAGAIN;
5568                                 goto end;
5569                         }
5570                 }
5571
5572                 if (!r)
5573                         r = amdgpu_device_recover_vram(tmp_adev);
5574                 else
5575                         tmp_adev->asic_reset_res = r;
5576         }
5577
5578 end:
5579         if (need_full_reset)
5580                 set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5581         else
5582                 clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5583         return r;
5584 }
5585
5586 static void amdgpu_device_set_mp1_state(struct amdgpu_device *adev)
5587 {
5588
5589         switch (amdgpu_asic_reset_method(adev)) {
5590         case AMD_RESET_METHOD_MODE1:
5591                 adev->mp1_state = PP_MP1_STATE_SHUTDOWN;
5592                 break;
5593         case AMD_RESET_METHOD_MODE2:
5594                 adev->mp1_state = PP_MP1_STATE_RESET;
5595                 break;
5596         default:
5597                 adev->mp1_state = PP_MP1_STATE_NONE;
5598                 break;
5599         }
5600 }
5601
5602 static void amdgpu_device_unset_mp1_state(struct amdgpu_device *adev)
5603 {
5604         amdgpu_vf_error_trans_all(adev);
5605         adev->mp1_state = PP_MP1_STATE_NONE;
5606 }
5607
5608 static void amdgpu_device_resume_display_audio(struct amdgpu_device *adev)
5609 {
5610         struct pci_dev *p = NULL;
5611
5612         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5613                         adev->pdev->bus->number, 1);
5614         if (p) {
5615                 pm_runtime_enable(&(p->dev));
5616                 pm_runtime_resume(&(p->dev));
5617         }
5618
5619         pci_dev_put(p);
5620 }
5621
5622 static int amdgpu_device_suspend_display_audio(struct amdgpu_device *adev)
5623 {
5624         enum amd_reset_method reset_method;
5625         struct pci_dev *p = NULL;
5626         u64 expires;
5627
5628         /*
5629          * For now, only BACO and mode1 reset are confirmed
5630          * to suffer the audio issue without proper suspended.
5631          */
5632         reset_method = amdgpu_asic_reset_method(adev);
5633         if ((reset_method != AMD_RESET_METHOD_BACO) &&
5634              (reset_method != AMD_RESET_METHOD_MODE1))
5635                 return -EINVAL;
5636
5637         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5638                         adev->pdev->bus->number, 1);
5639         if (!p)
5640                 return -ENODEV;
5641
5642         expires = pm_runtime_autosuspend_expiration(&(p->dev));
5643         if (!expires)
5644                 /*
5645                  * If we cannot get the audio device autosuspend delay,
5646                  * a fixed 4S interval will be used. Considering 3S is
5647                  * the audio controller default autosuspend delay setting.
5648                  * 4S used here is guaranteed to cover that.
5649                  */
5650                 expires = ktime_get_mono_fast_ns() + NSEC_PER_SEC * 4ULL;
5651
5652         while (!pm_runtime_status_suspended(&(p->dev))) {
5653                 if (!pm_runtime_suspend(&(p->dev)))
5654                         break;
5655
5656                 if (expires < ktime_get_mono_fast_ns()) {
5657                         dev_warn(adev->dev, "failed to suspend display audio\n");
5658                         pci_dev_put(p);
5659                         /* TODO: abort the succeeding gpu reset? */
5660                         return -ETIMEDOUT;
5661                 }
5662         }
5663
5664         pm_runtime_disable(&(p->dev));
5665
5666         pci_dev_put(p);
5667         return 0;
5668 }
5669
5670 static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev)
5671 {
5672         struct amdgpu_ras *con = amdgpu_ras_get_context(adev);
5673
5674 #if defined(CONFIG_DEBUG_FS)
5675         if (!amdgpu_sriov_vf(adev))
5676                 cancel_work(&adev->reset_work);
5677 #endif
5678
5679         if (adev->kfd.dev)
5680                 cancel_work(&adev->kfd.reset_work);
5681
5682         if (amdgpu_sriov_vf(adev))
5683                 cancel_work(&adev->virt.flr_work);
5684
5685         if (con && adev->ras_enabled)
5686                 cancel_work(&con->recovery_work);
5687
5688 }
5689
5690 static int amdgpu_device_health_check(struct list_head *device_list_handle)
5691 {
5692         struct amdgpu_device *tmp_adev;
5693         int ret = 0;
5694         u32 status;
5695
5696         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5697                 pci_read_config_dword(tmp_adev->pdev, PCI_COMMAND, &status);
5698                 if (PCI_POSSIBLE_ERROR(status)) {
5699                         dev_err(tmp_adev->dev, "device lost from bus!");
5700                         ret = -ENODEV;
5701                 }
5702         }
5703
5704         return ret;
5705 }
5706
5707 /**
5708  * amdgpu_device_gpu_recover - reset the asic and recover scheduler
5709  *
5710  * @adev: amdgpu_device pointer
5711  * @job: which job trigger hang
5712  * @reset_context: amdgpu reset context pointer
5713  *
5714  * Attempt to reset the GPU if it has hung (all asics).
5715  * Attempt to do soft-reset or full-reset and reinitialize Asic
5716  * Returns 0 for success or an error on failure.
5717  */
5718
5719 int amdgpu_device_gpu_recover(struct amdgpu_device *adev,
5720                               struct amdgpu_job *job,
5721                               struct amdgpu_reset_context *reset_context)
5722 {
5723         struct list_head device_list, *device_list_handle =  NULL;
5724         bool job_signaled = false;
5725         struct amdgpu_hive_info *hive = NULL;
5726         struct amdgpu_device *tmp_adev = NULL;
5727         int i, r = 0;
5728         bool need_emergency_restart = false;
5729         bool audio_suspended = false;
5730         int retry_limit = AMDGPU_MAX_RETRY_LIMIT;
5731
5732         /*
5733          * Special case: RAS triggered and full reset isn't supported
5734          */
5735         need_emergency_restart = amdgpu_ras_need_emergency_restart(adev);
5736
5737         /*
5738          * Flush RAM to disk so that after reboot
5739          * the user can read log and see why the system rebooted.
5740          */
5741         if (need_emergency_restart && amdgpu_ras_get_context(adev) &&
5742                 amdgpu_ras_get_context(adev)->reboot) {
5743                 DRM_WARN("Emergency reboot.");
5744
5745                 ksys_sync_helper();
5746                 emergency_restart();
5747         }
5748
5749         dev_info(adev->dev, "GPU %s begin!\n",
5750                 need_emergency_restart ? "jobs stop":"reset");
5751
5752         if (!amdgpu_sriov_vf(adev))
5753                 hive = amdgpu_get_xgmi_hive(adev);
5754         if (hive)
5755                 mutex_lock(&hive->hive_lock);
5756
5757         reset_context->job = job;
5758         reset_context->hive = hive;
5759         /*
5760          * Build list of devices to reset.
5761          * In case we are in XGMI hive mode, resort the device list
5762          * to put adev in the 1st position.
5763          */
5764         INIT_LIST_HEAD(&device_list);
5765         if (!amdgpu_sriov_vf(adev) && (adev->gmc.xgmi.num_physical_nodes > 1) && hive) {
5766                 list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head) {
5767                         list_add_tail(&tmp_adev->reset_list, &device_list);
5768                         if (adev->shutdown)
5769                                 tmp_adev->shutdown = true;
5770                 }
5771                 if (!list_is_first(&adev->reset_list, &device_list))
5772                         list_rotate_to_front(&adev->reset_list, &device_list);
5773                 device_list_handle = &device_list;
5774         } else {
5775                 list_add_tail(&adev->reset_list, &device_list);
5776                 device_list_handle = &device_list;
5777         }
5778
5779         if (!amdgpu_sriov_vf(adev)) {
5780                 r = amdgpu_device_health_check(device_list_handle);
5781                 if (r)
5782                         goto end_reset;
5783         }
5784
5785         /* We need to lock reset domain only once both for XGMI and single device */
5786         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5787                                     reset_list);
5788         amdgpu_device_lock_reset_domain(tmp_adev->reset_domain);
5789
5790         /* block all schedulers and reset given job's ring */
5791         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5792
5793                 amdgpu_device_set_mp1_state(tmp_adev);
5794
5795                 /*
5796                  * Try to put the audio codec into suspend state
5797                  * before gpu reset started.
5798                  *
5799                  * Due to the power domain of the graphics device
5800                  * is shared with AZ power domain. Without this,
5801                  * we may change the audio hardware from behind
5802                  * the audio driver's back. That will trigger
5803                  * some audio codec errors.
5804                  */
5805                 if (!amdgpu_device_suspend_display_audio(tmp_adev))
5806                         audio_suspended = true;
5807
5808                 amdgpu_ras_set_error_query_ready(tmp_adev, false);
5809
5810                 cancel_delayed_work_sync(&tmp_adev->delayed_init_work);
5811
5812                 amdgpu_amdkfd_pre_reset(tmp_adev, reset_context);
5813
5814                 /*
5815                  * Mark these ASICs to be reseted as untracked first
5816                  * And add them back after reset completed
5817                  */
5818                 amdgpu_unregister_gpu_instance(tmp_adev);
5819
5820                 drm_fb_helper_set_suspend_unlocked(adev_to_drm(tmp_adev)->fb_helper, true);
5821
5822                 /* disable ras on ALL IPs */
5823                 if (!need_emergency_restart &&
5824                       amdgpu_device_ip_need_full_reset(tmp_adev))
5825                         amdgpu_ras_suspend(tmp_adev);
5826
5827                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5828                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5829
5830                         if (!amdgpu_ring_sched_ready(ring))
5831                                 continue;
5832
5833                         drm_sched_stop(&ring->sched, job ? &job->base : NULL);
5834
5835                         if (need_emergency_restart)
5836                                 amdgpu_job_stop_all_jobs_on_sched(&ring->sched);
5837                 }
5838                 atomic_inc(&tmp_adev->gpu_reset_counter);
5839         }
5840
5841         if (need_emergency_restart)
5842                 goto skip_sched_resume;
5843
5844         /*
5845          * Must check guilty signal here since after this point all old
5846          * HW fences are force signaled.
5847          *
5848          * job->base holds a reference to parent fence
5849          */
5850         if (job && dma_fence_is_signaled(&job->hw_fence)) {
5851                 job_signaled = true;
5852                 dev_info(adev->dev, "Guilty job already signaled, skipping HW reset");
5853                 goto skip_hw_reset;
5854         }
5855
5856 retry:  /* Rest of adevs pre asic reset from XGMI hive. */
5857         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5858                 r = amdgpu_device_pre_asic_reset(tmp_adev, reset_context);
5859                 /*TODO Should we stop ?*/
5860                 if (r) {
5861                         dev_err(tmp_adev->dev, "GPU pre asic reset failed with err, %d for drm dev, %s ",
5862                                   r, adev_to_drm(tmp_adev)->unique);
5863                         tmp_adev->asic_reset_res = r;
5864                 }
5865         }
5866
5867         /* Actual ASIC resets if needed.*/
5868         /* Host driver will handle XGMI hive reset for SRIOV */
5869         if (amdgpu_sriov_vf(adev)) {
5870                 if (amdgpu_ras_get_fed_status(adev) || amdgpu_virt_rcvd_ras_interrupt(adev)) {
5871                         dev_dbg(adev->dev, "Detected RAS error, wait for FLR completion\n");
5872                         amdgpu_ras_set_fed(adev, true);
5873                         set_bit(AMDGPU_HOST_FLR, &reset_context->flags);
5874                 }
5875
5876                 r = amdgpu_device_reset_sriov(adev, reset_context);
5877                 if (AMDGPU_RETRY_SRIOV_RESET(r) && (retry_limit--) > 0) {
5878                         amdgpu_virt_release_full_gpu(adev, true);
5879                         goto retry;
5880                 }
5881                 if (r)
5882                         adev->asic_reset_res = r;
5883         } else {
5884                 r = amdgpu_do_asic_reset(device_list_handle, reset_context);
5885                 if (r && r == -EAGAIN)
5886                         goto retry;
5887         }
5888
5889         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5890                 /*
5891                  * Drop any pending non scheduler resets queued before reset is done.
5892                  * Any reset scheduled after this point would be valid. Scheduler resets
5893                  * were already dropped during drm_sched_stop and no new ones can come
5894                  * in before drm_sched_start.
5895                  */
5896                 amdgpu_device_stop_pending_resets(tmp_adev);
5897         }
5898
5899 skip_hw_reset:
5900
5901         /* Post ASIC reset for all devs .*/
5902         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5903
5904                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5905                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5906
5907                         if (!amdgpu_ring_sched_ready(ring))
5908                                 continue;
5909
5910                         drm_sched_start(&ring->sched);
5911                 }
5912
5913                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(tmp_adev)) && !job_signaled)
5914                         drm_helper_resume_force_mode(adev_to_drm(tmp_adev));
5915
5916                 if (tmp_adev->asic_reset_res)
5917                         r = tmp_adev->asic_reset_res;
5918
5919                 tmp_adev->asic_reset_res = 0;
5920
5921                 if (r) {
5922                         /* bad news, how to tell it to userspace ?
5923                          * for ras error, we should report GPU bad status instead of
5924                          * reset failure
5925                          */
5926                         if (reset_context->src != AMDGPU_RESET_SRC_RAS ||
5927                             !amdgpu_ras_eeprom_check_err_threshold(tmp_adev))
5928                                 dev_info(tmp_adev->dev, "GPU reset(%d) failed\n",
5929                                         atomic_read(&tmp_adev->gpu_reset_counter));
5930                         amdgpu_vf_error_put(tmp_adev, AMDGIM_ERROR_VF_GPU_RESET_FAIL, 0, r);
5931                 } else {
5932                         dev_info(tmp_adev->dev, "GPU reset(%d) succeeded!\n", atomic_read(&tmp_adev->gpu_reset_counter));
5933                         if (amdgpu_acpi_smart_shift_update(adev_to_drm(tmp_adev), AMDGPU_SS_DEV_D0))
5934                                 DRM_WARN("smart shift update failed\n");
5935                 }
5936         }
5937
5938 skip_sched_resume:
5939         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5940                 /* unlock kfd: SRIOV would do it separately */
5941                 if (!need_emergency_restart && !amdgpu_sriov_vf(tmp_adev))
5942                         amdgpu_amdkfd_post_reset(tmp_adev);
5943
5944                 /* kfd_post_reset will do nothing if kfd device is not initialized,
5945                  * need to bring up kfd here if it's not be initialized before
5946                  */
5947                 if (!adev->kfd.init_complete)
5948                         amdgpu_amdkfd_device_init(adev);
5949
5950                 if (audio_suspended)
5951                         amdgpu_device_resume_display_audio(tmp_adev);
5952
5953                 amdgpu_device_unset_mp1_state(tmp_adev);
5954
5955                 amdgpu_ras_set_error_query_ready(tmp_adev, true);
5956         }
5957
5958         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5959                                             reset_list);
5960         amdgpu_device_unlock_reset_domain(tmp_adev->reset_domain);
5961
5962 end_reset:
5963         if (hive) {
5964                 mutex_unlock(&hive->hive_lock);
5965                 amdgpu_put_xgmi_hive(hive);
5966         }
5967
5968         if (r)
5969                 dev_info(adev->dev, "GPU reset end with ret = %d\n", r);
5970
5971         atomic_set(&adev->reset_domain->reset_res, r);
5972         return r;
5973 }
5974
5975 /**
5976  * amdgpu_device_partner_bandwidth - find the bandwidth of appropriate partner
5977  *
5978  * @adev: amdgpu_device pointer
5979  * @speed: pointer to the speed of the link
5980  * @width: pointer to the width of the link
5981  *
5982  * Evaluate the hierarchy to find the speed and bandwidth capabilities of the
5983  * first physical partner to an AMD dGPU.
5984  * This will exclude any virtual switches and links.
5985  */
5986 static void amdgpu_device_partner_bandwidth(struct amdgpu_device *adev,
5987                                             enum pci_bus_speed *speed,
5988                                             enum pcie_link_width *width)
5989 {
5990         struct pci_dev *parent = adev->pdev;
5991
5992         if (!speed || !width)
5993                 return;
5994
5995         *speed = PCI_SPEED_UNKNOWN;
5996         *width = PCIE_LNK_WIDTH_UNKNOWN;
5997
5998         if (amdgpu_device_pcie_dynamic_switching_supported(adev)) {
5999                 while ((parent = pci_upstream_bridge(parent))) {
6000                         /* skip upstream/downstream switches internal to dGPU*/
6001                         if (parent->vendor == PCI_VENDOR_ID_ATI)
6002                                 continue;
6003                         *speed = pcie_get_speed_cap(parent);
6004                         *width = pcie_get_width_cap(parent);
6005                         break;
6006                 }
6007         } else {
6008                 /* use the current speeds rather than max if switching is not supported */
6009                 pcie_bandwidth_available(adev->pdev, NULL, speed, width);
6010         }
6011 }
6012
6013 /**
6014  * amdgpu_device_get_pcie_info - fence pcie info about the PCIE slot
6015  *
6016  * @adev: amdgpu_device pointer
6017  *
6018  * Fetchs and stores in the driver the PCIE capabilities (gen speed
6019  * and lanes) of the slot the device is in. Handles APUs and
6020  * virtualized environments where PCIE config space may not be available.
6021  */
6022 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev)
6023 {
6024         struct pci_dev *pdev;
6025         enum pci_bus_speed speed_cap, platform_speed_cap;
6026         enum pcie_link_width platform_link_width;
6027
6028         if (amdgpu_pcie_gen_cap)
6029                 adev->pm.pcie_gen_mask = amdgpu_pcie_gen_cap;
6030
6031         if (amdgpu_pcie_lane_cap)
6032                 adev->pm.pcie_mlw_mask = amdgpu_pcie_lane_cap;
6033
6034         /* covers APUs as well */
6035         if (pci_is_root_bus(adev->pdev->bus) && !amdgpu_passthrough(adev)) {
6036                 if (adev->pm.pcie_gen_mask == 0)
6037                         adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
6038                 if (adev->pm.pcie_mlw_mask == 0)
6039                         adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
6040                 return;
6041         }
6042
6043         if (adev->pm.pcie_gen_mask && adev->pm.pcie_mlw_mask)
6044                 return;
6045
6046         amdgpu_device_partner_bandwidth(adev, &platform_speed_cap,
6047                                         &platform_link_width);
6048
6049         if (adev->pm.pcie_gen_mask == 0) {
6050                 /* asic caps */
6051                 pdev = adev->pdev;
6052                 speed_cap = pcie_get_speed_cap(pdev);
6053                 if (speed_cap == PCI_SPEED_UNKNOWN) {
6054                         adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6055                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6056                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
6057                 } else {
6058                         if (speed_cap == PCIE_SPEED_32_0GT)
6059                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6060                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6061                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6062                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4 |
6063                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN5);
6064                         else if (speed_cap == PCIE_SPEED_16_0GT)
6065                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6066                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6067                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6068                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4);
6069                         else if (speed_cap == PCIE_SPEED_8_0GT)
6070                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6071                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6072                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
6073                         else if (speed_cap == PCIE_SPEED_5_0GT)
6074                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6075                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2);
6076                         else
6077                                 adev->pm.pcie_gen_mask |= CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1;
6078                 }
6079                 /* platform caps */
6080                 if (platform_speed_cap == PCI_SPEED_UNKNOWN) {
6081                         adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6082                                                    CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
6083                 } else {
6084                         if (platform_speed_cap == PCIE_SPEED_32_0GT)
6085                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6086                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6087                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6088                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4 |
6089                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN5);
6090                         else if (platform_speed_cap == PCIE_SPEED_16_0GT)
6091                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6092                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6093                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6094                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4);
6095                         else if (platform_speed_cap == PCIE_SPEED_8_0GT)
6096                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6097                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6098                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3);
6099                         else if (platform_speed_cap == PCIE_SPEED_5_0GT)
6100                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6101                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
6102                         else
6103                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1;
6104
6105                 }
6106         }
6107         if (adev->pm.pcie_mlw_mask == 0) {
6108                 if (platform_link_width == PCIE_LNK_WIDTH_UNKNOWN) {
6109                         adev->pm.pcie_mlw_mask |= AMDGPU_DEFAULT_PCIE_MLW_MASK;
6110                 } else {
6111                         switch (platform_link_width) {
6112                         case PCIE_LNK_X32:
6113                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X32 |
6114                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
6115                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6116                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6117                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6118                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6119                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6120                                 break;
6121                         case PCIE_LNK_X16:
6122                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
6123                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6124                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6125                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6126                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6127                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6128                                 break;
6129                         case PCIE_LNK_X12:
6130                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6131                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6132                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6133                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6134                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6135                                 break;
6136                         case PCIE_LNK_X8:
6137                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6138                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6139                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6140                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6141                                 break;
6142                         case PCIE_LNK_X4:
6143                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6144                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6145                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6146                                 break;
6147                         case PCIE_LNK_X2:
6148                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6149                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6150                                 break;
6151                         case PCIE_LNK_X1:
6152                                 adev->pm.pcie_mlw_mask = CAIL_PCIE_LINK_WIDTH_SUPPORT_X1;
6153                                 break;
6154                         default:
6155                                 break;
6156                         }
6157                 }
6158         }
6159 }
6160
6161 /**
6162  * amdgpu_device_is_peer_accessible - Check peer access through PCIe BAR
6163  *
6164  * @adev: amdgpu_device pointer
6165  * @peer_adev: amdgpu_device pointer for peer device trying to access @adev
6166  *
6167  * Return true if @peer_adev can access (DMA) @adev through the PCIe
6168  * BAR, i.e. @adev is "large BAR" and the BAR matches the DMA mask of
6169  * @peer_adev.
6170  */
6171 bool amdgpu_device_is_peer_accessible(struct amdgpu_device *adev,
6172                                       struct amdgpu_device *peer_adev)
6173 {
6174 #ifdef CONFIG_HSA_AMD_P2P
6175         bool p2p_access =
6176                 !adev->gmc.xgmi.connected_to_cpu &&
6177                 !(pci_p2pdma_distance(adev->pdev, peer_adev->dev, false) < 0);
6178
6179         bool is_large_bar = adev->gmc.visible_vram_size &&
6180                 adev->gmc.real_vram_size == adev->gmc.visible_vram_size;
6181         bool p2p_addressable = amdgpu_device_check_iommu_remap(peer_adev);
6182
6183         if (!p2p_addressable) {
6184                 uint64_t address_mask = peer_adev->dev->dma_mask ?
6185                         ~*peer_adev->dev->dma_mask : ~((1ULL << 32) - 1);
6186                 resource_size_t aper_limit =
6187                         adev->gmc.aper_base + adev->gmc.aper_size - 1;
6188
6189                 p2p_addressable = !(adev->gmc.aper_base & address_mask ||
6190                                      aper_limit & address_mask);
6191         }
6192         return is_large_bar && p2p_access && p2p_addressable;
6193 #else
6194         return false;
6195 #endif
6196 }
6197
6198 int amdgpu_device_baco_enter(struct drm_device *dev)
6199 {
6200         struct amdgpu_device *adev = drm_to_adev(dev);
6201         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
6202
6203         if (!amdgpu_device_supports_baco(dev))
6204                 return -ENOTSUPP;
6205
6206         if (ras && adev->ras_enabled &&
6207             adev->nbio.funcs->enable_doorbell_interrupt)
6208                 adev->nbio.funcs->enable_doorbell_interrupt(adev, false);
6209
6210         return amdgpu_dpm_baco_enter(adev);
6211 }
6212
6213 int amdgpu_device_baco_exit(struct drm_device *dev)
6214 {
6215         struct amdgpu_device *adev = drm_to_adev(dev);
6216         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
6217         int ret = 0;
6218
6219         if (!amdgpu_device_supports_baco(dev))
6220                 return -ENOTSUPP;
6221
6222         ret = amdgpu_dpm_baco_exit(adev);
6223         if (ret)
6224                 return ret;
6225
6226         if (ras && adev->ras_enabled &&
6227             adev->nbio.funcs->enable_doorbell_interrupt)
6228                 adev->nbio.funcs->enable_doorbell_interrupt(adev, true);
6229
6230         if (amdgpu_passthrough(adev) && adev->nbio.funcs &&
6231             adev->nbio.funcs->clear_doorbell_interrupt)
6232                 adev->nbio.funcs->clear_doorbell_interrupt(adev);
6233
6234         return 0;
6235 }
6236
6237 /**
6238  * amdgpu_pci_error_detected - Called when a PCI error is detected.
6239  * @pdev: PCI device struct
6240  * @state: PCI channel state
6241  *
6242  * Description: Called when a PCI error is detected.
6243  *
6244  * Return: PCI_ERS_RESULT_NEED_RESET or PCI_ERS_RESULT_DISCONNECT.
6245  */
6246 pci_ers_result_t amdgpu_pci_error_detected(struct pci_dev *pdev, pci_channel_state_t state)
6247 {
6248         struct drm_device *dev = pci_get_drvdata(pdev);
6249         struct amdgpu_device *adev = drm_to_adev(dev);
6250         int i;
6251
6252         DRM_INFO("PCI error: detected callback, state(%d)!!\n", state);
6253
6254         if (adev->gmc.xgmi.num_physical_nodes > 1) {
6255                 DRM_WARN("No support for XGMI hive yet...");
6256                 return PCI_ERS_RESULT_DISCONNECT;
6257         }
6258
6259         adev->pci_channel_state = state;
6260
6261         switch (state) {
6262         case pci_channel_io_normal:
6263                 return PCI_ERS_RESULT_CAN_RECOVER;
6264         /* Fatal error, prepare for slot reset */
6265         case pci_channel_io_frozen:
6266                 /*
6267                  * Locking adev->reset_domain->sem will prevent any external access
6268                  * to GPU during PCI error recovery
6269                  */
6270                 amdgpu_device_lock_reset_domain(adev->reset_domain);
6271                 amdgpu_device_set_mp1_state(adev);
6272
6273                 /*
6274                  * Block any work scheduling as we do for regular GPU reset
6275                  * for the duration of the recovery
6276                  */
6277                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
6278                         struct amdgpu_ring *ring = adev->rings[i];
6279
6280                         if (!amdgpu_ring_sched_ready(ring))
6281                                 continue;
6282
6283                         drm_sched_stop(&ring->sched, NULL);
6284                 }
6285                 atomic_inc(&adev->gpu_reset_counter);
6286                 return PCI_ERS_RESULT_NEED_RESET;
6287         case pci_channel_io_perm_failure:
6288                 /* Permanent error, prepare for device removal */
6289                 return PCI_ERS_RESULT_DISCONNECT;
6290         }
6291
6292         return PCI_ERS_RESULT_NEED_RESET;
6293 }
6294
6295 /**
6296  * amdgpu_pci_mmio_enabled - Enable MMIO and dump debug registers
6297  * @pdev: pointer to PCI device
6298  */
6299 pci_ers_result_t amdgpu_pci_mmio_enabled(struct pci_dev *pdev)
6300 {
6301
6302         DRM_INFO("PCI error: mmio enabled callback!!\n");
6303
6304         /* TODO - dump whatever for debugging purposes */
6305
6306         /* This called only if amdgpu_pci_error_detected returns
6307          * PCI_ERS_RESULT_CAN_RECOVER. Read/write to the device still
6308          * works, no need to reset slot.
6309          */
6310
6311         return PCI_ERS_RESULT_RECOVERED;
6312 }
6313
6314 /**
6315  * amdgpu_pci_slot_reset - Called when PCI slot has been reset.
6316  * @pdev: PCI device struct
6317  *
6318  * Description: This routine is called by the pci error recovery
6319  * code after the PCI slot has been reset, just before we
6320  * should resume normal operations.
6321  */
6322 pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
6323 {
6324         struct drm_device *dev = pci_get_drvdata(pdev);
6325         struct amdgpu_device *adev = drm_to_adev(dev);
6326         int r, i;
6327         struct amdgpu_reset_context reset_context;
6328         u32 memsize;
6329         struct list_head device_list;
6330
6331         /* PCI error slot reset should be skipped During RAS recovery */
6332         if ((amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
6333             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4)) &&
6334             amdgpu_ras_in_recovery(adev))
6335                 return PCI_ERS_RESULT_RECOVERED;
6336
6337         DRM_INFO("PCI error: slot reset callback!!\n");
6338
6339         memset(&reset_context, 0, sizeof(reset_context));
6340
6341         INIT_LIST_HEAD(&device_list);
6342         list_add_tail(&adev->reset_list, &device_list);
6343
6344         /* wait for asic to come out of reset */
6345         msleep(500);
6346
6347         /* Restore PCI confspace */
6348         amdgpu_device_load_pci_state(pdev);
6349
6350         /* confirm  ASIC came out of reset */
6351         for (i = 0; i < adev->usec_timeout; i++) {
6352                 memsize = amdgpu_asic_get_config_memsize(adev);
6353
6354                 if (memsize != 0xffffffff)
6355                         break;
6356                 udelay(1);
6357         }
6358         if (memsize == 0xffffffff) {
6359                 r = -ETIME;
6360                 goto out;
6361         }
6362
6363         reset_context.method = AMD_RESET_METHOD_NONE;
6364         reset_context.reset_req_dev = adev;
6365         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
6366         set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
6367
6368         adev->no_hw_access = true;
6369         r = amdgpu_device_pre_asic_reset(adev, &reset_context);
6370         adev->no_hw_access = false;
6371         if (r)
6372                 goto out;
6373
6374         r = amdgpu_do_asic_reset(&device_list, &reset_context);
6375
6376 out:
6377         if (!r) {
6378                 if (amdgpu_device_cache_pci_state(adev->pdev))
6379                         pci_restore_state(adev->pdev);
6380
6381                 DRM_INFO("PCIe error recovery succeeded\n");
6382         } else {
6383                 DRM_ERROR("PCIe error recovery failed, err:%d", r);
6384                 amdgpu_device_unset_mp1_state(adev);
6385                 amdgpu_device_unlock_reset_domain(adev->reset_domain);
6386         }
6387
6388         return r ? PCI_ERS_RESULT_DISCONNECT : PCI_ERS_RESULT_RECOVERED;
6389 }
6390
6391 /**
6392  * amdgpu_pci_resume() - resume normal ops after PCI reset
6393  * @pdev: pointer to PCI device
6394  *
6395  * Called when the error recovery driver tells us that its
6396  * OK to resume normal operation.
6397  */
6398 void amdgpu_pci_resume(struct pci_dev *pdev)
6399 {
6400         struct drm_device *dev = pci_get_drvdata(pdev);
6401         struct amdgpu_device *adev = drm_to_adev(dev);
6402         int i;
6403
6404
6405         DRM_INFO("PCI error: resume callback!!\n");
6406
6407         /* Only continue execution for the case of pci_channel_io_frozen */
6408         if (adev->pci_channel_state != pci_channel_io_frozen)
6409                 return;
6410
6411         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
6412                 struct amdgpu_ring *ring = adev->rings[i];
6413
6414                 if (!amdgpu_ring_sched_ready(ring))
6415                         continue;
6416
6417                 drm_sched_start(&ring->sched);
6418         }
6419
6420         amdgpu_device_unset_mp1_state(adev);
6421         amdgpu_device_unlock_reset_domain(adev->reset_domain);
6422 }
6423
6424 bool amdgpu_device_cache_pci_state(struct pci_dev *pdev)
6425 {
6426         struct drm_device *dev = pci_get_drvdata(pdev);
6427         struct amdgpu_device *adev = drm_to_adev(dev);
6428         int r;
6429
6430         r = pci_save_state(pdev);
6431         if (!r) {
6432                 kfree(adev->pci_state);
6433
6434                 adev->pci_state = pci_store_saved_state(pdev);
6435
6436                 if (!adev->pci_state) {
6437                         DRM_ERROR("Failed to store PCI saved state");
6438                         return false;
6439                 }
6440         } else {
6441                 DRM_WARN("Failed to save PCI state, err:%d\n", r);
6442                 return false;
6443         }
6444
6445         return true;
6446 }
6447
6448 bool amdgpu_device_load_pci_state(struct pci_dev *pdev)
6449 {
6450         struct drm_device *dev = pci_get_drvdata(pdev);
6451         struct amdgpu_device *adev = drm_to_adev(dev);
6452         int r;
6453
6454         if (!adev->pci_state)
6455                 return false;
6456
6457         r = pci_load_saved_state(pdev, adev->pci_state);
6458
6459         if (!r) {
6460                 pci_restore_state(pdev);
6461         } else {
6462                 DRM_WARN("Failed to load PCI state, err:%d\n", r);
6463                 return false;
6464         }
6465
6466         return true;
6467 }
6468
6469 void amdgpu_device_flush_hdp(struct amdgpu_device *adev,
6470                 struct amdgpu_ring *ring)
6471 {
6472 #ifdef CONFIG_X86_64
6473         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
6474                 return;
6475 #endif
6476         if (adev->gmc.xgmi.connected_to_cpu)
6477                 return;
6478
6479         if (ring && ring->funcs->emit_hdp_flush)
6480                 amdgpu_ring_emit_hdp_flush(ring);
6481         else
6482                 amdgpu_asic_flush_hdp(adev, ring);
6483 }
6484
6485 void amdgpu_device_invalidate_hdp(struct amdgpu_device *adev,
6486                 struct amdgpu_ring *ring)
6487 {
6488 #ifdef CONFIG_X86_64
6489         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
6490                 return;
6491 #endif
6492         if (adev->gmc.xgmi.connected_to_cpu)
6493                 return;
6494
6495         amdgpu_asic_invalidate_hdp(adev, ring);
6496 }
6497
6498 int amdgpu_in_reset(struct amdgpu_device *adev)
6499 {
6500         return atomic_read(&adev->reset_domain->in_gpu_reset);
6501 }
6502
6503 /**
6504  * amdgpu_device_halt() - bring hardware to some kind of halt state
6505  *
6506  * @adev: amdgpu_device pointer
6507  *
6508  * Bring hardware to some kind of halt state so that no one can touch it
6509  * any more. It will help to maintain error context when error occurred.
6510  * Compare to a simple hang, the system will keep stable at least for SSH
6511  * access. Then it should be trivial to inspect the hardware state and
6512  * see what's going on. Implemented as following:
6513  *
6514  * 1. drm_dev_unplug() makes device inaccessible to user space(IOCTLs, etc),
6515  *    clears all CPU mappings to device, disallows remappings through page faults
6516  * 2. amdgpu_irq_disable_all() disables all interrupts
6517  * 3. amdgpu_fence_driver_hw_fini() signals all HW fences
6518  * 4. set adev->no_hw_access to avoid potential crashes after setp 5
6519  * 5. amdgpu_device_unmap_mmio() clears all MMIO mappings
6520  * 6. pci_disable_device() and pci_wait_for_pending_transaction()
6521  *    flush any in flight DMA operations
6522  */
6523 void amdgpu_device_halt(struct amdgpu_device *adev)
6524 {
6525         struct pci_dev *pdev = adev->pdev;
6526         struct drm_device *ddev = adev_to_drm(adev);
6527
6528         amdgpu_xcp_dev_unplug(adev);
6529         drm_dev_unplug(ddev);
6530
6531         amdgpu_irq_disable_all(adev);
6532
6533         amdgpu_fence_driver_hw_fini(adev);
6534
6535         adev->no_hw_access = true;
6536
6537         amdgpu_device_unmap_mmio(adev);
6538
6539         pci_disable_device(pdev);
6540         pci_wait_for_pending_transaction(pdev);
6541 }
6542
6543 u32 amdgpu_device_pcie_port_rreg(struct amdgpu_device *adev,
6544                                 u32 reg)
6545 {
6546         unsigned long flags, address, data;
6547         u32 r;
6548
6549         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
6550         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
6551
6552         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
6553         WREG32(address, reg * 4);
6554         (void)RREG32(address);
6555         r = RREG32(data);
6556         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
6557         return r;
6558 }
6559
6560 void amdgpu_device_pcie_port_wreg(struct amdgpu_device *adev,
6561                                 u32 reg, u32 v)
6562 {
6563         unsigned long flags, address, data;
6564
6565         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
6566         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
6567
6568         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
6569         WREG32(address, reg * 4);
6570         (void)RREG32(address);
6571         WREG32(data, v);
6572         (void)RREG32(data);
6573         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
6574 }
6575
6576 /**
6577  * amdgpu_device_get_gang - return a reference to the current gang
6578  * @adev: amdgpu_device pointer
6579  *
6580  * Returns: A new reference to the current gang leader.
6581  */
6582 struct dma_fence *amdgpu_device_get_gang(struct amdgpu_device *adev)
6583 {
6584         struct dma_fence *fence;
6585
6586         rcu_read_lock();
6587         fence = dma_fence_get_rcu_safe(&adev->gang_submit);
6588         rcu_read_unlock();
6589         return fence;
6590 }
6591
6592 /**
6593  * amdgpu_device_switch_gang - switch to a new gang
6594  * @adev: amdgpu_device pointer
6595  * @gang: the gang to switch to
6596  *
6597  * Try to switch to a new gang.
6598  * Returns: NULL if we switched to the new gang or a reference to the current
6599  * gang leader.
6600  */
6601 struct dma_fence *amdgpu_device_switch_gang(struct amdgpu_device *adev,
6602                                             struct dma_fence *gang)
6603 {
6604         struct dma_fence *old = NULL;
6605
6606         do {
6607                 dma_fence_put(old);
6608                 old = amdgpu_device_get_gang(adev);
6609                 if (old == gang)
6610                         break;
6611
6612                 if (!dma_fence_is_signaled(old))
6613                         return old;
6614
6615         } while (cmpxchg((struct dma_fence __force **)&adev->gang_submit,
6616                          old, gang) != old);
6617
6618         dma_fence_put(old);
6619         return NULL;
6620 }
6621
6622 bool amdgpu_device_has_display_hardware(struct amdgpu_device *adev)
6623 {
6624         switch (adev->asic_type) {
6625 #ifdef CONFIG_DRM_AMDGPU_SI
6626         case CHIP_HAINAN:
6627 #endif
6628         case CHIP_TOPAZ:
6629                 /* chips with no display hardware */
6630                 return false;
6631 #ifdef CONFIG_DRM_AMDGPU_SI
6632         case CHIP_TAHITI:
6633         case CHIP_PITCAIRN:
6634         case CHIP_VERDE:
6635         case CHIP_OLAND:
6636 #endif
6637 #ifdef CONFIG_DRM_AMDGPU_CIK
6638         case CHIP_BONAIRE:
6639         case CHIP_HAWAII:
6640         case CHIP_KAVERI:
6641         case CHIP_KABINI:
6642         case CHIP_MULLINS:
6643 #endif
6644         case CHIP_TONGA:
6645         case CHIP_FIJI:
6646         case CHIP_POLARIS10:
6647         case CHIP_POLARIS11:
6648         case CHIP_POLARIS12:
6649         case CHIP_VEGAM:
6650         case CHIP_CARRIZO:
6651         case CHIP_STONEY:
6652                 /* chips with display hardware */
6653                 return true;
6654         default:
6655                 /* IP discovery */
6656                 if (!amdgpu_ip_version(adev, DCE_HWIP, 0) ||
6657                     (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
6658                         return false;
6659                 return true;
6660         }
6661 }
6662
6663 uint32_t amdgpu_device_wait_on_rreg(struct amdgpu_device *adev,
6664                 uint32_t inst, uint32_t reg_addr, char reg_name[],
6665                 uint32_t expected_value, uint32_t mask)
6666 {
6667         uint32_t ret = 0;
6668         uint32_t old_ = 0;
6669         uint32_t tmp_ = RREG32(reg_addr);
6670         uint32_t loop = adev->usec_timeout;
6671
6672         while ((tmp_ & (mask)) != (expected_value)) {
6673                 if (old_ != tmp_) {
6674                         loop = adev->usec_timeout;
6675                         old_ = tmp_;
6676                 } else
6677                         udelay(1);
6678                 tmp_ = RREG32(reg_addr);
6679                 loop--;
6680                 if (!loop) {
6681                         DRM_WARN("Register(%d) [%s] failed to reach value 0x%08x != 0x%08xn",
6682                                   inst, reg_name, (uint32_t)expected_value,
6683                                   (uint32_t)(tmp_ & (mask)));
6684                         ret = -ETIMEDOUT;
6685                         break;
6686                 }
6687         }
6688         return ret;
6689 }