/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 *          Alex Deucher
 *          Jerome Glisse
 */

#include <linux/aperture.h>
#include <linux/power_supply.h>
#include <linux/kthread.h>
#include <linux/module.h>
#include <linux/console.h>
#include <linux/slab.h>
#include <linux/iommu.h>
#include <linux/pci.h>
#include <linux/pci-p2pdma.h>
#include <linux/apple-gmux.h>

#include <drm/drm_atomic_helper.h>
#include <drm/drm_client_event.h>
#include <drm/drm_crtc_helper.h>
#include <drm/drm_probe_helper.h>
#include <drm/amdgpu_drm.h>
#include <linux/device.h>
#include <linux/vgaarb.h>
#include <linux/vga_switcheroo.h>
#include <linux/efi.h>
#include "amdgpu.h"
#include "amdgpu_trace.h"
#include "amdgpu_i2c.h"
#include "atom.h"
#include "amdgpu_atombios.h"
#include "amdgpu_atomfirmware.h"
#include "amd_pcie.h"
#ifdef CONFIG_DRM_AMDGPU_SI
#include "si.h"
#endif
#ifdef CONFIG_DRM_AMDGPU_CIK
#include "cik.h"
#endif
#include "vi.h"
#include "soc15.h"
#include "nv.h"
#include "bif/bif_4_1_d.h"
#include <linux/firmware.h>
#include "amdgpu_vf_error.h"

#include "amdgpu_amdkfd.h"
#include "amdgpu_pm.h"

#include "amdgpu_xgmi.h"
#include "amdgpu_ras.h"
#include "amdgpu_pmu.h"
#include "amdgpu_fru_eeprom.h"
#include "amdgpu_reset.h"
#include "amdgpu_virt.h"
#include "amdgpu_dev_coredump.h"

#include <linux/suspend.h>
#include <drm/task_barrier.h>
#include <linux/pm_runtime.h>

#include <drm/drm_drv.h>

#if IS_ENABLED(CONFIG_X86)
#include <asm/intel-family.h>
#endif

MODULE_FIRMWARE("amdgpu/vega10_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/vega12_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/raven_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/picasso_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/raven2_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/arcturus_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/navi12_gpu_info.bin");

#define AMDGPU_RESUME_MS                2000
#define AMDGPU_MAX_RETRY_LIMIT          2
#define AMDGPU_RETRY_SRIOV_RESET(r) ((r) == -EBUSY || (r) == -ETIMEDOUT || (r) == -EINVAL)
#define AMDGPU_PCIE_INDEX_FALLBACK (0x38 >> 2)
#define AMDGPU_PCIE_INDEX_HI_FALLBACK (0x44 >> 2)
#define AMDGPU_PCIE_DATA_FALLBACK (0x3C >> 2)

static const struct drm_driver amdgpu_kms_driver;

const char *amdgpu_asic_name[] = {
        "TAHITI",
        "PITCAIRN",
        "VERDE",
        "OLAND",
        "HAINAN",
        "BONAIRE",
        "KAVERI",
        "KABINI",
        "HAWAII",
        "MULLINS",
        "TOPAZ",
        "TONGA",
        "FIJI",
        "CARRIZO",
        "STONEY",
        "POLARIS10",
        "POLARIS11",
        "POLARIS12",
        "VEGAM",
        "VEGA10",
        "VEGA12",
        "VEGA20",
        "RAVEN",
        "ARCTURUS",
        "RENOIR",
        "ALDEBARAN",
        "NAVI10",
        "CYAN_SKILLFISH",
        "NAVI14",
        "NAVI12",
        "SIENNA_CICHLID",
        "NAVY_FLOUNDER",
        "VANGOGH",
        "DIMGREY_CAVEFISH",
        "BEIGE_GOBY",
        "YELLOW_CARP",
        "IP DISCOVERY",
        "LAST",
};

#define AMDGPU_IP_BLK_MASK_ALL GENMASK(AMD_IP_BLOCK_TYPE_NUM - 1, 0)
/*
 * Default init level where all blocks are expected to be initialized. This is
 * the level of initialization expected by default and also after a full reset
 * of the device.
 */
struct amdgpu_init_level amdgpu_init_default = {
        .level = AMDGPU_INIT_LEVEL_DEFAULT,
        .hwini_ip_block_mask = AMDGPU_IP_BLK_MASK_ALL,
};

struct amdgpu_init_level amdgpu_init_recovery = {
        .level = AMDGPU_INIT_LEVEL_RESET_RECOVERY,
        .hwini_ip_block_mask = AMDGPU_IP_BLK_MASK_ALL,
};

/*
 * Minimal blocks needed to be initialized before a XGMI hive can be reset. This
 * is used for cases like reset on initialization where the entire hive needs to
 * be reset before first use.
 */
struct amdgpu_init_level amdgpu_init_minimal_xgmi = {
        .level = AMDGPU_INIT_LEVEL_MINIMAL_XGMI,
        .hwini_ip_block_mask =
                BIT(AMD_IP_BLOCK_TYPE_GMC) | BIT(AMD_IP_BLOCK_TYPE_SMC) |
                BIT(AMD_IP_BLOCK_TYPE_COMMON) | BIT(AMD_IP_BLOCK_TYPE_IH) |
                BIT(AMD_IP_BLOCK_TYPE_PSP)
};

static inline bool amdgpu_ip_member_of_hwini(struct amdgpu_device *adev,
                                             enum amd_ip_block_type block)
{
        return (adev->init_lvl->hwini_ip_block_mask & (1U << block)) != 0;
}

void amdgpu_set_init_level(struct amdgpu_device *adev,
                           enum amdgpu_init_lvl_id lvl)
{
        switch (lvl) {
        case AMDGPU_INIT_LEVEL_MINIMAL_XGMI:
                adev->init_lvl = &amdgpu_init_minimal_xgmi;
                break;
        case AMDGPU_INIT_LEVEL_RESET_RECOVERY:
                adev->init_lvl = &amdgpu_init_recovery;
                break;
        case AMDGPU_INIT_LEVEL_DEFAULT:
                fallthrough;
        default:
                adev->init_lvl = &amdgpu_init_default;
                break;
        }
}
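
/*
 * Illustrative sketch (not part of the driver): per the comment on
 * amdgpu_init_minimal_xgmi above, a reset-on-init flow for an XGMI hive
 * would drop each device to the minimal level, reset the hive, then
 * restore the default level, e.g.:
 *
 *   amdgpu_set_init_level(adev, AMDGPU_INIT_LEVEL_MINIMAL_XGMI);
 *   ...reset the XGMI hive...
 *   amdgpu_set_init_level(adev, AMDGPU_INIT_LEVEL_DEFAULT);
 */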

static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev);

/**
 * DOC: pcie_replay_count
 *
 * The amdgpu driver provides a sysfs API for reporting the total number
 * of PCIe replays (NAKs).
 * The file pcie_replay_count is used for this and returns the total
 * number of replays as the sum of the NAKs generated and NAKs received.
 */

static ssize_t amdgpu_device_get_pcie_replay_count(struct device *dev,
                struct device_attribute *attr, char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);
        uint64_t cnt = amdgpu_asic_get_pcie_replay_count(adev);

        return sysfs_emit(buf, "%llu\n", cnt);
}

static DEVICE_ATTR(pcie_replay_count, 0444,
                amdgpu_device_get_pcie_replay_count, NULL);
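
/*
 * Illustrative use from userspace (not part of the driver; the card index
 * is system dependent):
 *
 *   cat /sys/class/drm/card0/device/pcie_replay_count
 */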

static ssize_t amdgpu_sysfs_reg_state_get(struct file *f, struct kobject *kobj,
                                          struct bin_attribute *attr, char *buf,
                                          loff_t ppos, size_t count)
{
        struct device *dev = kobj_to_dev(kobj);
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);
        ssize_t bytes_read;

        switch (ppos) {
        case AMDGPU_SYS_REG_STATE_XGMI:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_XGMI, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_WAFL:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_WAFL, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_PCIE:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_PCIE, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_USR:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_USR, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_USR_1:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_USR_1, buf, count);
                break;
        default:
                return -EINVAL;
        }

        return bytes_read;
}

BIN_ATTR(reg_state, 0444, amdgpu_sysfs_reg_state_get, NULL,
         AMDGPU_SYS_REG_STATE_END);

int amdgpu_reg_state_sysfs_init(struct amdgpu_device *adev)
{
        int ret;

        if (!amdgpu_asic_get_reg_state_supported(adev))
                return 0;

        ret = sysfs_create_bin_file(&adev->dev->kobj, &bin_attr_reg_state);

        return ret;
}

void amdgpu_reg_state_sysfs_fini(struct amdgpu_device *adev)
{
        if (!amdgpu_asic_get_reg_state_supported(adev))
                return;
        sysfs_remove_bin_file(&adev->dev->kobj, &bin_attr_reg_state);
}

int amdgpu_ip_block_suspend(struct amdgpu_ip_block *ip_block)
{
        int r;

        if (ip_block->version->funcs->suspend) {
                r = ip_block->version->funcs->suspend(ip_block);
                if (r) {
                        dev_err(ip_block->adev->dev,
                                "suspend of IP block <%s> failed %d\n",
                                ip_block->version->funcs->name, r);
                        return r;
                }
        }

        ip_block->status.hw = false;
        return 0;
}

int amdgpu_ip_block_resume(struct amdgpu_ip_block *ip_block)
{
        int r;

        if (ip_block->version->funcs->resume) {
                r = ip_block->version->funcs->resume(ip_block);
                if (r) {
                        dev_err(ip_block->adev->dev,
                                "resume of IP block <%s> failed %d\n",
                                ip_block->version->funcs->name, r);
                        return r;
                }
        }

        ip_block->status.hw = true;
        return 0;
}
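
/*
 * Illustrative sketch (not part of the driver): callers typically pair the
 * two helpers around a power transition and propagate errors, e.g.:
 *
 *   r = amdgpu_ip_block_suspend(ip_block);
 *   if (r)
 *           return r;
 *   ...power down or reset the block...
 *   r = amdgpu_ip_block_resume(ip_block);
 */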

/**
 * DOC: board_info
 *
 * The amdgpu driver provides a sysfs API for giving board related information.
 * It provides the form factor information in the format
 *
 *   type : form factor
 *
 * Possible form factor values
 *
 * - "cem"              - PCIE CEM card
 * - "oam"              - Open Compute Accelerator Module
 * - "unknown"          - Not known
 *
 */

static ssize_t amdgpu_device_get_board_info(struct device *dev,
                                            struct device_attribute *attr,
                                            char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);
        enum amdgpu_pkg_type pkg_type = AMDGPU_PKG_TYPE_CEM;
        const char *pkg;

        if (adev->smuio.funcs && adev->smuio.funcs->get_pkg_type)
                pkg_type = adev->smuio.funcs->get_pkg_type(adev);

        switch (pkg_type) {
        case AMDGPU_PKG_TYPE_CEM:
                pkg = "cem";
                break;
        case AMDGPU_PKG_TYPE_OAM:
                pkg = "oam";
                break;
        default:
                pkg = "unknown";
                break;
        }

        return sysfs_emit(buf, "%s : %s\n", "type", pkg);
}

static DEVICE_ATTR(board_info, 0444, amdgpu_device_get_board_info, NULL);

static struct attribute *amdgpu_board_attrs[] = {
        &dev_attr_board_info.attr,
        NULL,
};

static umode_t amdgpu_board_attrs_is_visible(struct kobject *kobj,
                                             struct attribute *attr, int n)
{
        struct device *dev = kobj_to_dev(kobj);
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);

        if (adev->flags & AMD_IS_APU)
                return 0;

        return attr->mode;
}

static const struct attribute_group amdgpu_board_attrs_group = {
        .attrs = amdgpu_board_attrs,
        .is_visible = amdgpu_board_attrs_is_visible
};

static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev);


/**
 * amdgpu_device_supports_px - Is the device a dGPU with ATPX power control
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with ATPX power control,
 * otherwise return false.
 */
bool amdgpu_device_supports_px(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        if ((adev->flags & AMD_IS_PX) && !amdgpu_is_atpx_hybrid())
                return true;
        return false;
}

/**
 * amdgpu_device_supports_boco - Is the device a dGPU with ACPI power resources
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with ACPI power control,
 * otherwise return false.
 */
bool amdgpu_device_supports_boco(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        if (!IS_ENABLED(CONFIG_HOTPLUG_PCI_PCIE))
                return false;

        if (adev->has_pr3 ||
            ((adev->flags & AMD_IS_PX) && amdgpu_is_atpx_hybrid()))
                return true;
        return false;
}

/**
 * amdgpu_device_supports_baco - Does the device support BACO
 *
 * @dev: drm_device pointer
 *
 * Return:
 * 1 if the device supports BACO;
 * 3 if the device supports MACO (only works if BACO is supported);
 * otherwise return 0.
 */
int amdgpu_device_supports_baco(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        return amdgpu_asic_supports_baco(adev);
}
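
/*
 * Illustrative sketch (not part of the driver): the return value is a bit
 * mask, so callers test the BACO_SUPPORT/MACO_SUPPORT bits rather than
 * comparing for equality, e.g.:
 *
 *   int caps = amdgpu_device_supports_baco(dev);
 *
 *   if (caps & MACO_SUPPORT)
 *           ...BAMACO is possible...
 *   else if (caps & BACO_SUPPORT)
 *           ...plain BACO only...
 */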

void amdgpu_device_detect_runtime_pm_mode(struct amdgpu_device *adev)
{
        struct drm_device *dev;
        int bamaco_support;

        dev = adev_to_drm(adev);

        adev->pm.rpm_mode = AMDGPU_RUNPM_NONE;
        bamaco_support = amdgpu_device_supports_baco(dev);

        switch (amdgpu_runtime_pm) {
        case 2:
                if (bamaco_support & MACO_SUPPORT) {
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BAMACO;
                        dev_info(adev->dev, "Forcing BAMACO for runtime pm\n");
                } else if (bamaco_support == BACO_SUPPORT) {
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                        dev_info(adev->dev, "Requested mode BAMACO not available, falling back to BACO\n");
                }
                break;
        case 1:
                if (bamaco_support & BACO_SUPPORT) {
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                        dev_info(adev->dev, "Forcing BACO for runtime pm\n");
                }
                break;
        case -1:
        case -2:
                if (amdgpu_device_supports_px(dev)) { /* enable PX as runtime mode */
                        adev->pm.rpm_mode = AMDGPU_RUNPM_PX;
                        dev_info(adev->dev, "Using ATPX for runtime pm\n");
                } else if (amdgpu_device_supports_boco(dev)) { /* enable boco as runtime mode */
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BOCO;
                        dev_info(adev->dev, "Using BOCO for runtime pm\n");
                } else {
                        if (!bamaco_support)
                                goto no_runtime_pm;

                        switch (adev->asic_type) {
                        case CHIP_VEGA20:
                        case CHIP_ARCTURUS:
                                /* BACO is not supported on vega20 and arcturus */
                                break;
                        case CHIP_VEGA10:
                                /* enable BACO as runpm mode if noretry=0 */
                                if (!adev->gmc.noretry)
                                        adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                                break;
                        default:
                                /* enable BACO as runpm mode on CI+ */
                                adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                                break;
                        }

                        if (adev->pm.rpm_mode == AMDGPU_RUNPM_BACO) {
                                if (bamaco_support & MACO_SUPPORT) {
                                        adev->pm.rpm_mode = AMDGPU_RUNPM_BAMACO;
                                        dev_info(adev->dev, "Using BAMACO for runtime pm\n");
                                } else {
                                        dev_info(adev->dev, "Using BACO for runtime pm\n");
                                }
                        }
                }
                break;
        case 0:
                dev_info(adev->dev, "runtime pm is manually disabled\n");
                break;
        default:
                break;
        }

no_runtime_pm:
        if (adev->pm.rpm_mode == AMDGPU_RUNPM_NONE)
                dev_info(adev->dev, "Runtime PM not available\n");
}
/**
 * amdgpu_device_supports_smart_shift - Is the device dGPU with
 * smart shift support
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with Smart Shift support,
 * otherwise returns false.
 */
bool amdgpu_device_supports_smart_shift(struct drm_device *dev)
{
        return (amdgpu_device_supports_boco(dev) &&
                amdgpu_acpi_is_power_shift_control_supported());
}

/*
 * VRAM access helper functions
 */

/**
 * amdgpu_device_mm_access - access vram by MM_INDEX/MM_DATA
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; @buf must be at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 */
void amdgpu_device_mm_access(struct amdgpu_device *adev, loff_t pos,
                             void *buf, size_t size, bool write)
{
        unsigned long flags;
        uint32_t hi = ~0, tmp = 0;
        uint32_t *data = buf;
        uint64_t last;
        int idx;

        if (!drm_dev_enter(adev_to_drm(adev), &idx))
                return;

        BUG_ON(!IS_ALIGNED(pos, 4) || !IS_ALIGNED(size, 4));

        spin_lock_irqsave(&adev->mmio_idx_lock, flags);
        for (last = pos + size; pos < last; pos += 4) {
                tmp = pos >> 31;

                WREG32_NO_KIQ(mmMM_INDEX, ((uint32_t)pos) | 0x80000000);
                if (tmp != hi) {
                        WREG32_NO_KIQ(mmMM_INDEX_HI, tmp);
                        hi = tmp;
                }
                if (write)
                        WREG32_NO_KIQ(mmMM_DATA, *data++);
                else
                        *data++ = RREG32_NO_KIQ(mmMM_DATA);
        }

        spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
        drm_dev_exit(idx);
}

/**
 * amdgpu_device_aper_access - access vram by vram aperture
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; @buf must be at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 *
 * Returns the number of bytes that have been transferred.
 */
size_t amdgpu_device_aper_access(struct amdgpu_device *adev, loff_t pos,
                                 void *buf, size_t size, bool write)
{
#ifdef CONFIG_64BIT
        void __iomem *addr;
        size_t count = 0;
        uint64_t last;

        if (!adev->mman.aper_base_kaddr)
                return 0;

        last = min(pos + size, adev->gmc.visible_vram_size);
        if (last > pos) {
                addr = adev->mman.aper_base_kaddr + pos;
                count = last - pos;

                if (write) {
                        memcpy_toio(addr, buf, count);
                        /* Make sure HDP write cache flush happens without any reordering
                         * after the system memory contents are sent over PCIe device
                         */
                        mb();
                        amdgpu_device_flush_hdp(adev, NULL);
                } else {
                        amdgpu_device_invalidate_hdp(adev, NULL);
                        /* Make sure HDP read cache is invalidated before issuing a read
                         * to the PCIe device
                         */
                        mb();
                        memcpy_fromio(buf, addr, count);
                }

        }

        return count;
#else
        return 0;
#endif
}

/**
 * amdgpu_device_vram_access - read/write a buffer in vram
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; @buf must be at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 */
void amdgpu_device_vram_access(struct amdgpu_device *adev, loff_t pos,
                               void *buf, size_t size, bool write)
{
        size_t count;

        /* try using the VRAM aperture to access VRAM first */
        count = amdgpu_device_aper_access(adev, pos, buf, size, write);
        size -= count;
        if (size) {
                /* use MM access for the rest of VRAM */
                pos += count;
                buf += count;
                amdgpu_device_mm_access(adev, pos, buf, size, write);
        }
}
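
/*
 * Illustrative sketch (not part of the driver): reading one dword at a
 * 4-byte aligned VRAM offset through the combined helper, e.g.:
 *
 *   u32 val;
 *
 *   amdgpu_device_vram_access(adev, offset, &val, sizeof(val), false);
 */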

/*
 * register access helper functions.
 */

/* Check if hw access should be skipped because of hotplug or device error */
bool amdgpu_device_skip_hw_access(struct amdgpu_device *adev)
{
        if (adev->no_hw_access)
                return true;

#ifdef CONFIG_LOCKDEP
        /*
         * This is a bit complicated to understand, so worth a comment. What we assert
         * here is that the GPU reset is not running on another thread in parallel.
         *
         * For this we trylock the read side of the reset semaphore, if that succeeds
         * we know that the reset is not running in parallel.
         *
         * If the trylock fails we assert that we are either already holding the read
         * side of the lock or are the reset thread itself and hold the write side of
         * the lock.
         */
        if (in_task()) {
                if (down_read_trylock(&adev->reset_domain->sem))
                        up_read(&adev->reset_domain->sem);
                else
                        lockdep_assert_held(&adev->reset_domain->sem);
        }
#endif
        return false;
}
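
/*
 * Illustrative sketch (not part of the driver): every register accessor in
 * this file gates its hardware touches on this check, e.g.:
 *
 *   if (amdgpu_device_skip_hw_access(adev))
 *           return 0;
 */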

/**
 * amdgpu_device_rreg - read a memory mapped IO or indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @acc_flags: access flags which require special behavior
 *
 * Returns the 32 bit value from the offset specified.
 */
uint32_t amdgpu_device_rreg(struct amdgpu_device *adev,
                            uint32_t reg, uint32_t acc_flags)
{
        uint32_t ret;

        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if ((reg * 4) < adev->rmmio_size) {
                if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        ret = amdgpu_kiq_rreg(adev, reg, 0);
                        up_read(&adev->reset_domain->sem);
                } else {
                        ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                ret = adev->pcie_rreg(adev, reg * 4);
        }

        trace_amdgpu_device_rreg(adev->pdev->device, reg, ret);

        return ret;
}

/*
 * MMIO register read with bytes helper functions
 * @offset: byte offset from MMIO start
 */

/**
 * amdgpu_mm_rreg8 - read a memory mapped IO register
 *
 * @adev: amdgpu_device pointer
 * @offset: byte aligned register offset
 *
 * Returns the 8 bit value from the offset specified.
 */
uint8_t amdgpu_mm_rreg8(struct amdgpu_device *adev, uint32_t offset)
{
        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if (offset < adev->rmmio_size)
                return (readb(adev->rmmio + offset));
        BUG();
}


/**
 * amdgpu_device_xcc_rreg - read a memory mapped IO or indirect register with specific XCC
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @acc_flags: access flags which require special behavior
 * @xcc_id: xcc accelerated compute core id
 *
 * Returns the 32 bit value from the offset specified.
 */
uint32_t amdgpu_device_xcc_rreg(struct amdgpu_device *adev,
                                uint32_t reg, uint32_t acc_flags,
                                uint32_t xcc_id)
{
        uint32_t ret, rlcg_flag;

        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if ((reg * 4) < adev->rmmio_size) {
                if (amdgpu_sriov_vf(adev) &&
                    !amdgpu_sriov_runtime(adev) &&
                    adev->gfx.rlc.rlcg_reg_access_supported &&
                    amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags,
                                                         GC_HWIP, false,
                                                         &rlcg_flag)) {
                        ret = amdgpu_virt_rlcg_reg_rw(adev, reg, 0, rlcg_flag, GET_INST(GC, xcc_id));
                } else if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        ret = amdgpu_kiq_rreg(adev, reg, xcc_id);
                        up_read(&adev->reset_domain->sem);
                } else {
                        ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                ret = adev->pcie_rreg(adev, reg * 4);
        }

        return ret;
}

/*
 * MMIO register write with bytes helper functions
 * @offset: byte offset from MMIO start
 * @value: the value to be written to the register
 */

/**
 * amdgpu_mm_wreg8 - write a memory mapped IO register
 *
 * @adev: amdgpu_device pointer
 * @offset: byte aligned register offset
 * @value: 8 bit value to write
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_mm_wreg8(struct amdgpu_device *adev, uint32_t offset, uint8_t value)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (offset < adev->rmmio_size)
                writeb(value, adev->rmmio + offset);
        else
                BUG();
}

/**
 * amdgpu_device_wreg - write to a memory mapped IO or indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @v: 32 bit value to write to the register
 * @acc_flags: access flags which require special behavior
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_device_wreg(struct amdgpu_device *adev,
                        uint32_t reg, uint32_t v,
                        uint32_t acc_flags)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if ((reg * 4) < adev->rmmio_size) {
                if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        amdgpu_kiq_wreg(adev, reg, v, 0);
                        up_read(&adev->reset_domain->sem);
                } else {
                        writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                adev->pcie_wreg(adev, reg * 4, v);
        }

        trace_amdgpu_device_wreg(adev->pdev->device, reg, v);
}
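
/*
 * Illustrative sketch (not part of the driver): a read-modify-write of a
 * dword register through the paired helpers; reg, mask, and val are
 * hypothetical, e.g.:
 *
 *   u32 tmp = amdgpu_device_rreg(adev, reg, 0);
 *
 *   tmp = (tmp & ~mask) | (val & mask);
 *   amdgpu_device_wreg(adev, reg, tmp, 0);
 */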

/**
 * amdgpu_mm_wreg_mmio_rlc - write register either with direct/indirect mmio or with RLC path if in range
 *
 * @adev: amdgpu_device pointer
 * @reg: mmio/rlc register
 * @v: value to write
 * @xcc_id: xcc accelerated compute core id
 *
 * This function is invoked only for debugfs register access.
 */
void amdgpu_mm_wreg_mmio_rlc(struct amdgpu_device *adev,
                             uint32_t reg, uint32_t v,
                             uint32_t xcc_id)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (amdgpu_sriov_fullaccess(adev) &&
            adev->gfx.rlc.funcs &&
            adev->gfx.rlc.funcs->is_rlcg_access_range) {
                if (adev->gfx.rlc.funcs->is_rlcg_access_range(adev, reg))
                        return amdgpu_sriov_wreg(adev, reg, v, 0, 0, xcc_id);
        } else if ((reg * 4) >= adev->rmmio_size) {
                adev->pcie_wreg(adev, reg * 4, v);
        } else {
                writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
        }
}

/**
 * amdgpu_device_xcc_wreg - write to a memory mapped IO or indirect register with specific XCC
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @v: 32 bit value to write to the register
 * @acc_flags: access flags which require special behavior
 * @xcc_id: xcc accelerated compute core id
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_device_xcc_wreg(struct amdgpu_device *adev,
                        uint32_t reg, uint32_t v,
                        uint32_t acc_flags, uint32_t xcc_id)
{
        uint32_t rlcg_flag;

        if (amdgpu_device_skip_hw_access(adev))
                return;

        if ((reg * 4) < adev->rmmio_size) {
                if (amdgpu_sriov_vf(adev) &&
                    !amdgpu_sriov_runtime(adev) &&
                    adev->gfx.rlc.rlcg_reg_access_supported &&
                    amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags,
                                                         GC_HWIP, true,
                                                         &rlcg_flag)) {
                        amdgpu_virt_rlcg_reg_rw(adev, reg, v, rlcg_flag, GET_INST(GC, xcc_id));
                } else if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        amdgpu_kiq_wreg(adev, reg, v, xcc_id);
                        up_read(&adev->reset_domain->sem);
                } else {
                        writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                adev->pcie_wreg(adev, reg * 4, v);
        }
}

/**
 * amdgpu_device_indirect_rreg - read an indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register address to read from
 *
 * Returns the value of indirect register @reg_addr
 */
u32 amdgpu_device_indirect_rreg(struct amdgpu_device *adev,
                                u32 reg_addr)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;
        u32 r;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        r = readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

u32 amdgpu_device_indirect_rreg_ext(struct amdgpu_device *adev,
                                    u64 reg_addr)
{
        unsigned long flags, pcie_index, pcie_index_hi, pcie_data;
        u32 r;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;

        if (unlikely(!adev->nbio.funcs)) {
                pcie_index = AMDGPU_PCIE_INDEX_FALLBACK;
                pcie_data = AMDGPU_PCIE_DATA_FALLBACK;
        } else {
                pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
                pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        }

        if (reg_addr >> 32) {
                if (unlikely(!adev->nbio.funcs))
                        pcie_index_hi = AMDGPU_PCIE_INDEX_HI_FALLBACK;
                else
                        pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
        } else {
                pcie_index_hi = 0;
        }

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                                pcie_index_hi * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        r = readl(pcie_data_offset);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

/**
 * amdgpu_device_indirect_rreg64 - read a 64-bit indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register address to read from
 *
 * Returns the value of indirect register @reg_addr
 */
u64 amdgpu_device_indirect_rreg64(struct amdgpu_device *adev,
                                  u32 reg_addr)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;
        u64 r;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        /* read low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        r = readl(pcie_data_offset);
        /* read high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        r |= ((u64)readl(pcie_data_offset) << 32);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

u64 amdgpu_device_indirect_rreg64_ext(struct amdgpu_device *adev,
                                  u64 reg_addr)
{
        unsigned long flags, pcie_index, pcie_data;
        unsigned long pcie_index_hi = 0;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;
        u64 r;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
                pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                        pcie_index_hi * 4;

        /* read low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        r = readl(pcie_data_offset);
        /* read high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        r |= ((u64)readl(pcie_data_offset) << 32);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

/**
 * amdgpu_device_indirect_wreg - write an indirect register address
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register offset
 * @reg_data: indirect register data
 *
 */
void amdgpu_device_indirect_wreg(struct amdgpu_device *adev,
                                 u32 reg_addr, u32 reg_data)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        writel(reg_data, pcie_data_offset);
        readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}
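
/*
 * Illustrative sketch (not part of the driver): with the index/data pair
 * hidden behind the helpers, an indirect read-modify-write is a simple
 * two-step sequence (reg_addr and bit are hypothetical), e.g.:
 *
 *   u32 v = amdgpu_device_indirect_rreg(adev, reg_addr);
 *
 *   amdgpu_device_indirect_wreg(adev, reg_addr, v | bit);
 */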

void amdgpu_device_indirect_wreg_ext(struct amdgpu_device *adev,
                                     u64 reg_addr, u32 reg_data)
{
        unsigned long flags, pcie_index, pcie_index_hi, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
                pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
        else
                pcie_index_hi = 0;

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                                pcie_index_hi * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        writel(reg_data, pcie_data_offset);
        readl(pcie_data_offset);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

/**
 * amdgpu_device_indirect_wreg64 - write a 64-bit indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register offset
 * @reg_data: indirect register data
 *
 */
void amdgpu_device_indirect_wreg64(struct amdgpu_device *adev,
                                   u32 reg_addr, u64 reg_data)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        /* write low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
        readl(pcie_data_offset);
        /* write high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        writel((u32)(reg_data >> 32), pcie_data_offset);
        readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

void amdgpu_device_indirect_wreg64_ext(struct amdgpu_device *adev,
                                   u64 reg_addr, u64 reg_data)
{
        unsigned long flags, pcie_index, pcie_data;
        unsigned long pcie_index_hi = 0;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
                pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                                pcie_index_hi * 4;

        /* write low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
        readl(pcie_data_offset);
        /* write high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        writel((u32)(reg_data >> 32), pcie_data_offset);
        readl(pcie_data_offset);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

/**
 * amdgpu_device_get_rev_id - query device rev_id
 *
 * @adev: amdgpu_device pointer
 *
 * Return device rev_id
 */
u32 amdgpu_device_get_rev_id(struct amdgpu_device *adev)
{
        return adev->nbio.funcs->get_rev_id(adev);
}

/**
 * amdgpu_invalid_rreg - dummy reg read function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint32_t amdgpu_invalid_rreg(struct amdgpu_device *adev, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%04X\n", reg);
        BUG();
        return 0;
}

static uint32_t amdgpu_invalid_rreg_ext(struct amdgpu_device *adev, uint64_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%llX\n", reg);
        BUG();
        return 0;
}

/**
 * amdgpu_invalid_wreg - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_invalid_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
{
        DRM_ERROR("Invalid callback to write register 0x%04X with 0x%08X\n",
                  reg, v);
        BUG();
}

static void amdgpu_invalid_wreg_ext(struct amdgpu_device *adev, uint64_t reg, uint32_t v)
{
        DRM_ERROR("Invalid callback to write register 0x%llX with 0x%08X\n",
                  reg, v);
        BUG();
}

/**
 * amdgpu_invalid_rreg64 - dummy 64 bit reg read function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint64_t amdgpu_invalid_rreg64(struct amdgpu_device *adev, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read 64 bit register 0x%04X\n", reg);
        BUG();
        return 0;
}

static uint64_t amdgpu_invalid_rreg64_ext(struct amdgpu_device *adev, uint64_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%llX\n", reg);
        BUG();
        return 0;
}

/**
 * amdgpu_invalid_wreg64 - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_invalid_wreg64(struct amdgpu_device *adev, uint32_t reg, uint64_t v)
{
        DRM_ERROR("Invalid callback to write 64 bit register 0x%04X with 0x%08llX\n",
                  reg, v);
        BUG();
}

static void amdgpu_invalid_wreg64_ext(struct amdgpu_device *adev, uint64_t reg, uint64_t v)
{
        DRM_ERROR("Invalid callback to write 64 bit register 0x%llX with 0x%08llX\n",
                  reg, v);
        BUG();
}

/**
 * amdgpu_block_invalid_rreg - dummy reg read function
 *
 * @adev: amdgpu_device pointer
 * @block: offset of instance
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint32_t amdgpu_block_invalid_rreg(struct amdgpu_device *adev,
                                          uint32_t block, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%04X in block 0x%04X\n",
                  reg, block);
        BUG();
        return 0;
}

/**
 * amdgpu_block_invalid_wreg - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @block: offset of instance
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_block_invalid_wreg(struct amdgpu_device *adev,
                                      uint32_t block,
                                      uint32_t reg, uint32_t v)
{
        DRM_ERROR("Invalid block callback to write register 0x%04X in block 0x%04X with 0x%08X\n",
                  reg, block, v);
        BUG();
}

/**
 * amdgpu_device_asic_init - Wrapper for atom asic_init
 *
 * @adev: amdgpu_device pointer
 *
 * Does any asic specific work and then calls atom asic init.
 */
static int amdgpu_device_asic_init(struct amdgpu_device *adev)
{
        int ret;

        amdgpu_asic_pre_asic_init(adev);

        if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
            amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4) ||
            amdgpu_ip_version(adev, GC_HWIP, 0) >= IP_VERSION(11, 0, 0)) {
                amdgpu_psp_wait_for_bootloader(adev);
                ret = amdgpu_atomfirmware_asic_init(adev, true);
                return ret;
        }

        return amdgpu_atom_asic_init(adev->mode_info.atom_context);
}

/**
 * amdgpu_device_mem_scratch_init - allocate the VRAM scratch page
 *
 * @adev: amdgpu_device pointer
 *
 * Allocates a scratch page of VRAM for use by various things in the
 * driver.
 */
static int amdgpu_device_mem_scratch_init(struct amdgpu_device *adev)
{
        return amdgpu_bo_create_kernel(adev, AMDGPU_GPU_PAGE_SIZE, PAGE_SIZE,
                                       AMDGPU_GEM_DOMAIN_VRAM |
                                       AMDGPU_GEM_DOMAIN_GTT,
                                       &adev->mem_scratch.robj,
                                       &adev->mem_scratch.gpu_addr,
                                       (void **)&adev->mem_scratch.ptr);
}

/**
 * amdgpu_device_mem_scratch_fini - Free the VRAM scratch page
 *
 * @adev: amdgpu_device pointer
 *
 * Frees the VRAM scratch page.
 */
static void amdgpu_device_mem_scratch_fini(struct amdgpu_device *adev)
{
        amdgpu_bo_free_kernel(&adev->mem_scratch.robj, NULL, NULL);
}

/**
 * amdgpu_device_program_register_sequence - program an array of registers.
 *
 * @adev: amdgpu_device pointer
 * @registers: pointer to the register array
 * @array_size: size of the register array
 *
 * Programs an array of registers with AND/OR masks.
 * This is a helper for setting golden registers.
 */
void amdgpu_device_program_register_sequence(struct amdgpu_device *adev,
                                             const u32 *registers,
                                             const u32 array_size)
{
        u32 tmp, reg, and_mask, or_mask;
        int i;

        if (array_size % 3)
                return;

        for (i = 0; i < array_size; i += 3) {
                reg = registers[i + 0];
                and_mask = registers[i + 1];
                or_mask = registers[i + 2];

                if (and_mask == 0xffffffff) {
                        tmp = or_mask;
                } else {
                        tmp = RREG32(reg);
                        tmp &= ~and_mask;
                        if (adev->family >= AMDGPU_FAMILY_AI)
                                tmp |= (or_mask & and_mask);
                        else
                                tmp |= or_mask;
                }
                WREG32(reg, tmp);
        }
}
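
/*
 * Illustrative sketch (not part of the driver): the register array is a
 * flat list of {offset, and_mask, or_mask} triplets; an and_mask of
 * 0xffffffff writes or_mask directly. The register names below are made
 * up for the example:
 *
 *   static const u32 example_golden_regs[] = {
 *           mmEXAMPLE_REG_A, 0xffffffff, 0x00000001,
 *           mmEXAMPLE_REG_B, 0x0000ff00, 0x00002a00,
 *   };
 *
 *   amdgpu_device_program_register_sequence(adev, example_golden_regs,
 *                                           ARRAY_SIZE(example_golden_regs));
 */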

/**
 * amdgpu_device_pci_config_reset - reset the GPU
 *
 * @adev: amdgpu_device pointer
 *
 * Resets the GPU using the pci config reset sequence.
 * Only applicable to asics prior to vega10.
 */
void amdgpu_device_pci_config_reset(struct amdgpu_device *adev)
{
        pci_write_config_dword(adev->pdev, 0x7c, AMDGPU_ASIC_RESET_DATA);
}

/**
 * amdgpu_device_pci_reset - reset the GPU using generic PCI means
 *
 * @adev: amdgpu_device pointer
 *
 * Resets the GPU using generic pci reset interfaces (FLR, SBR, etc.).
 */
int amdgpu_device_pci_reset(struct amdgpu_device *adev)
{
        return pci_reset_function(adev->pdev);
}

/*
 * amdgpu_device_wb_*()
 * Writeback is the method by which the GPU updates special pages in memory
 * with the status of certain GPU events (fences, ring pointers, etc.).
 */

/**
 * amdgpu_device_wb_fini - Disable Writeback and free memory
 *
 * @adev: amdgpu_device pointer
 *
 * Disables Writeback and frees the Writeback memory (all asics).
 * Used at driver shutdown.
 */
static void amdgpu_device_wb_fini(struct amdgpu_device *adev)
{
        if (adev->wb.wb_obj) {
                amdgpu_bo_free_kernel(&adev->wb.wb_obj,
                                      &adev->wb.gpu_addr,
                                      (void **)&adev->wb.wb);
                adev->wb.wb_obj = NULL;
        }
}

/**
 * amdgpu_device_wb_init - Init Writeback driver info and allocate memory
 *
 * @adev: amdgpu_device pointer
 *
 * Initializes writeback and allocates writeback memory (all asics).
 * Used at driver startup.
1541  * Returns 0 on success or a negative error code on failure.
1542  */
1543 static int amdgpu_device_wb_init(struct amdgpu_device *adev)
1544 {
1545         int r;
1546
1547         if (adev->wb.wb_obj == NULL) {
1548                 /* AMDGPU_MAX_WB * sizeof(uint32_t) * 8 = AMDGPU_MAX_WB 256bit slots */
1549                 r = amdgpu_bo_create_kernel(adev, AMDGPU_MAX_WB * sizeof(uint32_t) * 8,
1550                                             PAGE_SIZE, AMDGPU_GEM_DOMAIN_GTT,
1551                                             &adev->wb.wb_obj, &adev->wb.gpu_addr,
1552                                             (void **)&adev->wb.wb);
1553                 if (r) {
1554                         dev_warn(adev->dev, "(%d) create WB bo failed\n", r);
1555                         return r;
1556                 }
1557
1558                 adev->wb.num_wb = AMDGPU_MAX_WB;
1559                 memset(&adev->wb.used, 0, sizeof(adev->wb.used));
1560
1561                 /* clear wb memory */
1562                 memset((char *)adev->wb.wb, 0, AMDGPU_MAX_WB * sizeof(uint32_t) * 8);
1563         }
1564
1565         return 0;
1566 }
1567
1568 /**
1569  * amdgpu_device_wb_get - Allocate a wb entry
1570  *
1571  * @adev: amdgpu_device pointer
1572  * @wb: wb index
1573  *
1574  * Allocate a wb slot for use by the driver (all asics).
1575  * Returns 0 on success or -EINVAL on failure.
1576  */
1577 int amdgpu_device_wb_get(struct amdgpu_device *adev, u32 *wb)
1578 {
1579         unsigned long flags, offset;
1580
1581         spin_lock_irqsave(&adev->wb.lock, flags);
1582         offset = find_first_zero_bit(adev->wb.used, adev->wb.num_wb);
1583         if (offset < adev->wb.num_wb) {
1584                 __set_bit(offset, adev->wb.used);
1585                 spin_unlock_irqrestore(&adev->wb.lock, flags);
1586                 *wb = offset << 3; /* convert to dw offset */
1587                 return 0;
1588         } else {
1589                 spin_unlock_irqrestore(&adev->wb.lock, flags);
1590                 return -EINVAL;
1591         }
1592 }
1593
1594 /**
1595  * amdgpu_device_wb_free - Free a wb entry
1596  *
1597  * @adev: amdgpu_device pointer
1598  * @wb: wb index
1599  *
1600  * Free a wb slot allocated for use by the driver (all asics)
1601  */
1602 void amdgpu_device_wb_free(struct amdgpu_device *adev, u32 wb)
1603 {
1604         unsigned long flags;
1605
1606         wb >>= 3;
1607         spin_lock_irqsave(&adev->wb.lock, flags);
1608         if (wb < adev->wb.num_wb)
1609                 __clear_bit(wb, adev->wb.used);
1610         spin_unlock_irqrestore(&adev->wb.lock, flags);
1611 }
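
/*
 * Usage sketch (illustrative only): each writeback slot is 256 bits wide
 * (8 dwords), which is why amdgpu_device_wb_get() converts the slot index
 * to a dword offset with "<< 3" and amdgpu_device_wb_free() undoes it with
 * ">> 3".  The CPU view of an entry is adev->wb.wb[wb] and the matching
 * GPU address is adev->wb.gpu_addr + wb * 4.
 */
static int __maybe_unused amdgpu_device_wb_example(struct amdgpu_device *adev)
{
        u64 wb_gpu_addr;
        u32 wb;
        int r;

        r = amdgpu_device_wb_get(adev, &wb);
        if (r)
                return r;

        adev->wb.wb[wb] = 0;                            /* CPU-side init */
        wb_gpu_addr = adev->wb.gpu_addr + wb * 4;       /* address a ring or fence could write to */
        (void)wb_gpu_addr;

        amdgpu_device_wb_free(adev, wb);
        return 0;
}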
1612
1613 /**
1614  * amdgpu_device_resize_fb_bar - try to resize FB BAR
1615  *
1616  * @adev: amdgpu_device pointer
1617  *
1618  * Try to resize FB BAR to make all VRAM CPU accessible. We try very hard not
1619  * to fail, but if any of the BARs is not accessible after the resize we abort
1620  * driver loading by returning -ENODEV.
1621  */
1622 int amdgpu_device_resize_fb_bar(struct amdgpu_device *adev)
1623 {
1624         int rbar_size = pci_rebar_bytes_to_size(adev->gmc.real_vram_size);
1625         struct pci_bus *root;
1626         struct resource *res;
1627         unsigned int i;
1628         u16 cmd;
1629         int r;
1630
1631         if (!IS_ENABLED(CONFIG_PHYS_ADDR_T_64BIT))
1632                 return 0;
1633
1634         /* Bypass for VF */
1635         if (amdgpu_sriov_vf(adev))
1636                 return 0;
1637
1638         /* PCI_EXT_CAP_ID_VNDR extended capability is located at 0x100 */
1639         if (!pci_find_ext_capability(adev->pdev, PCI_EXT_CAP_ID_VNDR))
1640                 DRM_WARN("System can't access extended configuration space, please check!!\n");
1641
1642         /* skip if the bios has already enabled large BAR */
1643         if (adev->gmc.real_vram_size &&
1644             (pci_resource_len(adev->pdev, 0) >= adev->gmc.real_vram_size))
1645                 return 0;
1646
1647         /* Check if the root BUS has 64bit memory resources */
1648         root = adev->pdev->bus;
1649         while (root->parent)
1650                 root = root->parent;
1651
1652         pci_bus_for_each_resource(root, res, i) {
1653                 if (res && res->flags & (IORESOURCE_MEM | IORESOURCE_MEM_64) &&
1654                     res->start > 0x100000000ull)
1655                         break;
1656         }
1657
1658         /* Trying to resize is pointless without a root hub window above 4GB */
1659         if (!res)
1660                 return 0;
1661
1662         /* Limit the BAR size to what is available */
1663         rbar_size = min(fls(pci_rebar_get_possible_sizes(adev->pdev, 0)) - 1,
1664                         rbar_size);
1665
1666         /* Disable memory decoding while we change the BAR addresses and size */
1667         pci_read_config_word(adev->pdev, PCI_COMMAND, &cmd);
1668         pci_write_config_word(adev->pdev, PCI_COMMAND,
1669                               cmd & ~PCI_COMMAND_MEMORY);
1670
1671         /* Free the VRAM and doorbell BAR, we most likely need to move both. */
1672         amdgpu_doorbell_fini(adev);
1673         if (adev->asic_type >= CHIP_BONAIRE)
1674                 pci_release_resource(adev->pdev, 2);
1675
1676         pci_release_resource(adev->pdev, 0);
1677
1678         r = pci_resize_resource(adev->pdev, 0, rbar_size);
1679         if (r == -ENOSPC)
1680                 DRM_INFO("Not enough PCI address space for a large BAR.");
1681         else if (r && r != -ENOTSUPP)
1682                 DRM_ERROR("Problem resizing BAR0 (%d).", r);
1683
1684         pci_assign_unassigned_bus_resources(adev->pdev->bus);
1685
1686         /* When the doorbell or fb BAR isn't available we have no chance of
1687          * using the device.
1688          */
1689         r = amdgpu_doorbell_init(adev);
1690         if (r || (pci_resource_flags(adev->pdev, 0) & IORESOURCE_UNSET))
1691                 return -ENODEV;
1692
1693         pci_write_config_word(adev->pdev, PCI_COMMAND, cmd);
1694
1695         return 0;
1696 }
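
/*
 * Note on rbar_size units (an aside, based on the PCIe resizable-BAR
 * encoding used by pci_rebar_bytes_to_size(): log2(bytes) - 20): 256MB -> 8,
 * 1GB -> 10, 8GB -> 13.  The min() above therefore clamps the size needed to
 * cover real_vram_size to the largest size the device actually supports.
 */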
1697
1698 static bool amdgpu_device_read_bios(struct amdgpu_device *adev)
1699 {
1700         if (hweight32(adev->aid_mask) && (adev->flags & AMD_IS_APU))
1701                 return false;
1702
1703         return true;
1704 }
1705
1706 /*
1707  * GPU helpers function.
1708  */
1709 /**
1710  * amdgpu_device_need_post - check if the hw need post or not
1711  *
1712  * @adev: amdgpu_device pointer
1713  *
1714  * Check if the asic has been initialized (all asics) at driver startup,
1715  * or if post is needed because a hw reset was performed.
1716  * Returns true if post is needed, false if not.
1717  */
1718 bool amdgpu_device_need_post(struct amdgpu_device *adev)
1719 {
1720         uint32_t reg;
1721
1722         if (amdgpu_sriov_vf(adev))
1723                 return false;
1724
1725         if (!amdgpu_device_read_bios(adev))
1726                 return false;
1727
1728         if (amdgpu_passthrough(adev)) {
1729                 /* for FIJI: in the whole-GPU pass-through virtualization case, after a
1730                  * VM reboot some old SMC firmware still needs the driver to do a vPost,
1731                  * otherwise the GPU hangs; SMC firmware 22.15 and newer doesn't have
1732                  * this flaw, so we force a vPost for SMC versions below 22.15
1733                  */
1734                 if (adev->asic_type == CHIP_FIJI) {
1735                         int err;
1736                         uint32_t fw_ver;
1737
1738                         err = request_firmware(&adev->pm.fw, "amdgpu/fiji_smc.bin", adev->dev);
1739                         /* force vPost if an error occurred */
1740                         if (err)
1741                                 return true;
1742
1743                         fw_ver = *((uint32_t *)adev->pm.fw->data + 69);
1744                         release_firmware(adev->pm.fw);
1745                         if (fw_ver < 0x00160e00)
1746                                 return true;
1747                 }
1748         }
1749
1750         /* Don't post if we need to reset whole hive on init */
1751         if (adev->init_lvl->level == AMDGPU_INIT_LEVEL_MINIMAL_XGMI)
1752                 return false;
1753
1754         if (adev->has_hw_reset) {
1755                 adev->has_hw_reset = false;
1756                 return true;
1757         }
1758
1759         /* bios scratch used on CIK+ */
1760         if (adev->asic_type >= CHIP_BONAIRE)
1761                 return amdgpu_atombios_scratch_need_asic_init(adev);
1762
1763         /* check MEM_SIZE for older asics */
1764         reg = amdgpu_asic_get_config_memsize(adev);
1765
1766         if ((reg != 0) && (reg != 0xffffffff))
1767                 return false;
1768
1769         return true;
1770 }
1771
1772 /*
1773  * Check whether seamless boot is supported.
1774  *
1775  * So far we only support seamless boot on DCE 3.0 or later.
1776  * If users report that it works on older ASICs as well, we may
1777  * loosen this.
1778  */
1779 bool amdgpu_device_seamless_boot_supported(struct amdgpu_device *adev)
1780 {
1781         switch (amdgpu_seamless) {
1782         case -1:
1783                 break;
1784         case 1:
1785                 return true;
1786         case 0:
1787                 return false;
1788         default:
1789                 DRM_ERROR("Invalid value for amdgpu.seamless: %d\n",
1790                           amdgpu_seamless);
1791                 return false;
1792         }
1793
1794         if (!(adev->flags & AMD_IS_APU))
1795                 return false;
1796
1797         if (adev->mman.keep_stolen_vga_memory)
1798                 return false;
1799
1800         return amdgpu_ip_version(adev, DCE_HWIP, 0) >= IP_VERSION(3, 0, 0);
1801 }
1802
1803 /*
1804  * Intel hosts such as Rocket Lake, Alder Lake, Raptor Lake and Sapphire Rapids
1805  * don't support dynamic speed switching. Until we have confirmation from Intel
1806  * that a specific host supports it, it's safer that we keep it disabled for all.
1807  *
1808  * https://edc.intel.com/content/www/us/en/design/products/platforms/details/raptor-lake-s/13th-generation-core-processors-datasheet-volume-1-of-2/005/pci-express-support/
1809  * https://gitlab.freedesktop.org/drm/amd/-/issues/2663
1810  */
1811 static bool amdgpu_device_pcie_dynamic_switching_supported(struct amdgpu_device *adev)
1812 {
1813 #if IS_ENABLED(CONFIG_X86)
1814         struct cpuinfo_x86 *c = &cpu_data(0);
1815
1816         /* eGPU change speeds based on USB4 fabric conditions */
1817         if (dev_is_removable(adev->dev))
1818                 return true;
1819
1820         if (c->x86_vendor == X86_VENDOR_INTEL)
1821                 return false;
1822 #endif
1823         return true;
1824 }
1825
1826 /**
1827  * amdgpu_device_should_use_aspm - check if the device should program ASPM
1828  *
1829  * @adev: amdgpu_device pointer
1830  *
1831  * Confirm whether the module parameter and pcie bridge agree that ASPM should
1832  * be set for this device.
1833  *
1834  * Returns true if it should be used or false if not.
1835  */
1836 bool amdgpu_device_should_use_aspm(struct amdgpu_device *adev)
1837 {
1838         switch (amdgpu_aspm) {
1839         case -1:
1840                 break;
1841         case 0:
1842                 return false;
1843         case 1:
1844                 return true;
1845         default:
1846                 return false;
1847         }
1848         if (adev->flags & AMD_IS_APU)
1849                 return false;
1850         if (!(adev->pm.pp_feature & PP_PCIE_DPM_MASK))
1851                 return false;
1852         return pcie_aspm_enabled(adev->pdev);
1853 }
1854
1855 /* if we get transitioned to only one device, take VGA back */
1856 /**
1857  * amdgpu_device_vga_set_decode - enable/disable vga decode
1858  *
1859  * @pdev: PCI device pointer
1860  * @state: enable/disable vga decode
1861  *
1862  * Enable/disable vga decode (all asics).
1863  * Returns VGA resource flags.
1864  */
1865 static unsigned int amdgpu_device_vga_set_decode(struct pci_dev *pdev,
1866                 bool state)
1867 {
1868         struct amdgpu_device *adev = drm_to_adev(pci_get_drvdata(pdev));
1869
1870         amdgpu_asic_set_vga_state(adev, state);
1871         if (state)
1872                 return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
1873                        VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1874         else
1875                 return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1876 }
1877
1878 /**
1879  * amdgpu_device_check_block_size - validate the vm block size
1880  *
1881  * @adev: amdgpu_device pointer
1882  *
1883  * Validates the vm block size specified via module parameter.
1884  * The vm block size defines the number of bits in the page table versus the
1885  * page directory; a page is 4KB, so we have 12 bits of offset, a minimum of
1886  * 9 bits in the page table, and the remaining bits in the page directory.
1887  */
1888 static void amdgpu_device_check_block_size(struct amdgpu_device *adev)
1889 {
1890         /* defines the number of bits in the page table versus the page
1891          * directory; a page is 4KB, so we have 12 bits of offset, a minimum
1892          * of 9 bits in the page table, and the rest in the page directory
1893          */
1894         if (amdgpu_vm_block_size == -1)
1895                 return;
1896
1897         if (amdgpu_vm_block_size < 9) {
1898                 dev_warn(adev->dev, "VM page table size (%d) too small\n",
1899                          amdgpu_vm_block_size);
1900                 amdgpu_vm_block_size = -1;
1901         }
1902 }
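
/*
 * Worked example for the math above: with amdgpu_vm_block_size = 9, a page
 * table holds 2^9 = 512 entries, and since each entry maps a 4KB page, one
 * table covers 512 * 4KB = 2MB of address space; every extra bit doubles
 * that coverage (and the page table size).
 */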
1903
1904 /**
1905  * amdgpu_device_check_vm_size - validate the vm size
1906  *
1907  * @adev: amdgpu_device pointer
1908  *
1909  * Validates the vm size in GB specified via module parameter.
1910  * The VM size is the size of the GPU virtual memory space in GB.
1911  */
1912 static void amdgpu_device_check_vm_size(struct amdgpu_device *adev)
1913 {
1914         /* no need to check the default value */
1915         if (amdgpu_vm_size == -1)
1916                 return;
1917
1918         if (amdgpu_vm_size < 1) {
1919                 dev_warn(adev->dev, "VM size (%d) too small, min is 1GB\n",
1920                          amdgpu_vm_size);
1921                 amdgpu_vm_size = -1;
1922         }
1923 }
1924
1925 static void amdgpu_device_check_smu_prv_buffer_size(struct amdgpu_device *adev)
1926 {
1927         struct sysinfo si;
1928         bool is_os_64 = (sizeof(void *) == 8);
1929         uint64_t total_memory;
1930         uint64_t dram_size_seven_GB = 0x1B8000000;
1931         uint64_t dram_size_three_GB = 0xB8000000;
1932
1933         if (amdgpu_smu_memory_pool_size == 0)
1934                 return;
1935
1936         if (!is_os_64) {
1937                 DRM_WARN("Not 64-bit OS, feature not supported\n");
1938                 goto def_value;
1939         }
1940         si_meminfo(&si);
1941         total_memory = (uint64_t)si.totalram * si.mem_unit;
1942
1943         if ((amdgpu_smu_memory_pool_size == 1) ||
1944                 (amdgpu_smu_memory_pool_size == 2)) {
1945                 if (total_memory < dram_size_three_GB)
1946                         goto def_value1;
1947         } else if ((amdgpu_smu_memory_pool_size == 4) ||
1948                 (amdgpu_smu_memory_pool_size == 8)) {
1949                 if (total_memory < dram_size_seven_GB)
1950                         goto def_value1;
1951         } else {
1952                 DRM_WARN("Smu memory pool size not supported\n");
1953                 goto def_value;
1954         }
1955         adev->pm.smu_prv_buffer_size = amdgpu_smu_memory_pool_size << 28;
1956
1957         return;
1958
1959 def_value1:
1960         DRM_WARN("Not enough system memory\n");
1961 def_value:
1962         adev->pm.smu_prv_buffer_size = 0;
1963 }
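
/*
 * Note on the "<< 28" above: amdgpu_smu_memory_pool_size is expressed in
 * 256MB units, so shifting by 28 (1 << 28 bytes == 256MB) converts it to
 * bytes.  E.g. a module parameter of 2 requests a 512MB pool, which the
 * checks above gate on roughly 3GB of installed system memory.
 */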
1964
1965 static int amdgpu_device_init_apu_flags(struct amdgpu_device *adev)
1966 {
1967         if (!(adev->flags & AMD_IS_APU) ||
1968             adev->asic_type < CHIP_RAVEN)
1969                 return 0;
1970
1971         switch (adev->asic_type) {
1972         case CHIP_RAVEN:
1973                 if (adev->pdev->device == 0x15dd)
1974                         adev->apu_flags |= AMD_APU_IS_RAVEN;
1975                 if (adev->pdev->device == 0x15d8)
1976                         adev->apu_flags |= AMD_APU_IS_PICASSO;
1977                 break;
1978         case CHIP_RENOIR:
1979                 if ((adev->pdev->device == 0x1636) ||
1980                     (adev->pdev->device == 0x164c))
1981                         adev->apu_flags |= AMD_APU_IS_RENOIR;
1982                 else
1983                         adev->apu_flags |= AMD_APU_IS_GREEN_SARDINE;
1984                 break;
1985         case CHIP_VANGOGH:
1986                 adev->apu_flags |= AMD_APU_IS_VANGOGH;
1987                 break;
1988         case CHIP_YELLOW_CARP:
1989                 break;
1990         case CHIP_CYAN_SKILLFISH:
1991                 if ((adev->pdev->device == 0x13FE) ||
1992                     (adev->pdev->device == 0x143F))
1993                         adev->apu_flags |= AMD_APU_IS_CYAN_SKILLFISH2;
1994                 break;
1995         default:
1996                 break;
1997         }
1998
1999         return 0;
2000 }
2001
2002 /**
2003  * amdgpu_device_check_arguments - validate module params
2004  *
2005  * @adev: amdgpu_device pointer
2006  *
2007  * Validates certain module parameters and updates
2008  * the associated values used by the driver (all asics).
2009  */
2010 static int amdgpu_device_check_arguments(struct amdgpu_device *adev)
2011 {
2012         int i;
2013
2014         if (amdgpu_sched_jobs < 4) {
2015                 dev_warn(adev->dev, "sched jobs (%d) must be at least 4\n",
2016                          amdgpu_sched_jobs);
2017                 amdgpu_sched_jobs = 4;
2018         } else if (!is_power_of_2(amdgpu_sched_jobs)) {
2019                 dev_warn(adev->dev, "sched jobs (%d) must be a power of 2\n",
2020                          amdgpu_sched_jobs);
2021                 amdgpu_sched_jobs = roundup_pow_of_two(amdgpu_sched_jobs);
2022         }
2023
2024         if (amdgpu_gart_size != -1 && amdgpu_gart_size < 32) {
2025                 /* gart size must be greater or equal to 32M */
2026                 dev_warn(adev->dev, "gart size (%d) too small\n",
2027                          amdgpu_gart_size);
2028                 amdgpu_gart_size = -1;
2029         }
2030
2031         if (amdgpu_gtt_size != -1 && amdgpu_gtt_size < 32) {
2032                 /* gtt size must be greater or equal to 32M */
2033                 dev_warn(adev->dev, "gtt size (%d) too small\n",
2034                                  amdgpu_gtt_size);
2035                 amdgpu_gtt_size = -1;
2036         }
2037
2038         /* valid range is between 4 and 9 inclusive */
2039         if (amdgpu_vm_fragment_size != -1 &&
2040             (amdgpu_vm_fragment_size > 9 || amdgpu_vm_fragment_size < 4)) {
2041                 dev_warn(adev->dev, "valid vm fragment size range is between 4 and 9\n");
2042                 amdgpu_vm_fragment_size = -1;
2043         }
2044
2045         if (amdgpu_sched_hw_submission < 2) {
2046                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be at least 2\n",
2047                          amdgpu_sched_hw_submission);
2048                 amdgpu_sched_hw_submission = 2;
2049         } else if (!is_power_of_2(amdgpu_sched_hw_submission)) {
2050                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be a power of 2\n",
2051                          amdgpu_sched_hw_submission);
2052                 amdgpu_sched_hw_submission = roundup_pow_of_two(amdgpu_sched_hw_submission);
2053         }
2054
2055         if (amdgpu_reset_method < -1 || amdgpu_reset_method > 4) {
2056                 dev_warn(adev->dev, "invalid option for reset method, reverting to default\n");
2057                 amdgpu_reset_method = -1;
2058         }
2059
2060         amdgpu_device_check_smu_prv_buffer_size(adev);
2061
2062         amdgpu_device_check_vm_size(adev);
2063
2064         amdgpu_device_check_block_size(adev);
2065
2066         adev->firmware.load_type = amdgpu_ucode_get_load_type(adev, amdgpu_fw_load_type);
2067
2068         for (i = 0; i < MAX_XCP; i++)
2069                 adev->enforce_isolation[i] = !!enforce_isolation;
2070
2071         return 0;
2072 }
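
/*
 * E.g. (illustrative values): amdgpu.sched_jobs=2 is raised to the minimum
 * of 4, while amdgpu.sched_jobs=6 is rounded up to 8 by roundup_pow_of_two()
 * above; the hw submission count is clamped the same way with a minimum of 2.
 */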
2073
2074 /**
2075  * amdgpu_switcheroo_set_state - set switcheroo state
2076  *
2077  * @pdev: pci dev pointer
2078  * @state: vga_switcheroo state
2079  *
2080  * Callback for the switcheroo driver.  Suspends or resumes
2081  * the asics before or after it is powered up using ACPI methods.
2082  */
2083 static void amdgpu_switcheroo_set_state(struct pci_dev *pdev,
2084                                         enum vga_switcheroo_state state)
2085 {
2086         struct drm_device *dev = pci_get_drvdata(pdev);
2087         int r;
2088
2089         if (amdgpu_device_supports_px(dev) && state == VGA_SWITCHEROO_OFF)
2090                 return;
2091
2092         if (state == VGA_SWITCHEROO_ON) {
2093                 pr_info("switched on\n");
2094                 /* don't suspend or resume card normally */
2095                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
2096
2097                 pci_set_power_state(pdev, PCI_D0);
2098                 amdgpu_device_load_pci_state(pdev);
2099                 r = pci_enable_device(pdev);
2100                 if (r)
2101                         DRM_WARN("pci_enable_device failed (%d)\n", r);
2102                 amdgpu_device_resume(dev, true);
2103
2104                 dev->switch_power_state = DRM_SWITCH_POWER_ON;
2105         } else {
2106                 pr_info("switched off\n");
2107                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
2108                 amdgpu_device_prepare(dev);
2109                 amdgpu_device_suspend(dev, true);
2110                 amdgpu_device_cache_pci_state(pdev);
2111                 /* Shut down the device */
2112                 pci_disable_device(pdev);
2113                 pci_set_power_state(pdev, PCI_D3cold);
2114                 dev->switch_power_state = DRM_SWITCH_POWER_OFF;
2115         }
2116 }
2117
2118 /**
2119  * amdgpu_switcheroo_can_switch - see if switcheroo state can change
2120  *
2121  * @pdev: pci dev pointer
2122  *
2123  * Callback for the switcheroo driver.  Check if the switcheroo
2124  * state can be changed.
2125  * Returns true if the state can be changed, false if not.
2126  */
2127 static bool amdgpu_switcheroo_can_switch(struct pci_dev *pdev)
2128 {
2129         struct drm_device *dev = pci_get_drvdata(pdev);
2130
2131        /*
2132         * FIXME: open_count is protected by drm_global_mutex but that would lead to
2133         * locking inversion with the driver load path. And the access here is
2134         * completely racy anyway. So don't bother with locking for now.
2135         */
2136         return atomic_read(&dev->open_count) == 0;
2137 }
2138
2139 static const struct vga_switcheroo_client_ops amdgpu_switcheroo_ops = {
2140         .set_gpu_state = amdgpu_switcheroo_set_state,
2141         .reprobe = NULL,
2142         .can_switch = amdgpu_switcheroo_can_switch,
2143 };
2144
2145 /**
2146  * amdgpu_device_ip_set_clockgating_state - set the CG state
2147  *
2148  * @dev: amdgpu_device pointer
2149  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2150  * @state: clockgating state (gate or ungate)
2151  *
2152  * Sets the requested clockgating state for all instances of
2153  * the hardware IP specified.
2154  * Returns the error code from the last instance.
2155  */
2156 int amdgpu_device_ip_set_clockgating_state(void *dev,
2157                                            enum amd_ip_block_type block_type,
2158                                            enum amd_clockgating_state state)
2159 {
2160         struct amdgpu_device *adev = dev;
2161         int i, r = 0;
2162
2163         for (i = 0; i < adev->num_ip_blocks; i++) {
2164                 if (!adev->ip_blocks[i].status.valid)
2165                         continue;
2166                 if (adev->ip_blocks[i].version->type != block_type)
2167                         continue;
2168                 if (!adev->ip_blocks[i].version->funcs->set_clockgating_state)
2169                         continue;
2170                 r = adev->ip_blocks[i].version->funcs->set_clockgating_state(
2171                         (void *)adev, state);
2172                 if (r)
2173                         DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
2174                                   adev->ip_blocks[i].version->funcs->name, r);
2175         }
2176         return r;
2177 }
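
/*
 * Caller sketch (illustrative only): gate clocks for all GFX instances.
 * Each IP's set_clockgating_state handler decides what "gate" means for
 * its hardware.
 */
static void __maybe_unused amdgpu_device_cg_example(struct amdgpu_device *adev)
{
        int r;

        r = amdgpu_device_ip_set_clockgating_state(adev, AMD_IP_BLOCK_TYPE_GFX,
                                                   AMD_CG_STATE_GATE);
        if (r)
                dev_warn(adev->dev, "gating GFX clocks failed (%d)\n", r);
}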
2178
2179 /**
2180  * amdgpu_device_ip_set_powergating_state - set the PG state
2181  *
2182  * @dev: amdgpu_device pointer
2183  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2184  * @state: powergating state (gate or ungate)
2185  *
2186  * Sets the requested powergating state for all instances of
2187  * the hardware IP specified.
2188  * Returns the error code from the last instance.
2189  */
2190 int amdgpu_device_ip_set_powergating_state(void *dev,
2191                                            enum amd_ip_block_type block_type,
2192                                            enum amd_powergating_state state)
2193 {
2194         struct amdgpu_device *adev = dev;
2195         int i, r = 0;
2196
2197         for (i = 0; i < adev->num_ip_blocks; i++) {
2198                 if (!adev->ip_blocks[i].status.valid)
2199                         continue;
2200                 if (adev->ip_blocks[i].version->type != block_type)
2201                         continue;
2202                 if (!adev->ip_blocks[i].version->funcs->set_powergating_state)
2203                         continue;
2204                 r = adev->ip_blocks[i].version->funcs->set_powergating_state(
2205                         (void *)adev, state);
2206                 if (r)
2207                         DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
2208                                   adev->ip_blocks[i].version->funcs->name, r);
2209         }
2210         return r;
2211 }
2212
2213 /**
2214  * amdgpu_device_ip_get_clockgating_state - get the CG state
2215  *
2216  * @adev: amdgpu_device pointer
2217  * @flags: clockgating feature flags
2218  *
2219  * Walks the list of IPs on the device and updates the clockgating
2220  * flags for each IP.
2221  * Updates @flags with the feature flags for each hardware IP where
2222  * clockgating is enabled.
2223  */
2224 void amdgpu_device_ip_get_clockgating_state(struct amdgpu_device *adev,
2225                                             u64 *flags)
2226 {
2227         int i;
2228
2229         for (i = 0; i < adev->num_ip_blocks; i++) {
2230                 if (!adev->ip_blocks[i].status.valid)
2231                         continue;
2232                 if (adev->ip_blocks[i].version->funcs->get_clockgating_state)
2233                         adev->ip_blocks[i].version->funcs->get_clockgating_state((void *)adev, flags);
2234         }
2235 }
2236
2237 /**
2238  * amdgpu_device_ip_wait_for_idle - wait for idle
2239  *
2240  * @adev: amdgpu_device pointer
2241  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2242  *
2243  * Waits for the requested hardware IP to be idle.
2244  * Returns 0 for success or a negative error code on failure.
2245  */
2246 int amdgpu_device_ip_wait_for_idle(struct amdgpu_device *adev,
2247                                    enum amd_ip_block_type block_type)
2248 {
2249         int i, r;
2250
2251         for (i = 0; i < adev->num_ip_blocks; i++) {
2252                 if (!adev->ip_blocks[i].status.valid)
2253                         continue;
2254                 if (adev->ip_blocks[i].version->type == block_type) {
2255                         if (adev->ip_blocks[i].version->funcs->wait_for_idle) {
2256                                 r = adev->ip_blocks[i].version->funcs->wait_for_idle(
2257                                                                 &adev->ip_blocks[i]);
2258                                 if (r)
2259                                         return r;
2260                         }
2261                         break;
2262                 }
2263         }
2264         return 0;
2265
2266 }
2267
2268 /**
2269  * amdgpu_device_ip_is_valid - is the hardware IP enabled
2270  *
2271  * @adev: amdgpu_device pointer
2272  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2273  *
2274  * Check if the hardware IP is enabled or not.
2275  * Returns true if the IP is enabled, false if not.
2276  */
2277 bool amdgpu_device_ip_is_valid(struct amdgpu_device *adev,
2278                                enum amd_ip_block_type block_type)
2279 {
2280         int i;
2281
2282         for (i = 0; i < adev->num_ip_blocks; i++) {
2283                 if (adev->ip_blocks[i].version->type == block_type)
2284                         return adev->ip_blocks[i].status.valid;
2285         }
2286         return false;
2287
2288 }
2289
2290 /**
2291  * amdgpu_device_ip_get_ip_block - get a hw IP pointer
2292  *
2293  * @adev: amdgpu_device pointer
2294  * @type: Type of hardware IP (SMU, GFX, UVD, etc.)
2295  *
2296  * Returns a pointer to the hardware IP block structure
2297  * if it exists for the asic, otherwise NULL.
2298  */
2299 struct amdgpu_ip_block *
2300 amdgpu_device_ip_get_ip_block(struct amdgpu_device *adev,
2301                               enum amd_ip_block_type type)
2302 {
2303         int i;
2304
2305         for (i = 0; i < adev->num_ip_blocks; i++)
2306                 if (adev->ip_blocks[i].version->type == type)
2307                         return &adev->ip_blocks[i];
2308
2309         return NULL;
2310 }
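
/*
 * Example (illustrative only): the lookup may return NULL, so callers
 * must check the result before dereferencing it.
 */
static void __maybe_unused amdgpu_device_ip_block_example(struct amdgpu_device *adev)
{
        struct amdgpu_ip_block *ip_block =
                amdgpu_device_ip_get_ip_block(adev, AMD_IP_BLOCK_TYPE_GMC);

        if (ip_block && ip_block->status.valid)
                dev_info(adev->dev, "GMC IP block <%s> is valid\n",
                         ip_block->version->funcs->name);
}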
2311
2312 /**
2313  * amdgpu_device_ip_block_version_cmp
2314  *
2315  * @adev: amdgpu_device pointer
2316  * @type: enum amd_ip_block_type
2317  * @major: major version
2318  * @minor: minor version
2319  *
2320  * Return 0 if the IP block's version is equal to or greater than major.minor;
2321  * return 1 if it is smaller or the ip_block doesn't exist.
2322  */
2323 int amdgpu_device_ip_block_version_cmp(struct amdgpu_device *adev,
2324                                        enum amd_ip_block_type type,
2325                                        u32 major, u32 minor)
2326 {
2327         struct amdgpu_ip_block *ip_block = amdgpu_device_ip_get_ip_block(adev, type);
2328
2329         if (ip_block && ((ip_block->version->major > major) ||
2330                         ((ip_block->version->major == major) &&
2331                         (ip_block->version->minor >= minor))))
2332                 return 0;
2333
2334         return 1;
2335 }
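
/*
 * Example (illustrative version numbers): a return of 0 means the IP
 * block's version is >= major.minor, e.g.:
 *
 *      if (!amdgpu_device_ip_block_version_cmp(adev, AMD_IP_BLOCK_TYPE_SMC, 7, 1))
 *              ... SMC 7.1 or newer is present ...
 */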
2336
2337 /**
2338  * amdgpu_device_ip_block_add
2339  *
2340  * @adev: amdgpu_device pointer
2341  * @ip_block_version: pointer to the IP to add
2342  *
2343  * Adds the IP block driver information to the collection of IPs
2344  * on the asic.
2345  */
2346 int amdgpu_device_ip_block_add(struct amdgpu_device *adev,
2347                                const struct amdgpu_ip_block_version *ip_block_version)
2348 {
2349         if (!ip_block_version)
2350                 return -EINVAL;
2351
2352         switch (ip_block_version->type) {
2353         case AMD_IP_BLOCK_TYPE_VCN:
2354                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_VCN_MASK)
2355                         return 0;
2356                 break;
2357         case AMD_IP_BLOCK_TYPE_JPEG:
2358                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_JPEG_MASK)
2359                         return 0;
2360                 break;
2361         default:
2362                 break;
2363         }
2364
2365         DRM_INFO("add ip block number %d <%s>\n", adev->num_ip_blocks,
2366                   ip_block_version->funcs->name);
2367
2368         adev->ip_blocks[adev->num_ip_blocks].adev = adev;
2369
2370         adev->ip_blocks[adev->num_ip_blocks++].version = ip_block_version;
2371
2372         return 0;
2373 }
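
/*
 * Typical caller sketch (hypothetical subset; the real soc files register
 * the full, ordered list for their asic):
 *
 *      r = amdgpu_device_ip_block_add(adev, &vi_common_ip_block);
 *      if (r)
 *              return r;
 *      r = amdgpu_device_ip_block_add(adev, &gmc_v8_0_ip_block);
 *      if (r)
 *              return r;
 *
 * Harvested VCN/JPEG instances are skipped by the checks above, so callers
 * don't need to special-case them.
 */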
2374
2375 /**
2376  * amdgpu_device_enable_virtual_display - enable virtual display feature
2377  *
2378  * @adev: amdgpu_device pointer
2379  *
2380  * Enables the virtual display feature if the user has enabled it via
2381  * the module parameter virtual_display.  This feature provides virtual
2382  * display hardware on headless boards or in virtualized environments.
2383  * This function parses and validates the configuration string specified by
2384  * the user and configures the virtual display configuration (number of
2385  * virtual connectors, crtcs, etc.) specified.
2386  */
2387 static void amdgpu_device_enable_virtual_display(struct amdgpu_device *adev)
2388 {
2389         adev->enable_virtual_display = false;
2390
2391         if (amdgpu_virtual_display) {
2392                 const char *pci_address_name = pci_name(adev->pdev);
2393                 char *pciaddstr, *pciaddstr_tmp, *pciaddname_tmp, *pciaddname;
2394
2395                 pciaddstr = kstrdup(amdgpu_virtual_display, GFP_KERNEL);
2396                 pciaddstr_tmp = pciaddstr;
2397                 while ((pciaddname_tmp = strsep(&pciaddstr_tmp, ";"))) {
2398                         pciaddname = strsep(&pciaddname_tmp, ",");
2399                         if (!strcmp("all", pciaddname)
2400                             || !strcmp(pci_address_name, pciaddname)) {
2401                                 long num_crtc;
2402                                 int res = -1;
2403
2404                                 adev->enable_virtual_display = true;
2405
2406                                 if (pciaddname_tmp)
2407                                         res = kstrtol(pciaddname_tmp, 10,
2408                                                       &num_crtc);
2409
2410                                 if (!res) {
2411                                         if (num_crtc < 1)
2412                                                 num_crtc = 1;
2413                                         if (num_crtc > 6)
2414                                                 num_crtc = 6;
2415                                         adev->mode_info.num_crtc = num_crtc;
2416                                 } else {
2417                                         adev->mode_info.num_crtc = 1;
2418                                 }
2419                                 break;
2420                         }
2421                 }
2422
2423                 DRM_INFO("virtual display string:%s, %s:virtual_display:%d, num_crtc:%d\n",
2424                          amdgpu_virtual_display, pci_address_name,
2425                          adev->enable_virtual_display, adev->mode_info.num_crtc);
2426
2427                 kfree(pciaddstr);
2428         }
2429 }
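
/*
 * Parameter format sketch (hypothetical PCI address): entries are
 * semicolon-separated "<pci address>[,<num crtcs>]" pairs, where "all"
 * matches every device, e.g.:
 *
 *      amdgpu.virtual_display=0000:04:00.0,2;all,1
 *
 * gives the device at 0000:04:00.0 two virtual crtcs and every other
 * device one; num_crtc is clamped to the 1..6 range above and defaults
 * to 1 when omitted.
 */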
2430
2431 void amdgpu_device_set_sriov_virtual_display(struct amdgpu_device *adev)
2432 {
2433         if (amdgpu_sriov_vf(adev) && !adev->enable_virtual_display) {
2434                 adev->mode_info.num_crtc = 1;
2435                 adev->enable_virtual_display = true;
2436                 DRM_INFO("virtual_display:%d, num_crtc:%d\n",
2437                          adev->enable_virtual_display, adev->mode_info.num_crtc);
2438         }
2439 }
2440
2441 /**
2442  * amdgpu_device_parse_gpu_info_fw - parse gpu info firmware
2443  *
2444  * @adev: amdgpu_device pointer
2445  *
2446  * Parses the asic configuration parameters specified in the gpu info
2447  * firmware and makes them available to the driver for use in configuring
2448  * the asic.
2449  * Returns 0 on success, -EINVAL on failure.
2450  */
2451 static int amdgpu_device_parse_gpu_info_fw(struct amdgpu_device *adev)
2452 {
2453         const char *chip_name;
2454         int err;
2455         const struct gpu_info_firmware_header_v1_0 *hdr;
2456
2457         adev->firmware.gpu_info_fw = NULL;
2458
2459         if (adev->mman.discovery_bin)
2460                 return 0;
2461
2462         switch (adev->asic_type) {
2463         default:
2464                 return 0;
2465         case CHIP_VEGA10:
2466                 chip_name = "vega10";
2467                 break;
2468         case CHIP_VEGA12:
2469                 chip_name = "vega12";
2470                 break;
2471         case CHIP_RAVEN:
2472                 if (adev->apu_flags & AMD_APU_IS_RAVEN2)
2473                         chip_name = "raven2";
2474                 else if (adev->apu_flags & AMD_APU_IS_PICASSO)
2475                         chip_name = "picasso";
2476                 else
2477                         chip_name = "raven";
2478                 break;
2479         case CHIP_ARCTURUS:
2480                 chip_name = "arcturus";
2481                 break;
2482         case CHIP_NAVI12:
2483                 chip_name = "navi12";
2484                 break;
2485         }
2486
2487         err = amdgpu_ucode_request(adev, &adev->firmware.gpu_info_fw,
2488                                    "amdgpu/%s_gpu_info.bin", chip_name);
2489         if (err) {
2490                 dev_err(adev->dev,
2491                         "Failed to get gpu_info firmware \"%s_gpu_info.bin\"\n",
2492                         chip_name);
2493                 goto out;
2494         }
2495
2496         hdr = (const struct gpu_info_firmware_header_v1_0 *)adev->firmware.gpu_info_fw->data;
2497         amdgpu_ucode_print_gpu_info_hdr(&hdr->header);
2498
2499         switch (hdr->version_major) {
2500         case 1:
2501         {
2502                 const struct gpu_info_firmware_v1_0 *gpu_info_fw =
2503                         (const struct gpu_info_firmware_v1_0 *)(adev->firmware.gpu_info_fw->data +
2504                                                                 le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2505
2506                 /*
2507                  * Should be dropped when DAL no longer needs it.
2508                  */
2509                 if (adev->asic_type == CHIP_NAVI12)
2510                         goto parse_soc_bounding_box;
2511
2512                 adev->gfx.config.max_shader_engines = le32_to_cpu(gpu_info_fw->gc_num_se);
2513                 adev->gfx.config.max_cu_per_sh = le32_to_cpu(gpu_info_fw->gc_num_cu_per_sh);
2514                 adev->gfx.config.max_sh_per_se = le32_to_cpu(gpu_info_fw->gc_num_sh_per_se);
2515                 adev->gfx.config.max_backends_per_se = le32_to_cpu(gpu_info_fw->gc_num_rb_per_se);
2516                 adev->gfx.config.max_texture_channel_caches =
2517                         le32_to_cpu(gpu_info_fw->gc_num_tccs);
2518                 adev->gfx.config.max_gprs = le32_to_cpu(gpu_info_fw->gc_num_gprs);
2519                 adev->gfx.config.max_gs_threads = le32_to_cpu(gpu_info_fw->gc_num_max_gs_thds);
2520                 adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gpu_info_fw->gc_gs_table_depth);
2521                 adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gpu_info_fw->gc_gsprim_buff_depth);
2522                 adev->gfx.config.double_offchip_lds_buf =
2523                         le32_to_cpu(gpu_info_fw->gc_double_offchip_lds_buffer);
2524                 adev->gfx.cu_info.wave_front_size = le32_to_cpu(gpu_info_fw->gc_wave_size);
2525                 adev->gfx.cu_info.max_waves_per_simd =
2526                         le32_to_cpu(gpu_info_fw->gc_max_waves_per_simd);
2527                 adev->gfx.cu_info.max_scratch_slots_per_cu =
2528                         le32_to_cpu(gpu_info_fw->gc_max_scratch_slots_per_cu);
2529                 adev->gfx.cu_info.lds_size = le32_to_cpu(gpu_info_fw->gc_lds_size);
2530                 if (hdr->version_minor >= 1) {
2531                         const struct gpu_info_firmware_v1_1 *gpu_info_fw =
2532                                 (const struct gpu_info_firmware_v1_1 *)(adev->firmware.gpu_info_fw->data +
2533                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2534                         adev->gfx.config.num_sc_per_sh =
2535                                 le32_to_cpu(gpu_info_fw->num_sc_per_sh);
2536                         adev->gfx.config.num_packer_per_sc =
2537                                 le32_to_cpu(gpu_info_fw->num_packer_per_sc);
2538                 }
2539
2540 parse_soc_bounding_box:
2541                 /*
2542                  * soc bounding box info is not integrated into the discovery table,
2543                  * so we still need to parse it from the gpu info firmware when needed.
2544                  */
2545                 if (hdr->version_minor == 2) {
2546                         const struct gpu_info_firmware_v1_2 *gpu_info_fw =
2547                                 (const struct gpu_info_firmware_v1_2 *)(adev->firmware.gpu_info_fw->data +
2548                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2549                         adev->dm.soc_bounding_box = &gpu_info_fw->soc_bounding_box;
2550                 }
2551                 break;
2552         }
2553         default:
2554                 dev_err(adev->dev,
2555                         "Unsupported gpu_info table %d\n", hdr->header.ucode_version);
2556                 err = -EINVAL;
2557                 goto out;
2558         }
2559 out:
2560         return err;
2561 }
2562
2563 /**
2564  * amdgpu_device_ip_early_init - run early init for hardware IPs
2565  *
2566  * @adev: amdgpu_device pointer
2567  *
2568  * Early initialization pass for hardware IPs.  The hardware IPs that make
2569  * up each asic are discovered and each IP's early_init callback is run.  This
2570  * is the first stage in initializing the asic.
2571  * Returns 0 on success, negative error code on failure.
2572  */
2573 static int amdgpu_device_ip_early_init(struct amdgpu_device *adev)
2574 {
2575         struct amdgpu_ip_block *ip_block;
2576         struct pci_dev *parent;
2577         int i, r;
2578         bool total;
2579
2580         amdgpu_device_enable_virtual_display(adev);
2581
2582         if (amdgpu_sriov_vf(adev)) {
2583                 r = amdgpu_virt_request_full_gpu(adev, true);
2584                 if (r)
2585                         return r;
2586         }
2587
2588         switch (adev->asic_type) {
2589 #ifdef CONFIG_DRM_AMDGPU_SI
2590         case CHIP_VERDE:
2591         case CHIP_TAHITI:
2592         case CHIP_PITCAIRN:
2593         case CHIP_OLAND:
2594         case CHIP_HAINAN:
2595                 adev->family = AMDGPU_FAMILY_SI;
2596                 r = si_set_ip_blocks(adev);
2597                 if (r)
2598                         return r;
2599                 break;
2600 #endif
2601 #ifdef CONFIG_DRM_AMDGPU_CIK
2602         case CHIP_BONAIRE:
2603         case CHIP_HAWAII:
2604         case CHIP_KAVERI:
2605         case CHIP_KABINI:
2606         case CHIP_MULLINS:
2607                 if (adev->flags & AMD_IS_APU)
2608                         adev->family = AMDGPU_FAMILY_KV;
2609                 else
2610                         adev->family = AMDGPU_FAMILY_CI;
2611
2612                 r = cik_set_ip_blocks(adev);
2613                 if (r)
2614                         return r;
2615                 break;
2616 #endif
2617         case CHIP_TOPAZ:
2618         case CHIP_TONGA:
2619         case CHIP_FIJI:
2620         case CHIP_POLARIS10:
2621         case CHIP_POLARIS11:
2622         case CHIP_POLARIS12:
2623         case CHIP_VEGAM:
2624         case CHIP_CARRIZO:
2625         case CHIP_STONEY:
2626                 if (adev->flags & AMD_IS_APU)
2627                         adev->family = AMDGPU_FAMILY_CZ;
2628                 else
2629                         adev->family = AMDGPU_FAMILY_VI;
2630
2631                 r = vi_set_ip_blocks(adev);
2632                 if (r)
2633                         return r;
2634                 break;
2635         default:
2636                 r = amdgpu_discovery_set_ip_blocks(adev);
2637                 if (r)
2638                         return r;
2639                 break;
2640         }
2641
2642         if (amdgpu_has_atpx() &&
2643             (amdgpu_is_atpx_hybrid() ||
2644              amdgpu_has_atpx_dgpu_power_cntl()) &&
2645             ((adev->flags & AMD_IS_APU) == 0) &&
2646             !dev_is_removable(&adev->pdev->dev))
2647                 adev->flags |= AMD_IS_PX;
2648
2649         if (!(adev->flags & AMD_IS_APU)) {
2650                 parent = pcie_find_root_port(adev->pdev);
2651                 adev->has_pr3 = parent ? pci_pr3_present(parent) : false;
2652         }
2653
2654
2655         adev->pm.pp_feature = amdgpu_pp_feature_mask;
2656         if (amdgpu_sriov_vf(adev) || sched_policy == KFD_SCHED_POLICY_NO_HWS)
2657                 adev->pm.pp_feature &= ~PP_GFXOFF_MASK;
2658         if (amdgpu_sriov_vf(adev) && adev->asic_type == CHIP_SIENNA_CICHLID)
2659                 adev->pm.pp_feature &= ~PP_OVERDRIVE_MASK;
2660         if (!amdgpu_device_pcie_dynamic_switching_supported(adev))
2661                 adev->pm.pp_feature &= ~PP_PCIE_DPM_MASK;
2662
2663         total = true;
2664         for (i = 0; i < adev->num_ip_blocks; i++) {
2665                 ip_block = &adev->ip_blocks[i];
2666
2667                 if ((amdgpu_ip_block_mask & (1 << i)) == 0) {
2668                         DRM_WARN("disabled ip block: %d <%s>\n",
2669                                   i, adev->ip_blocks[i].version->funcs->name);
2670                         adev->ip_blocks[i].status.valid = false;
2671                 } else if (ip_block->version->funcs->early_init) {
2672                         r = ip_block->version->funcs->early_init(ip_block);
2673                         if (r == -ENOENT) {
2674                                 adev->ip_blocks[i].status.valid = false;
2675                         } else if (r) {
2676                                 DRM_ERROR("early_init of IP block <%s> failed %d\n",
2677                                           adev->ip_blocks[i].version->funcs->name, r);
2678                                 total = false;
2679                         } else {
2680                                 adev->ip_blocks[i].status.valid = true;
2681                         }
2682                 } else {
2683                         adev->ip_blocks[i].status.valid = true;
2684                 }
2685                 /* get the vbios after the asic_funcs are set up */
2686                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2687                         r = amdgpu_device_parse_gpu_info_fw(adev);
2688                         if (r)
2689                                 return r;
2690
2691                         /* Read BIOS */
2692                         if (amdgpu_device_read_bios(adev)) {
2693                                 if (!amdgpu_get_bios(adev))
2694                                         return -EINVAL;
2695
2696                                 r = amdgpu_atombios_init(adev);
2697                                 if (r) {
2698                                         dev_err(adev->dev, "amdgpu_atombios_init failed\n");
2699                                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_INIT_FAIL, 0, 0);
2700                                         return r;
2701                                 }
2702                         }
2703
2704                         /* get pf2vf msg info at its earliest time */
2705                         if (amdgpu_sriov_vf(adev))
2706                                 amdgpu_virt_init_data_exchange(adev);
2707
2708                 }
2709         }
2710         if (!total)
2711                 return -ENODEV;
2712
2713         ip_block = amdgpu_device_ip_get_ip_block(adev, AMD_IP_BLOCK_TYPE_GFX);
2714         if (ip_block && ip_block->status.valid)
2715                 amdgpu_amdkfd_device_probe(adev);
2716
2717         adev->cg_flags &= amdgpu_cg_mask;
2718         adev->pg_flags &= amdgpu_pg_mask;
2719
2720         return 0;
2721 }
2722
2723 static int amdgpu_device_ip_hw_init_phase1(struct amdgpu_device *adev)
2724 {
2725         int i, r;
2726
2727         for (i = 0; i < adev->num_ip_blocks; i++) {
2728                 if (!adev->ip_blocks[i].status.sw)
2729                         continue;
2730                 if (adev->ip_blocks[i].status.hw)
2731                         continue;
2732                 if (!amdgpu_ip_member_of_hwini(
2733                             adev, adev->ip_blocks[i].version->type))
2734                         continue;
2735                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
2736                     (amdgpu_sriov_vf(adev) && (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)) ||
2737                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH) {
2738                         r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2739                         if (r) {
2740                                 DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2741                                           adev->ip_blocks[i].version->funcs->name, r);
2742                                 return r;
2743                         }
2744                         adev->ip_blocks[i].status.hw = true;
2745                 }
2746         }
2747
2748         return 0;
2749 }
2750
2751 static int amdgpu_device_ip_hw_init_phase2(struct amdgpu_device *adev)
2752 {
2753         int i, r;
2754
2755         for (i = 0; i < adev->num_ip_blocks; i++) {
2756                 if (!adev->ip_blocks[i].status.sw)
2757                         continue;
2758                 if (adev->ip_blocks[i].status.hw)
2759                         continue;
2760                 if (!amdgpu_ip_member_of_hwini(
2761                             adev, adev->ip_blocks[i].version->type))
2762                         continue;
2763                 r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2764                 if (r) {
2765                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2766                                   adev->ip_blocks[i].version->funcs->name, r);
2767                         return r;
2768                 }
2769                 adev->ip_blocks[i].status.hw = true;
2770         }
2771
2772         return 0;
2773 }
2774
2775 static int amdgpu_device_fw_loading(struct amdgpu_device *adev)
2776 {
2777         int r = 0;
2778         int i;
2779         uint32_t smu_version;
2780
2781         if (adev->asic_type >= CHIP_VEGA10) {
2782                 for (i = 0; i < adev->num_ip_blocks; i++) {
2783                         if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_PSP)
2784                                 continue;
2785
2786                         if (!amdgpu_ip_member_of_hwini(adev,
2787                                                        AMD_IP_BLOCK_TYPE_PSP))
2788                                 break;
2789
2790                         if (!adev->ip_blocks[i].status.sw)
2791                                 continue;
2792
2793                         /* no need to do the fw loading again if already done */
2794                         if (adev->ip_blocks[i].status.hw)
2795                                 break;
2796
2797                         if (amdgpu_in_reset(adev) || adev->in_suspend) {
2798                                 r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
2799                                 if (r)
2800                                         return r;
2801                         } else {
2802                                 r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2803                                 if (r) {
2804                                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2805                                                           adev->ip_blocks[i].version->funcs->name, r);
2806                                         return r;
2807                                 }
2808                                 adev->ip_blocks[i].status.hw = true;
2809                         }
2810                         break;
2811                 }
2812         }
2813
2814         if (!amdgpu_sriov_vf(adev) || adev->asic_type == CHIP_TONGA)
2815                 r = amdgpu_pm_load_smu_firmware(adev, &smu_version);
2816
2817         return r;
2818 }
2819
2820 static int amdgpu_device_init_schedulers(struct amdgpu_device *adev)
2821 {
2822         long timeout;
2823         int r, i;
2824
2825         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2826                 struct amdgpu_ring *ring = adev->rings[i];
2827
2828                 /* No need to setup the GPU scheduler for rings that don't need it */
2829                 if (!ring || ring->no_scheduler)
2830                         continue;
2831
2832                 switch (ring->funcs->type) {
2833                 case AMDGPU_RING_TYPE_GFX:
2834                         timeout = adev->gfx_timeout;
2835                         break;
2836                 case AMDGPU_RING_TYPE_COMPUTE:
2837                         timeout = adev->compute_timeout;
2838                         break;
2839                 case AMDGPU_RING_TYPE_SDMA:
2840                         timeout = adev->sdma_timeout;
2841                         break;
2842                 default:
2843                         timeout = adev->video_timeout;
2844                         break;
2845                 }
2846
2847                 r = drm_sched_init(&ring->sched, &amdgpu_sched_ops, NULL,
2848                                    DRM_SCHED_PRIORITY_COUNT,
2849                                    ring->num_hw_submission, 0,
2850                                    timeout, adev->reset_domain->wq,
2851                                    ring->sched_score, ring->name,
2852                                    adev->dev);
2853                 if (r) {
2854                         DRM_ERROR("Failed to create scheduler on ring %s.\n",
2855                                   ring->name);
2856                         return r;
2857                 }
2858                 r = amdgpu_uvd_entity_init(adev, ring);
2859                 if (r) {
2860                         DRM_ERROR("Failed to create UVD scheduling entity on ring %s.\n",
2861                                   ring->name);
2862                         return r;
2863                 }
2864                 r = amdgpu_vce_entity_init(adev, ring);
2865                 if (r) {
2866                         DRM_ERROR("Failed to create VCE scheduling entity on ring %s.\n",
2867                                   ring->name);
2868                         return r;
2869                 }
2870         }
2871
2872         amdgpu_xcp_update_partition_sched_list(adev);
2873
2874         return 0;
2875 }
2876
2877
2878 /**
2879  * amdgpu_device_ip_init - run init for hardware IPs
2880  *
2881  * @adev: amdgpu_device pointer
2882  *
2883  * Main initialization pass for hardware IPs.  The list of all the hardware
2884  * IPs that make up the asic is walked and the sw_init and hw_init callbacks
2885  * are run.  sw_init initializes the software state associated with each IP
2886  * and hw_init initializes the hardware associated with each IP.
2887  * Returns 0 on success, negative error code on failure.
2888  */
2889 static int amdgpu_device_ip_init(struct amdgpu_device *adev)
2890 {
2891         bool init_badpage;
2892         int i, r;
2893
2894         r = amdgpu_ras_init(adev);
2895         if (r)
2896                 return r;
2897
2898         for (i = 0; i < adev->num_ip_blocks; i++) {
2899                 if (!adev->ip_blocks[i].status.valid)
2900                         continue;
2901                 if (adev->ip_blocks[i].version->funcs->sw_init) {
2902                         r = adev->ip_blocks[i].version->funcs->sw_init(&adev->ip_blocks[i]);
2903                         if (r) {
2904                                 DRM_ERROR("sw_init of IP block <%s> failed %d\n",
2905                                           adev->ip_blocks[i].version->funcs->name, r);
2906                                 goto init_failed;
2907                         }
2908                 }
2909                 adev->ip_blocks[i].status.sw = true;
2910
2911                 if (!amdgpu_ip_member_of_hwini(
2912                             adev, adev->ip_blocks[i].version->type))
2913                         continue;
2914
2915                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2916                         /* need to do common hw init early so everything is set up for gmc */
2917                         r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2918                         if (r) {
2919                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2920                                 goto init_failed;
2921                         }
2922                         adev->ip_blocks[i].status.hw = true;
2923                 } else if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2924                         /* need to do gmc hw init early so we can allocate gpu mem */
2925                         /* Try to reserve bad pages early */
2926                         if (amdgpu_sriov_vf(adev))
2927                                 amdgpu_virt_exchange_data(adev);
2928
2929                         r = amdgpu_device_mem_scratch_init(adev);
2930                         if (r) {
2931                                 DRM_ERROR("amdgpu_device_mem_scratch_init failed %d\n", r);
2932                                 goto init_failed;
2933                         }
2934                         r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2935                         if (r) {
2936                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2937                                 goto init_failed;
2938                         }
2939                         r = amdgpu_device_wb_init(adev);
2940                         if (r) {
2941                                 DRM_ERROR("amdgpu_device_wb_init failed %d\n", r);
2942                                 goto init_failed;
2943                         }
2944                         adev->ip_blocks[i].status.hw = true;
2945
2946                         /* right after GMC hw init, we create CSA */
2947                         if (adev->gfx.mcbp) {
2948                                 r = amdgpu_allocate_static_csa(adev, &adev->virt.csa_obj,
2949                                                                AMDGPU_GEM_DOMAIN_VRAM |
2950                                                                AMDGPU_GEM_DOMAIN_GTT,
2951                                                                AMDGPU_CSA_SIZE);
2952                                 if (r) {
2953                                         DRM_ERROR("allocate CSA failed %d\n", r);
2954                                         goto init_failed;
2955                                 }
2956                         }
2957
2958                         r = amdgpu_seq64_init(adev);
2959                         if (r) {
2960                                 DRM_ERROR("allocate seq64 failed %d\n", r);
2961                                 goto init_failed;
2962                         }
2963                 }
2964         }
2965
2966         if (amdgpu_sriov_vf(adev))
2967                 amdgpu_virt_init_data_exchange(adev);
2968
2969         r = amdgpu_ib_pool_init(adev);
2970         if (r) {
2971                 dev_err(adev->dev, "IB initialization failed (%d).\n", r);
2972                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_IB_INIT_FAIL, 0, r);
2973                 goto init_failed;
2974         }
2975
2976         r = amdgpu_ucode_create_bo(adev); /* create the ucode BO once sw_init is complete */
2977         if (r)
2978                 goto init_failed;
2979
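	/*
	 * hw_init is split into two phases around firmware loading: phase 1
	 * brings up the early IP blocks that must be running before microcode
	 * can be loaded, then the firmware itself is loaded, and phase 2
	 * initializes the remaining blocks.
	 */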
2980         r = amdgpu_device_ip_hw_init_phase1(adev);
2981         if (r)
2982                 goto init_failed;
2983
2984         r = amdgpu_device_fw_loading(adev);
2985         if (r)
2986                 goto init_failed;
2987
2988         r = amdgpu_device_ip_hw_init_phase2(adev);
2989         if (r)
2990                 goto init_failed;
2991
2992         /*
2993          * Retired pages are loaded from the EEPROM and reserved here.
2994          * This must be called after amdgpu_device_ip_hw_init_phase2, since
2995          * on some ASICs the RAS EEPROM code relies on the SMU being fully
2996          * functional for I2C communication, which is only true at this point.
2997          *
2998          * amdgpu_ras_recovery_init may fail, but the caller only acts on
2999          * failures caused by a bad GPU and stops the amdgpu init process
3000          * accordingly.  For other failures it still releases all the
3001          * resources and prints an error message rather than returning a
3002          * negative value to the upper level.
3003          *
3004          * Note: in theory this should be called before any VRAM allocation
3005          * to protect retired pages from being reused.
3006          */
3007         init_badpage = (adev->init_lvl->level != AMDGPU_INIT_LEVEL_MINIMAL_XGMI);
3008         r = amdgpu_ras_recovery_init(adev, init_badpage);
3009         if (r)
3010                 goto init_failed;
3011
3012         /*
3013          * In case of XGMI, grab an extra reference on the reset domain for this device.
3014          */
3015         if (adev->gmc.xgmi.num_physical_nodes > 1) {
3016                 if (amdgpu_xgmi_add_device(adev) == 0) {
3017                         if (!amdgpu_sriov_vf(adev)) {
3018                                 struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3019
3020                                 if (WARN_ON(!hive)) {
3021                                         r = -ENOENT;
3022                                         goto init_failed;
3023                                 }
3024
3025                                 if (!hive->reset_domain ||
3026                                     !amdgpu_reset_get_reset_domain(hive->reset_domain)) {
3027                                         r = -ENOENT;
3028                                         amdgpu_put_xgmi_hive(hive);
3029                                         goto init_failed;
3030                                 }
3031
3032                                 /* Drop the early temporary reset domain we created for device */
3033                                 amdgpu_reset_put_reset_domain(adev->reset_domain);
3034                                 adev->reset_domain = hive->reset_domain;
3035                                 amdgpu_put_xgmi_hive(hive);
3036                         }
3037                 }
3038         }
3039
3040         r = amdgpu_device_init_schedulers(adev);
3041         if (r)
3042                 goto init_failed;
3043
3044         if (adev->mman.buffer_funcs_ring->sched.ready)
3045                 amdgpu_ttm_set_buffer_funcs_status(adev, true);
3046
3047         /* Don't init kfd if the whole hive needs to be reset during init */
3048         if (adev->init_lvl->level != AMDGPU_INIT_LEVEL_MINIMAL_XGMI) {
3049                 kgd2kfd_init_zone_device(adev);
3050                 amdgpu_amdkfd_device_init(adev);
3051         }
3052
3053         amdgpu_fru_get_product_info(adev);
3054
3055 init_failed:
3056
3057         return r;
3058 }
3059
3060 /**
3061  * amdgpu_device_fill_reset_magic - save the reset magic from the gart pointer
3062  *
3063  * @adev: amdgpu_device pointer
3064  *
3065  * Saves the current contents of the gart pointer in VRAM as the reset magic.
3066  * The driver calls this before a GPU reset; if the value is retained after
3067  * the reset, VRAM has not been lost.  Some GPU resets may destroy VRAM contents.
3068  */
3069 static void amdgpu_device_fill_reset_magic(struct amdgpu_device *adev)
3070 {
3071         memcpy(adev->reset_magic, adev->gart.ptr, AMDGPU_RESET_MAGIC_NUM);
3072 }
3073
3074 /**
3075  * amdgpu_device_check_vram_lost - check if vram is valid
3076  *
3077  * @adev: amdgpu_device pointer
3078  *
3079  * Compares the saved reset magic against the current contents of the gart
3080  * pointer in VRAM.  The driver calls this after a GPU reset to see whether
3081  * the contents of VRAM have been lost.
3082  * Returns true if VRAM is lost, false if not.
3083  */
3084 static bool amdgpu_device_check_vram_lost(struct amdgpu_device *adev)
3085 {
3086         if (memcmp(adev->gart.ptr, adev->reset_magic,
3087                         AMDGPU_RESET_MAGIC_NUM))
3088                 return true;
3089
3090         if (!amdgpu_in_reset(adev))
3091                 return false;
3092
3093         /*
3094          * For all ASICs with baco/mode1 reset, the VRAM is
3095          * always assumed to be lost.
3096          */
3097         switch (amdgpu_asic_reset_method(adev)) {
3098         case AMD_RESET_METHOD_BACO:
3099         case AMD_RESET_METHOD_MODE1:
3100                 return true;
3101         default:
3102                 return false;
3103         }
3104 }
3105
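/*
 * Rough usage sketch (illustrative; the real call sites live in this
 * file's reset and resume paths): the two helpers above are used as a
 * pair around a GPU reset:
 *
 *	amdgpu_device_fill_reset_magic(adev);	// snapshot before the reset
 *	amdgpu_asic_reset(adev);		// perform the reset
 *	vram_lost = amdgpu_device_check_vram_lost(adev);
 *	// if vram_lost, VRAM-backed buffers must be restored by the caller
 */
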
3106 /**
3107  * amdgpu_device_set_cg_state - set clockgating for amdgpu device
3108  *
3109  * @adev: amdgpu_device pointer
3110  * @state: clockgating state (gate or ungate)
3111  *
3112  * The list of all the hardware IPs that make up the asic is walked and the
3113  * set_clockgating_state callbacks are run.
3114  * During late init this pass enables clockgating for the hardware IPs;
3115  * during fini or suspend it disables clockgating.
3116  * Returns 0 on success, negative error code on failure.
3117  */
3118
3119 int amdgpu_device_set_cg_state(struct amdgpu_device *adev,
3120                                enum amd_clockgating_state state)
3121 {
3122         int i, j, r;
3123
3124         if (amdgpu_emu_mode == 1)
3125                 return 0;
3126
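	/*
	 * Gate in normal IP-block order and ungate in reverse order, so
	 * inter-IP dependencies are honored in both directions.
	 */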
3127         for (j = 0; j < adev->num_ip_blocks; j++) {
3128                 i = state == AMD_CG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
3129                 if (!adev->ip_blocks[i].status.late_initialized)
3130                         continue;
3131                 /* skip CG for GFX, SDMA on S0ix */
3132                 if (adev->in_s0ix &&
3133                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3134                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SDMA))
3135                         continue;
3136                 /* skip CG for VCE/UVD, it's handled specially */
3137                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
3138                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
3139                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
3140                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
3141                     adev->ip_blocks[i].version->funcs->set_clockgating_state) {
3142                         /* enable clockgating to save power */
3143                         r = adev->ip_blocks[i].version->funcs->set_clockgating_state((void *)adev,
3144                                                                                      state);
3145                         if (r) {
3146                                 DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
3147                                           adev->ip_blocks[i].version->funcs->name, r);
3148                                 return r;
3149                         }
3150                 }
3151         }
3152
3153         return 0;
3154 }
3155
3156 int amdgpu_device_set_pg_state(struct amdgpu_device *adev,
3157                                enum amd_powergating_state state)
3158 {
3159         int i, j, r;
3160
3161         if (amdgpu_emu_mode == 1)
3162                 return 0;
3163
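	/* Same ordering rule as clockgating: gate forward, ungate in reverse. */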
3164         for (j = 0; j < adev->num_ip_blocks; j++) {
3165                 i = state == AMD_PG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
3166                 if (!adev->ip_blocks[i].status.late_initialized)
3167                         continue;
3168                 /* skip PG for GFX, SDMA on S0ix */
3169                 if (adev->in_s0ix &&
3170                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3171                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SDMA))
3172                         continue;
3173                 /* skip PG for VCE/UVD, it's handled specially */
3174                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
3175                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
3176                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
3177                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
3178                     adev->ip_blocks[i].version->funcs->set_powergating_state) {
3179                         /* enable powergating to save power */
3180                         r = adev->ip_blocks[i].version->funcs->set_powergating_state((void *)adev,
3181                                                                                         state);
3182                         if (r) {
3183                                 DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
3184                                           adev->ip_blocks[i].version->funcs->name, r);
3185                                 return r;
3186                         }
3187                 }
3188         }
3189         return 0;
3190 }
3191
3192 static int amdgpu_device_enable_mgpu_fan_boost(void)
3193 {
3194         struct amdgpu_gpu_instance *gpu_ins;
3195         struct amdgpu_device *adev;
3196         int i, ret = 0;
3197
3198         mutex_lock(&mgpu_info.mutex);
3199
3200         /*
3201          * MGPU fan boost feature should be enabled
3202          * only when there are two or more dGPUs in
3203          * the system
3204          */
3205         if (mgpu_info.num_dgpu < 2)
3206                 goto out;
3207
3208         for (i = 0; i < mgpu_info.num_dgpu; i++) {
3209                 gpu_ins = &(mgpu_info.gpu_ins[i]);
3210                 adev = gpu_ins->adev;
3211                 if (!(adev->flags & AMD_IS_APU) &&
3212                     !gpu_ins->mgpu_fan_enabled) {
3213                         ret = amdgpu_dpm_enable_mgpu_fan_boost(adev);
3214                         if (ret)
3215                                 break;
3216
3217                         gpu_ins->mgpu_fan_enabled = 1;
3218                 }
3219         }
3220
3221 out:
3222         mutex_unlock(&mgpu_info.mutex);
3223
3224         return ret;
3225 }
3226
3227 /**
3228  * amdgpu_device_ip_late_init - run late init for hardware IPs
3229  *
3230  * @adev: amdgpu_device pointer
3231  *
3232  * Late initialization pass for hardware IPs.  The list of all the hardware
3233  * IPs that make up the asic is walked and the late_init callbacks are run.
3234  * late_init covers any special initialization that an IP requires
3235  * after all of them have been initialized, or anything that needs to happen
3236  * late in the init process.
3237  * Returns 0 on success, negative error code on failure.
3238  */
3239 static int amdgpu_device_ip_late_init(struct amdgpu_device *adev)
3240 {
3241         struct amdgpu_gpu_instance *gpu_instance;
3242         int i = 0, r;
3243
3244         for (i = 0; i < adev->num_ip_blocks; i++) {
3245                 if (!adev->ip_blocks[i].status.hw)
3246                         continue;
3247                 if (adev->ip_blocks[i].version->funcs->late_init) {
3248                         r = adev->ip_blocks[i].version->funcs->late_init(&adev->ip_blocks[i]);
3249                         if (r) {
3250                                 DRM_ERROR("late_init of IP block <%s> failed %d\n",
3251                                           adev->ip_blocks[i].version->funcs->name, r);
3252                                 return r;
3253                         }
3254                 }
3255                 adev->ip_blocks[i].status.late_initialized = true;
3256         }
3257
3258         r = amdgpu_ras_late_init(adev);
3259         if (r) {
3260                 DRM_ERROR("amdgpu_ras_late_init failed %d", r);
3261                 return r;
3262         }
3263
3264         if (!amdgpu_reset_in_recovery(adev))
3265                 amdgpu_ras_set_error_query_ready(adev, true);
3266
3267         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_GATE);
3268         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_GATE);
3269
3270         amdgpu_device_fill_reset_magic(adev);
3271
3272         r = amdgpu_device_enable_mgpu_fan_boost();
3273         if (r)
3274                 DRM_ERROR("enable mgpu fan boost failed (%d).\n", r);
3275
3276         /* For passthrough configurations on arcturus and aldebaran, enable special handling for SBR */
3277         if (amdgpu_passthrough(adev) &&
3278             ((adev->asic_type == CHIP_ARCTURUS && adev->gmc.xgmi.num_physical_nodes > 1) ||
3279              adev->asic_type == CHIP_ALDEBARAN))
3280                 amdgpu_dpm_handle_passthrough_sbr(adev, true);
3281
3282         if (adev->gmc.xgmi.num_physical_nodes > 1) {
3283                 mutex_lock(&mgpu_info.mutex);
3284
3285                 /*
3286                  * Reset the device p-state to low, as it was booted high.
3287                  *
3288                  * This should be performed only after all devices from the
3289                  * same hive have been initialized.
3290                  *
3291                  * However, the number of devices in a hive is not known in
3292                  * advance; it is counted one by one as the devices initialize.
3293                  *
3294                  * So we wait until all XGMI interlinked devices have been
3295                  * initialized.  This may add some delay, since those devices
3296                  * may come from different hives, but that should be OK.
3297                  */
3298                 if (mgpu_info.num_dgpu == adev->gmc.xgmi.num_physical_nodes) {
3299                         for (i = 0; i < mgpu_info.num_gpu; i++) {
3300                                 gpu_instance = &(mgpu_info.gpu_ins[i]);
3301                                 if (gpu_instance->adev->flags & AMD_IS_APU)
3302                                         continue;
3303
3304                                 r = amdgpu_xgmi_set_pstate(gpu_instance->adev,
3305                                                 AMDGPU_XGMI_PSTATE_MIN);
3306                                 if (r) {
3307                                         DRM_ERROR("pstate setting failed (%d).\n", r);
3308                                         break;
3309                                 }
3310                         }
3311                 }
3312
3313                 mutex_unlock(&mgpu_info.mutex);
3314         }
3315
3316         return 0;
3317 }
3318
3319 static void amdgpu_ip_block_hw_fini(struct amdgpu_ip_block *ip_block)
3320 {
3321         int r;
3322
3323         if (!ip_block->version->funcs->hw_fini) {
3324                 DRM_ERROR("hw_fini of IP block <%s> not defined\n",
3325                           ip_block->version->funcs->name);
3326         } else {
3327                 r = ip_block->version->funcs->hw_fini(ip_block);
3328                 /* XXX handle errors */
3329                 if (r) {
3330                         DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
3331                                   ip_block->version->funcs->name, r);
3332                 }
3333         }
3334
3335         ip_block->status.hw = false;
3336 }
3337
3338 /**
3339  * amdgpu_device_smu_fini_early - smu hw_fini wrapper
3340  *
3341  * @adev: amdgpu_device pointer
3342  *
3343  * For ASICs that need the SMC disabled first
3344  */
3345 static void amdgpu_device_smu_fini_early(struct amdgpu_device *adev)
3346 {
3347         int i;
3348
3349         if (amdgpu_ip_version(adev, GC_HWIP, 0) > IP_VERSION(9, 0, 0))
3350                 return;
3351
3352         for (i = 0; i < adev->num_ip_blocks; i++) {
3353                 if (!adev->ip_blocks[i].status.hw)
3354                         continue;
3355                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3356                         amdgpu_ip_block_hw_fini(&adev->ip_blocks[i]);
3357                         break;
3358                 }
3359         }
3360 }
3361
3362 static int amdgpu_device_ip_fini_early(struct amdgpu_device *adev)
3363 {
3364         int i, r;
3365
3366         for (i = 0; i < adev->num_ip_blocks; i++) {
3367                 if (!adev->ip_blocks[i].version->funcs->early_fini)
3368                         continue;
3369
3370                 r = adev->ip_blocks[i].version->funcs->early_fini(&adev->ip_blocks[i]);
3371                 if (r) {
3372                         DRM_DEBUG("early_fini of IP block <%s> failed %d\n",
3373                                   adev->ip_blocks[i].version->funcs->name, r);
3374                 }
3375         }
3376
3377         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
3378         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
3379
3380         amdgpu_amdkfd_suspend(adev, false);
3381
3382         /* Workaround for ASICs that need to disable the SMC first */
3383         amdgpu_device_smu_fini_early(adev);
3384
3385         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3386                 if (!adev->ip_blocks[i].status.hw)
3387                         continue;
3388
3389                 amdgpu_ip_block_hw_fini(&adev->ip_blocks[i]);
3390         }
3391
3392         if (amdgpu_sriov_vf(adev)) {
3393                 if (amdgpu_virt_release_full_gpu(adev, false))
3394                         DRM_ERROR("failed to release exclusive mode on fini\n");
3395         }
3396
3397         return 0;
3398 }
3399
3400 /**
3401  * amdgpu_device_ip_fini - run fini for hardware IPs
3402  *
3403  * @adev: amdgpu_device pointer
3404  *
3405  * Main teardown pass for hardware IPs.  The list of all the hardware
3406  * IPs that make up the asic is walked and the hw_fini and sw_fini callbacks
3407  * are run.  hw_fini tears down the hardware associated with each IP
3408  * and sw_fini tears down any software state associated with each IP.
3409  * Returns 0 on success, negative error code on failure.
3410  */
3411 static int amdgpu_device_ip_fini(struct amdgpu_device *adev)
3412 {
3413         int i, r;
3414
3415         if (amdgpu_sriov_vf(adev) && adev->virt.ras_init_done)
3416                 amdgpu_virt_release_ras_err_handler_data(adev);
3417
3418         if (adev->gmc.xgmi.num_physical_nodes > 1)
3419                 amdgpu_xgmi_remove_device(adev);
3420
3421         amdgpu_amdkfd_device_fini_sw(adev);
3422
3423         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3424                 if (!adev->ip_blocks[i].status.sw)
3425                         continue;
3426
3427                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
3428                         amdgpu_ucode_free_bo(adev);
3429                         amdgpu_free_static_csa(&adev->virt.csa_obj);
3430                         amdgpu_device_wb_fini(adev);
3431                         amdgpu_device_mem_scratch_fini(adev);
3432                         amdgpu_ib_pool_fini(adev);
3433                         amdgpu_seq64_fini(adev);
3434                 }
3435                 if (adev->ip_blocks[i].version->funcs->sw_fini) {
3436                         r = adev->ip_blocks[i].version->funcs->sw_fini(&adev->ip_blocks[i]);
3437                         /* XXX handle errors */
3438                         if (r) {
3439                                 DRM_DEBUG("sw_fini of IP block <%s> failed %d\n",
3440                                           adev->ip_blocks[i].version->funcs->name, r);
3441                         }
3442                 }
3443                 adev->ip_blocks[i].status.sw = false;
3444                 adev->ip_blocks[i].status.valid = false;
3445         }
3446
3447         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3448                 if (!adev->ip_blocks[i].status.late_initialized)
3449                         continue;
3450                 if (adev->ip_blocks[i].version->funcs->late_fini)
3451                         adev->ip_blocks[i].version->funcs->late_fini(&adev->ip_blocks[i]);
3452                 adev->ip_blocks[i].status.late_initialized = false;
3453         }
3454
3455         amdgpu_ras_fini(adev);
3456
3457         return 0;
3458 }
3459
3460 /**
3461  * amdgpu_device_delayed_init_work_handler - work handler for IB tests
3462  *
3463  * @work: work_struct.
3464  */
3465 static void amdgpu_device_delayed_init_work_handler(struct work_struct *work)
3466 {
3467         struct amdgpu_device *adev =
3468                 container_of(work, struct amdgpu_device, delayed_init_work.work);
3469         int r;
3470
3471         r = amdgpu_ib_ring_tests(adev);
3472         if (r)
3473                 DRM_ERROR("ib ring test failed (%d).\n", r);
3474 }
3475
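/*
 * Delayed-work handler that actually allows the GFX block to enter GFXOFF
 * via the SMU.  By the time it runs, the GFXOFF request count must have
 * dropped back to zero, hence the WARN_ON_ONCE checks below.
 */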
3476 static void amdgpu_device_delay_enable_gfx_off(struct work_struct *work)
3477 {
3478         struct amdgpu_device *adev =
3479                 container_of(work, struct amdgpu_device, gfx.gfx_off_delay_work.work);
3480
3481         WARN_ON_ONCE(adev->gfx.gfx_off_state);
3482         WARN_ON_ONCE(adev->gfx.gfx_off_req_count);
3483
3484         if (!amdgpu_dpm_set_powergating_by_smu(adev, AMD_IP_BLOCK_TYPE_GFX, true))
3485                 adev->gfx.gfx_off_state = true;
3486 }
3487
3488 /**
3489  * amdgpu_device_ip_suspend_phase1 - run suspend for hardware IPs (phase 1)
3490  *
3491  * @adev: amdgpu_device pointer
3492  *
3493  * Main suspend function for hardware IPs.  The list of all the hardware
3494  * IPs that make up the asic is walked, clockgating is disabled and the
3495  * suspend callbacks are run.  suspend puts the hardware and software state
3496  * in each IP into a state suitable for suspend.
3497  * Returns 0 on success, negative error code on failure.
3498  */
3499 static int amdgpu_device_ip_suspend_phase1(struct amdgpu_device *adev)
3500 {
3501         int i, r;
3502
3503         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
3504         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
3505
3506         /*
3507          * Per the PMFW team's suggestion, the driver needs to disable the
3508          * gfxoff and DF C-state features in GPU reset scenarios (e.g.
3509          * Mode1 reset).  Add the missing DF C-state disablement here.
3510          */
3511         if (amdgpu_dpm_set_df_cstate(adev, DF_CSTATE_DISALLOW))
3512                 dev_warn(adev->dev, "Failed to disallow df cstate");
3513
3514         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3515                 if (!adev->ip_blocks[i].status.valid)
3516                         continue;
3517
3518                 /* displays are handled separately */
3519                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_DCE)
3520                         continue;
3521
3522                 /* XXX handle errors */
3523                 r = amdgpu_ip_block_suspend(&adev->ip_blocks[i]);
3524                 if (r)
3525                         return r;
3526         }
3527
3528         return 0;
3529 }
3530
3531 /**
3532  * amdgpu_device_ip_suspend_phase2 - run suspend for hardware IPs (phase 2)
3533  *
3534  * @adev: amdgpu_device pointer
3535  *
3536  * Main suspend function for hardware IPs.  The list of all the hardware
3537  * IPs that make up the asic is walked, clockgating is disabled and the
3538  * suspend callbacks are run.  suspend puts the hardware and software state
3539  * in each IP into a state suitable for suspend.
3540  * Returns 0 on success, negative error code on failure.
3541  */
3542 static int amdgpu_device_ip_suspend_phase2(struct amdgpu_device *adev)
3543 {
3544         int i, r;
3545
3546         if (adev->in_s0ix)
3547                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D3Entry);
3548
3549         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3550                 if (!adev->ip_blocks[i].status.valid)
3551                         continue;
3552                 /* displays are handled in phase1 */
3553                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE)
3554                         continue;
3555                 /* PSP lost connection when err_event_athub occurs */
3556                 if (amdgpu_ras_intr_triggered() &&
3557                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
3558                         adev->ip_blocks[i].status.hw = false;
3559                         continue;
3560                 }
3561
3562                 /* skip unnecessary suspend if we have not initialized them yet */
3563                 if (!amdgpu_ip_member_of_hwini(
3564                             adev, adev->ip_blocks[i].version->type))
3565                         continue;
3566
3567                 /* skip suspend of gfx/mes and psp for S0ix;
3568                  * gfx is in the gfxoff state, so on resume it will exit gfxoff just
3569                  * like at runtime. PSP is also part of the always-on hardware,
3570                  * so there is no need to suspend it.
3571                  */
3572                 if (adev->in_s0ix &&
3573                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP ||
3574                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3575                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_MES))
3576                         continue;
3577
3578                 /* SDMA 5.x+ is part of GFX power domain so it's covered by GFXOFF */
3579                 if (adev->in_s0ix &&
3580                     (amdgpu_ip_version(adev, SDMA0_HWIP, 0) >=
3581                      IP_VERSION(5, 0, 0)) &&
3582                     (adev->ip_blocks[i].version->type ==
3583                      AMD_IP_BLOCK_TYPE_SDMA))
3584                         continue;
3585
3586                 /* During cold boot, swPSP provides the IMU and RLC FW binaries to TOS.
3587                  * These live in the TMR and are expected to be reused by PSP-TOS, which
3588                  * reloads them from this location; RLC autoload is likewise loaded from
3589                  * here based on the PMFW -> PSP message during the re-init sequence.
3590                  * Therefore, PSP suspend & resume should be skipped to avoid destroying
3591                  * the TMR and reloading the FWs again on IMU-enabled APU ASICs.
3592                  */
3593                 if (amdgpu_in_reset(adev) &&
3594                     (adev->flags & AMD_IS_APU) && adev->gfx.imu.funcs &&
3595                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3596                         continue;
3597
3598                 /* XXX handle errors */
3599                 r = amdgpu_ip_block_suspend(&adev->ip_blocks[i]);
3600                 adev->ip_blocks[i].status.hw = false;
3601
3602                 /* handle putting the SMC in the appropriate state */
3603                 if (!amdgpu_sriov_vf(adev)) {
3604                         if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3605                                 r = amdgpu_dpm_set_mp1_state(adev, adev->mp1_state);
3606                                 if (r) {
3607                                         DRM_ERROR("SMC failed to set mp1 state %d, %d\n",
3608                                                         adev->mp1_state, r);
3609                                         return r;
3610                                 }
3611                         }
3612                 }
3613         }
3614
3615         return 0;
3616 }
3617
3618 /**
3619  * amdgpu_device_ip_suspend - run suspend for hardware IPs
3620  *
3621  * @adev: amdgpu_device pointer
3622  *
3623  * Main suspend function for hardware IPs.  The list of all the hardware
3624  * IPs that make up the asic is walked, clockgating is disabled and the
3625  * suspend callbacks are run.  suspend puts the hardware and software state
3626  * in each IP into a state suitable for suspend.
3627  * Returns 0 on success, negative error code on failure.
3628  */
3629 int amdgpu_device_ip_suspend(struct amdgpu_device *adev)
3630 {
3631         int r;
3632
3633         if (amdgpu_sriov_vf(adev)) {
3634                 amdgpu_virt_fini_data_exchange(adev);
3635                 amdgpu_virt_request_full_gpu(adev, false);
3636         }
3637
3638         amdgpu_ttm_set_buffer_funcs_status(adev, false);
3639
3640         r = amdgpu_device_ip_suspend_phase1(adev);
3641         if (r)
3642                 return r;
3643         r = amdgpu_device_ip_suspend_phase2(adev);
3644
3645         if (amdgpu_sriov_vf(adev))
3646                 amdgpu_virt_release_full_gpu(adev, false);
3647
3648         return r;
3649 }
3650
3651 static int amdgpu_device_ip_reinit_early_sriov(struct amdgpu_device *adev)
3652 {
3653         int i, r;
3654
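	/* During SR-IOV reset these early blocks must come back up in this
	 * fixed dependency order before anything else is re-initialized.
	 */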
3655         static enum amd_ip_block_type ip_order[] = {
3656                 AMD_IP_BLOCK_TYPE_COMMON,
3657                 AMD_IP_BLOCK_TYPE_GMC,
3658                 AMD_IP_BLOCK_TYPE_PSP,
3659                 AMD_IP_BLOCK_TYPE_IH,
3660         };
3661
3662         for (i = 0; i < adev->num_ip_blocks; i++) {
3663                 int j;
3664                 struct amdgpu_ip_block *block;
3665
3666                 block = &adev->ip_blocks[i];
3667                 block->status.hw = false;
3668
3669                 for (j = 0; j < ARRAY_SIZE(ip_order); j++) {
3670
3671                         if (block->version->type != ip_order[j] ||
3672                                 !block->status.valid)
3673                                 continue;
3674
3675                         r = block->version->funcs->hw_init(&adev->ip_blocks[i]);
3676                         if (r) {
3677                                 dev_err(adev->dev, "RE-INIT-early: %s failed\n",
3678                                          block->version->funcs->name);
3679                                 return r;
3680                         }
3681                         block->status.hw = true;
3682                 }
3683         }
3684
3685         return 0;
3686 }
3687
3688 static int amdgpu_device_ip_reinit_late_sriov(struct amdgpu_device *adev)
3689 {
3690         struct amdgpu_ip_block *block;
3691         int i, r = 0;
3692
3693         static enum amd_ip_block_type ip_order[] = {
3694                 AMD_IP_BLOCK_TYPE_SMC,
3695                 AMD_IP_BLOCK_TYPE_DCE,
3696                 AMD_IP_BLOCK_TYPE_GFX,
3697                 AMD_IP_BLOCK_TYPE_SDMA,
3698                 AMD_IP_BLOCK_TYPE_MES,
3699                 AMD_IP_BLOCK_TYPE_UVD,
3700                 AMD_IP_BLOCK_TYPE_VCE,
3701                 AMD_IP_BLOCK_TYPE_VCN,
3702                 AMD_IP_BLOCK_TYPE_JPEG
3703         };
3704
3705         for (i = 0; i < ARRAY_SIZE(ip_order); i++) {
3706                 block = amdgpu_device_ip_get_ip_block(adev, ip_order[i]);
3707
3708                 if (!block)
3709                         continue;
3710
3711                 if (block->status.valid && !block->status.hw) {
3712                         if (block->version->type == AMD_IP_BLOCK_TYPE_SMC) {
3713                                 r = amdgpu_ip_block_resume(block);
3714                         } else {
3715                                 r = block->version->funcs->hw_init(block);
3716                         }
3717
3718                         if (r) {
3719                                 dev_err(adev->dev, "RE-INIT-late: %s failed\n",
3720                                          block->version->funcs->name);
3721                                 break;
3722                         }
3723                         block->status.hw = true;
3724                 }
3725         }
3726
3727         return r;
3728 }
3729
3730 /**
3731  * amdgpu_device_ip_resume_phase1 - run resume for hardware IPs
3732  *
3733  * @adev: amdgpu_device pointer
3734  *
3735  * First resume function for hardware IPs.  The list of all the hardware
3736  * IPs that make up the asic is walked and the resume callbacks are run for
3737  * COMMON, GMC, and IH.  resume puts the hardware into a functional state
3738  * after a suspend and updates the software state as necessary.  This
3739  * function is also used for restoring the GPU after a GPU reset.
3740  * Returns 0 on success, negative error code on failure.
3741  */
3742 static int amdgpu_device_ip_resume_phase1(struct amdgpu_device *adev)
3743 {
3744         int i, r;
3745
3746         for (i = 0; i < adev->num_ip_blocks; i++) {
3747                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3748                         continue;
3749                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3750                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3751                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3752                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP && amdgpu_sriov_vf(adev))) {
3753
3754                         r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
3755                         if (r)
3756                                 return r;
3757                 }
3758         }
3759
3760         return 0;
3761 }
3762
3763 /**
3764  * amdgpu_device_ip_resume_phase2 - run resume for hardware IPs
3765  *
3766  * @adev: amdgpu_device pointer
3767  *
3768  * Second resume function for hardware IPs.  The list of all the hardware
3769  * IPs that make up the asic is walked and the resume callbacks are run for
3770  * all blocks except COMMON, GMC, and IH.  resume puts the hardware into a
3771  * functional state after a suspend and updates the software state as
3772  * necessary.  This function is also used for restoring the GPU after a GPU
3773  * reset.
3774  * Returns 0 on success, negative error code on failure.
3775  */
3776 static int amdgpu_device_ip_resume_phase2(struct amdgpu_device *adev)
3777 {
3778         int i, r;
3779
3780         for (i = 0; i < adev->num_ip_blocks; i++) {
3781                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3782                         continue;
3783                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3784                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3785                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3786                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE ||
3787                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3788                         continue;
3789                 r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
3790                 if (r)
3791                         return r;
3792         }
3793
3794         return 0;
3795 }
3796
3797 /**
3798  * amdgpu_device_ip_resume_phase3 - run resume for hardware IPs
3799  *
3800  * @adev: amdgpu_device pointer
3801  *
3802  * Third resume function for hardware IPs.  The list of all the hardware
3803  * IPs that make up the asic is walked and the resume callbacks are run for
3804  * all DCE.  resume puts the hardware into a functional state after a suspend
3805  * and updates the software state as necessary.  This function is also used
3806  * for restoring the GPU after a GPU reset.
3807  *
3808  * Returns 0 on success, negative error code on failure.
3809  */
3810 static int amdgpu_device_ip_resume_phase3(struct amdgpu_device *adev)
3811 {
3812         int i, r;
3813
3814         for (i = 0; i < adev->num_ip_blocks; i++) {
3815                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3816                         continue;
3817                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) {
3818                         r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
3819                         if (r)
3820                                 return r;
3821                 }
3822         }
3823
3824         return 0;
3825 }
3826
3827 /**
3828  * amdgpu_device_ip_resume - run resume for hardware IPs
3829  *
3830  * @adev: amdgpu_device pointer
3831  *
3832  * Main resume function for hardware IPs.  The hardware IPs
3833  * are split into several resume phases because they are
3834  * also used in recovering from a GPU reset, where additional
3835  * steps need to be taken between them.  In this case (S3/S4) the
3836  * phases are run sequentially.
3837  * Returns 0 on success, negative error code on failure.
3838  */
3839 static int amdgpu_device_ip_resume(struct amdgpu_device *adev)
3840 {
3841         int r;
3842
3843         r = amdgpu_device_ip_resume_phase1(adev);
3844         if (r)
3845                 return r;
3846
3847         r = amdgpu_device_fw_loading(adev);
3848         if (r)
3849                 return r;
3850
3851         r = amdgpu_device_ip_resume_phase2(adev);
3852
3853         if (adev->mman.buffer_funcs_ring->sched.ready)
3854                 amdgpu_ttm_set_buffer_funcs_status(adev, true);
3855
3856         if (r)
3857                 return r;
3858
3859         amdgpu_fence_driver_hw_init(adev);
3860
3861         r = amdgpu_device_ip_resume_phase3(adev);
3862
3863         return r;
3864 }
3865
3866 /**
3867  * amdgpu_device_detect_sriov_bios - determine if the board supports SR-IOV
3868  *
3869  * @adev: amdgpu_device pointer
3870  *
3871  * Query the VBIOS data tables to determine if the board supports SR-IOV.
3872  */
3873 static void amdgpu_device_detect_sriov_bios(struct amdgpu_device *adev)
3874 {
3875         if (amdgpu_sriov_vf(adev)) {
3876                 if (adev->is_atom_fw) {
3877                         if (amdgpu_atomfirmware_gpu_virtualization_supported(adev))
3878                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3879                 } else {
3880                         if (amdgpu_atombios_has_gpu_virtualization_table(adev))
3881                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3882                 }
3883
3884                 if (!(adev->virt.caps & AMDGPU_SRIOV_CAPS_SRIOV_VBIOS))
3885                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_NO_VBIOS, 0, 0);
3886         }
3887 }
3888
3889 /**
3890  * amdgpu_device_asic_has_dc_support - determine if DC supports the asic
3891  *
3892  * @asic_type: AMD asic type
3893  *
3894  * Check if there is DC (new modesetting infrastructure) support for an asic.
3895  * Returns true if DC has support, false if not.
3896  */
3897 bool amdgpu_device_asic_has_dc_support(enum amd_asic_type asic_type)
3898 {
3899         switch (asic_type) {
3900 #ifdef CONFIG_DRM_AMDGPU_SI
3901         case CHIP_HAINAN:
3902 #endif
3903         case CHIP_TOPAZ:
3904                 /* chips with no display hardware */
3905                 return false;
3906 #if defined(CONFIG_DRM_AMD_DC)
3907         case CHIP_TAHITI:
3908         case CHIP_PITCAIRN:
3909         case CHIP_VERDE:
3910         case CHIP_OLAND:
3911                 /*
3912                  * We have systems in the wild with these ASICs that require
3913                  * LVDS and VGA support which is not supported with DC.
3914                  *
3915                  * Fall back to the non-DC driver here by default so as not to
3916                  * cause regressions.
3917                  */
3918 #if defined(CONFIG_DRM_AMD_DC_SI)
3919                 return amdgpu_dc > 0;
3920 #else
3921                 return false;
3922 #endif
3923         case CHIP_BONAIRE:
3924         case CHIP_KAVERI:
3925         case CHIP_KABINI:
3926         case CHIP_MULLINS:
3927                 /*
3928                  * We have systems in the wild with these ASICs that require
3929                  * VGA support which is not supported with DC.
3930                  *
3931                  * Fall back to the non-DC driver here by default so as not to
3932                  * cause regressions.
3933                  */
3934                 return amdgpu_dc > 0;
3935         default:
3936                 return amdgpu_dc != 0;
3937 #else
3938         default:
3939                 if (amdgpu_dc > 0)
3940                         DRM_INFO_ONCE("Display Core has been requested via kernel parameter but isn't supported by ASIC, ignoring\n");
3941                 return false;
3942 #endif
3943         }
3944 }
3945
3946 /**
3947  * amdgpu_device_has_dc_support - check if dc is supported
3948  *
3949  * @adev: amdgpu_device pointer
3950  *
3951  * Returns true for supported, false for not supported
3952  */
3953 bool amdgpu_device_has_dc_support(struct amdgpu_device *adev)
3954 {
3955         if (adev->enable_virtual_display ||
3956             (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
3957                 return false;
3958
3959         return amdgpu_device_asic_has_dc_support(adev->asic_type);
3960 }
3961
3962 static void amdgpu_device_xgmi_reset_func(struct work_struct *__work)
3963 {
3964         struct amdgpu_device *adev =
3965                 container_of(__work, struct amdgpu_device, xgmi_reset_work);
3966         struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3967
3968         /* It's a bug to not have a hive within this function */
3969         if (WARN_ON(!hive))
3970                 return;
3971
3972         /*
3973          * Use task barrier to synchronize all xgmi reset works across the
3974          * hive. task_barrier_enter and task_barrier_exit will block
3975          * until all the threads running the xgmi reset works reach
3976          * those points. task_barrier_full will do both blocks.
3977          */
3978         if (amdgpu_asic_reset_method(adev) == AMD_RESET_METHOD_BACO) {
3979
3980                 task_barrier_enter(&hive->tb);
3981                 adev->asic_reset_res = amdgpu_device_baco_enter(adev_to_drm(adev));
3982
3983                 if (adev->asic_reset_res)
3984                         goto fail;
3985
3986                 task_barrier_exit(&hive->tb);
3987                 adev->asic_reset_res = amdgpu_device_baco_exit(adev_to_drm(adev));
3988
3989                 if (adev->asic_reset_res)
3990                         goto fail;
3991
3992                 amdgpu_ras_reset_error_count(adev, AMDGPU_RAS_BLOCK__MMHUB);
3993         } else {
3994
3995                 task_barrier_full(&hive->tb);
3996                 adev->asic_reset_res =  amdgpu_asic_reset(adev);
3997         }
3998
3999 fail:
4000         if (adev->asic_reset_res)
4001                 DRM_WARN("ASIC reset failed with error %d for drm dev %s",
4002                          adev->asic_reset_res, adev_to_drm(adev)->unique);
4003         amdgpu_put_xgmi_hive(hive);
4004 }
4005
4006 static int amdgpu_device_get_job_timeout_settings(struct amdgpu_device *adev)
4007 {
4008         char *input = amdgpu_lockup_timeout;
4009         char *timeout_setting = NULL;
4010         int index = 0;
4011         long timeout;
4012         int ret = 0;
4013
4014         /*
4015          * By default the timeout for non-compute jobs is 10000 ms
4016          * and 60000 ms for compute jobs.
4017          * Under SR-IOV the default compute timeout is 60000 ms only
4018          * in one-VF mode, otherwise 10000 ms.
4019          */
4020         adev->gfx_timeout = msecs_to_jiffies(10000);
4021         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
4022         if (amdgpu_sriov_vf(adev))
4023                 adev->compute_timeout = amdgpu_sriov_is_pp_one_vf(adev) ?
4024                                         msecs_to_jiffies(60000) : msecs_to_jiffies(10000);
4025         else
4026                 adev->compute_timeout =  msecs_to_jiffies(60000);
4027
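	/*
	 * Illustrative example (values in ms): booting with
	 * amdgpu.lockup_timeout=10000,60000,10000,10000 sets the gfx,
	 * compute, sdma and video timeouts in that order, matching the
	 * switch below.  A value of 0 keeps the default; a negative value
	 * disables the timeout entirely.
	 */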
4028         if (strnlen(input, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
4029                 while ((timeout_setting = strsep(&input, ",")) &&
4030                                 strnlen(timeout_setting, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
4031                         ret = kstrtol(timeout_setting, 0, &timeout);
4032                         if (ret)
4033                                 return ret;
4034
4035                         if (timeout == 0) {
4036                                 index++;
4037                                 continue;
4038                         } else if (timeout < 0) {
4039                                 timeout = MAX_SCHEDULE_TIMEOUT;
4040                                 dev_warn(adev->dev, "lockup timeout disabled");
4041                                 add_taint(TAINT_SOFTLOCKUP, LOCKDEP_STILL_OK);
4042                         } else {
4043                                 timeout = msecs_to_jiffies(timeout);
4044                         }
4045
4046                         switch (index++) {
4047                         case 0:
4048                                 adev->gfx_timeout = timeout;
4049                                 break;
4050                         case 1:
4051                                 adev->compute_timeout = timeout;
4052                                 break;
4053                         case 2:
4054                                 adev->sdma_timeout = timeout;
4055                                 break;
4056                         case 3:
4057                                 adev->video_timeout = timeout;
4058                                 break;
4059                         default:
4060                                 break;
4061                         }
4062                 }
4063                 /*
4064                  * There is only one value specified and
4065                  * it should apply to all non-compute jobs.
4066                  */
4067                 if (index == 1) {
4068                         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
4069                         if (amdgpu_sriov_vf(adev) || amdgpu_passthrough(adev))
4070                                 adev->compute_timeout = adev->gfx_timeout;
4071                 }
4072         }
4073
4074         return ret;
4075 }
4076
4077 /**
4078  * amdgpu_device_check_iommu_direct_map - check if RAM direct mapped to GPU
4079  *
4080  * @adev: amdgpu_device pointer
4081  *
4082  * RAM is direct mapped to the GPU if the IOMMU is disabled or in passthrough mode
4083  */
4084 static void amdgpu_device_check_iommu_direct_map(struct amdgpu_device *adev)
4085 {
4086         struct iommu_domain *domain;
4087
4088         domain = iommu_get_domain_for_dev(adev->dev);
4089         if (!domain || domain->type == IOMMU_DOMAIN_IDENTITY)
4090                 adev->ram_is_direct_mapped = true;
4091 }
4092
4093 #if defined(CONFIG_HSA_AMD_P2P)
4094 /**
4095  * amdgpu_device_check_iommu_remap - Check if DMA remapping is enabled.
4096  *
4097  * @adev: amdgpu_device pointer
4098  *
4099  * Returns true if the IOMMU is remapping BAR/DMA addresses, false otherwise.
4100  */
4101 static bool amdgpu_device_check_iommu_remap(struct amdgpu_device *adev)
4102 {
4103         struct iommu_domain *domain;
4104
4105         domain = iommu_get_domain_for_dev(adev->dev);
4106         if (domain && (domain->type == IOMMU_DOMAIN_DMA ||
4107                 domain->type == IOMMU_DOMAIN_DMA_FQ))
4108                 return true;
4109
4110         return false;
4111 }
4112 #endif
4113
4114 static const struct attribute *amdgpu_dev_attributes[] = {
4115         &dev_attr_pcie_replay_count.attr,
4116         NULL
4117 };
4118
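/*
 * Mid-Command-Buffer Preemption (MCBP): honor the amdgpu_mcbp module
 * parameter when it is set explicitly, and always enable MCBP under
 * SR-IOV.
 */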
4119 static void amdgpu_device_set_mcbp(struct amdgpu_device *adev)
4120 {
4121         if (amdgpu_mcbp == 1)
4122                 adev->gfx.mcbp = true;
4123         else if (amdgpu_mcbp == 0)
4124                 adev->gfx.mcbp = false;
4125
4126         if (amdgpu_sriov_vf(adev))
4127                 adev->gfx.mcbp = true;
4128
4129         if (adev->gfx.mcbp)
4130                 DRM_INFO("MCBP is enabled\n");
4131 }
4132
4133 /**
4134  * amdgpu_device_init - initialize the driver
4135  *
4136  * @adev: amdgpu_device pointer
4137  * @flags: driver flags
4138  *
4139  * Initializes the driver info and hw (all asics).
4140  * Returns 0 for success or an error on failure.
4141  * Called at driver startup.
4142  */
4143 int amdgpu_device_init(struct amdgpu_device *adev,
4144                        uint32_t flags)
4145 {
4146         struct drm_device *ddev = adev_to_drm(adev);
4147         struct pci_dev *pdev = adev->pdev;
4148         int r, i;
4149         bool px = false;
4150         u32 max_MBps;
4151         int tmp;
4152
4153         adev->shutdown = false;
4154         adev->flags = flags;
4155
4156         if (amdgpu_force_asic_type >= 0 && amdgpu_force_asic_type < CHIP_LAST)
4157                 adev->asic_type = amdgpu_force_asic_type;
4158         else
4159                 adev->asic_type = flags & AMD_ASIC_MASK;
4160
4161         adev->usec_timeout = AMDGPU_MAX_USEC_TIMEOUT;
4162         if (amdgpu_emu_mode == 1)
4163                 adev->usec_timeout *= 10;
4164         adev->gmc.gart_size = 512 * 1024 * 1024;
4165         adev->accel_working = false;
4166         adev->num_rings = 0;
4167         RCU_INIT_POINTER(adev->gang_submit, dma_fence_get_stub());
4168         adev->mman.buffer_funcs = NULL;
4169         adev->mman.buffer_funcs_ring = NULL;
4170         adev->vm_manager.vm_pte_funcs = NULL;
4171         adev->vm_manager.vm_pte_num_scheds = 0;
4172         adev->gmc.gmc_funcs = NULL;
4173         adev->harvest_ip_mask = 0x0;
4174         adev->fence_context = dma_fence_context_alloc(AMDGPU_MAX_RINGS);
4175         bitmap_zero(adev->gfx.pipe_reserve_bitmap, AMDGPU_MAX_COMPUTE_QUEUES);
4176
4177         adev->smc_rreg = &amdgpu_invalid_rreg;
4178         adev->smc_wreg = &amdgpu_invalid_wreg;
4179         adev->pcie_rreg = &amdgpu_invalid_rreg;
4180         adev->pcie_wreg = &amdgpu_invalid_wreg;
4181         adev->pcie_rreg_ext = &amdgpu_invalid_rreg_ext;
4182         adev->pcie_wreg_ext = &amdgpu_invalid_wreg_ext;
4183         adev->pciep_rreg = &amdgpu_invalid_rreg;
4184         adev->pciep_wreg = &amdgpu_invalid_wreg;
4185         adev->pcie_rreg64 = &amdgpu_invalid_rreg64;
4186         adev->pcie_wreg64 = &amdgpu_invalid_wreg64;
4187         adev->pcie_rreg64_ext = &amdgpu_invalid_rreg64_ext;
4188         adev->pcie_wreg64_ext = &amdgpu_invalid_wreg64_ext;
4189         adev->uvd_ctx_rreg = &amdgpu_invalid_rreg;
4190         adev->uvd_ctx_wreg = &amdgpu_invalid_wreg;
4191         adev->didt_rreg = &amdgpu_invalid_rreg;
4192         adev->didt_wreg = &amdgpu_invalid_wreg;
4193         adev->gc_cac_rreg = &amdgpu_invalid_rreg;
4194         adev->gc_cac_wreg = &amdgpu_invalid_wreg;
4195         adev->audio_endpt_rreg = &amdgpu_block_invalid_rreg;
4196         adev->audio_endpt_wreg = &amdgpu_block_invalid_wreg;
4197
4198         DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
4199                  amdgpu_asic_name[adev->asic_type], pdev->vendor, pdev->device,
4200                  pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
4201
4202         /* mutex initialization is all done here so we
4203          * can call these functions again without locking issues
4204          */
4205         mutex_init(&adev->firmware.mutex);
4206         mutex_init(&adev->pm.mutex);
4207         mutex_init(&adev->gfx.gpu_clock_mutex);
4208         mutex_init(&adev->srbm_mutex);
4209         mutex_init(&adev->gfx.pipe_reserve_mutex);
4210         mutex_init(&adev->gfx.gfx_off_mutex);
4211         mutex_init(&adev->gfx.partition_mutex);
4212         mutex_init(&adev->grbm_idx_mutex);
4213         mutex_init(&adev->mn_lock);
4214         mutex_init(&adev->virt.vf_errors.lock);
4215         mutex_init(&adev->virt.rlcg_reg_lock);
4216         hash_init(adev->mn_hash);
4217         mutex_init(&adev->psp.mutex);
4218         mutex_init(&adev->notifier_lock);
4219         mutex_init(&adev->pm.stable_pstate_ctx_lock);
4220         mutex_init(&adev->benchmark_mutex);
4221         mutex_init(&adev->gfx.reset_sem_mutex);
4222         /* Initialize the mutex for cleaner shader isolation between GFX and compute processes */
4223         mutex_init(&adev->enforce_isolation_mutex);
4224         mutex_init(&adev->gfx.kfd_sch_mutex);
4225
4226         amdgpu_device_init_apu_flags(adev);
4227
4228         r = amdgpu_device_check_arguments(adev);
4229         if (r)
4230                 return r;
4231
4232         spin_lock_init(&adev->mmio_idx_lock);
4233         spin_lock_init(&adev->smc_idx_lock);
4234         spin_lock_init(&adev->pcie_idx_lock);
4235         spin_lock_init(&adev->uvd_ctx_idx_lock);
4236         spin_lock_init(&adev->didt_idx_lock);
4237         spin_lock_init(&adev->gc_cac_idx_lock);
4238         spin_lock_init(&adev->se_cac_idx_lock);
4239         spin_lock_init(&adev->audio_endpt_idx_lock);
4240         spin_lock_init(&adev->mm_stats.lock);
4241         spin_lock_init(&adev->wb.lock);
4242
4243         INIT_LIST_HEAD(&adev->reset_list);
4244
4245         INIT_LIST_HEAD(&adev->ras_list);
4246
4247         INIT_LIST_HEAD(&adev->pm.od_kobj_list);
4248
4249         INIT_DELAYED_WORK(&adev->delayed_init_work,
4250                           amdgpu_device_delayed_init_work_handler);
4251         INIT_DELAYED_WORK(&adev->gfx.gfx_off_delay_work,
4252                           amdgpu_device_delay_enable_gfx_off);
4253         /*
4254          * Initialize the enforce_isolation work structures for each XCP
4255          * partition.  This work handler is responsible for enforcing shader
4256          * isolation on AMD GPUs.  It counts the number of emitted fences for
4257          * each GFX and compute ring.  If there are any fences, it schedules
4258          * the `enforce_isolation_work` to be run after a delay.  If there are
4259          * no fences, it signals the Kernel Fusion Driver (KFD) to resume the
4260          * runqueue.
4261          */
4262         for (i = 0; i < MAX_XCP; i++) {
4263                 INIT_DELAYED_WORK(&adev->gfx.enforce_isolation[i].work,
4264                                   amdgpu_gfx_enforce_isolation_handler);
4265                 adev->gfx.enforce_isolation[i].adev = adev;
4266                 adev->gfx.enforce_isolation[i].xcp_id = i;
4267         }
4268
4269         INIT_WORK(&adev->xgmi_reset_work, amdgpu_device_xgmi_reset_func);
4270
4271         adev->gfx.gfx_off_req_count = 1;
4272         adev->gfx.gfx_off_residency = 0;
4273         adev->gfx.gfx_off_entrycount = 0;
4274         adev->pm.ac_power = power_supply_is_system_supplied() > 0;
4275
4276         atomic_set(&adev->throttling_logging_enabled, 1);
4277         /*
4278          * If throttling continues, logging will be performed every minute
4279          * to avoid log flooding. "-1" is subtracted since the thermal
4280          * throttling interrupt comes every second. Thus, the total logging
4281          * interval is 59 seconds (ratelimited printk interval) + 1 (waiting
4282          * for the throttling interrupt) = 60 seconds. See the sketch after this function.
4283          */
4284         ratelimit_state_init(&adev->throttling_logging_rs, (60 - 1) * HZ, 1);
4285         ratelimit_state_init(&adev->virt.ras_telemetry_rs, 5 * HZ, 1);
4286
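     /* With RATELIMIT_MSG_ON_RELEASE, the "suppressed" summary is emitted
      * when the ratelimit state is released rather than at every suppressed
      * call site, which keeps the log quiet during sustained throttling.
      */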
4287         ratelimit_set_flags(&adev->throttling_logging_rs, RATELIMIT_MSG_ON_RELEASE);
4288         ratelimit_set_flags(&adev->virt.ras_telemetry_rs, RATELIMIT_MSG_ON_RELEASE);
4289
4290         /* Registers mapping */
4291         /* TODO: block userspace mapping of io register */
4292         if (adev->asic_type >= CHIP_BONAIRE) {
4293                 adev->rmmio_base = pci_resource_start(adev->pdev, 5);
4294                 adev->rmmio_size = pci_resource_len(adev->pdev, 5);
4295         } else {
4296                 adev->rmmio_base = pci_resource_start(adev->pdev, 2);
4297                 adev->rmmio_size = pci_resource_len(adev->pdev, 2);
4298         }
4299
4300         for (i = 0; i < AMD_IP_BLOCK_TYPE_NUM; i++)
4301                 atomic_set(&adev->pm.pwr_state[i], POWER_STATE_UNKNOWN);
4302
4303         adev->rmmio = ioremap(adev->rmmio_base, adev->rmmio_size);
4304         if (!adev->rmmio)
4305                 return -ENOMEM;
4306
4307         DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)adev->rmmio_base);
4308         DRM_INFO("register mmio size: %u\n", (unsigned int)adev->rmmio_size);
4309
4310         /*
4311          * Reset domain needs to be present early, before XGMI hive discovered
4312          * (if any) and intitialized to use reset sem and in_gpu reset flag
4313          * early on during init and before calling to RREG32.
4314          */
4315         adev->reset_domain = amdgpu_reset_create_reset_domain(SINGLE_DEVICE, "amdgpu-reset-dev");
4316         if (!adev->reset_domain)
4317                 return -ENOMEM;
4318
4319         /* detect hw virtualization here */
4320         amdgpu_detect_virtualization(adev);
4321
4322         amdgpu_device_get_pcie_info(adev);
4323
4324         r = amdgpu_device_get_job_timeout_settings(adev);
4325         if (r) {
4326                 dev_err(adev->dev, "invalid lockup_timeout parameter syntax\n");
4327                 return r;
4328         }
4329
4330         amdgpu_device_set_mcbp(adev);
4331
4332         /*
4333          * By default, use default mode where all blocks are expected to be
4334          * initialized. At present a 'swinit' of blocks is required to be
4335          * completed before the need for a different level is detected.
4336          */
4337         amdgpu_set_init_level(adev, AMDGPU_INIT_LEVEL_DEFAULT);
4338         /* early init functions */
4339         r = amdgpu_device_ip_early_init(adev);
4340         if (r)
4341                 return r;
4342
4343         /* Get rid of things like offb */
4344         r = aperture_remove_conflicting_pci_devices(adev->pdev, amdgpu_kms_driver.name);
4345         if (r)
4346                 return r;
4347
4348         /* Enable TMZ based on IP_VERSION */
4349         amdgpu_gmc_tmz_set(adev);
4350
4351         if (amdgpu_sriov_vf(adev) &&
4352             amdgpu_ip_version(adev, GC_HWIP, 0) >= IP_VERSION(10, 3, 0))
4353                 /* VF MMIO access (except the mailbox range) from the CPU
4354                  * will be blocked during SR-IOV runtime
4355                  */
4356                 adev->virt.caps |= AMDGPU_VF_MMIO_ACCESS_PROTECT;
4357
4358         amdgpu_gmc_noretry_set(adev);
4359         /* Need to get xgmi info early to decide the reset behavior */
4360         if (adev->gmc.xgmi.supported) {
4361                 r = adev->gfxhub.funcs->get_xgmi_info(adev);
4362                 if (r)
4363                         return r;
4364         }
4365
4366         /* enable PCIE atomic ops */
4367         if (amdgpu_sriov_vf(adev)) {
4368                 if (adev->virt.fw_reserve.p_pf2vf)
4369                         adev->have_atomics_support = ((struct amd_sriov_msg_pf2vf_info *)
4370                                                       adev->virt.fw_reserve.p_pf2vf)->pcie_atomic_ops_support_flags ==
4371                                 (PCI_EXP_DEVCAP2_ATOMIC_COMP32 | PCI_EXP_DEVCAP2_ATOMIC_COMP64);
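                     /* i.e. the VF claims atomics support only when the PF
                      * reports both 32- and 64-bit PCIe atomic completion
                      */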
4372         /* APUs with gfx9 onwards don't rely on PCIe atomics; their
4373          * internal path natively supports atomics, so set have_atomics_support to true.
4374          */
4375         } else if ((adev->flags & AMD_IS_APU) &&
4376                    (amdgpu_ip_version(adev, GC_HWIP, 0) >
4377                     IP_VERSION(9, 0, 0))) {
4378                 adev->have_atomics_support = true;
4379         } else {
4380                 adev->have_atomics_support =
4381                         !pci_enable_atomic_ops_to_root(adev->pdev,
4382                                           PCI_EXP_DEVCAP2_ATOMIC_COMP32 |
4383                                           PCI_EXP_DEVCAP2_ATOMIC_COMP64);
4384         }
4385
4386         if (!adev->have_atomics_support)
4387                 dev_info(adev->dev, "PCIE atomic ops are not supported\n");
4388
4389         /* doorbell bar mapping and doorbell index init */
4390         amdgpu_doorbell_init(adev);
4391
4392         if (amdgpu_emu_mode == 1) {
4393                 /* post the asic on emulation mode */
4394                 emu_soc_asic_init(adev);
4395                 goto fence_driver_init;
4396         }
4397
4398         amdgpu_reset_init(adev);
4399
4400         /* detect if we have an SR-IOV vBIOS */
4401         if (adev->bios)
4402                 amdgpu_device_detect_sriov_bios(adev);
4403
4404         /* check if we need to reset the asic
4405          *  E.g., driver was not cleanly unloaded previously, etc.
4406          */
4407         if (!amdgpu_sriov_vf(adev) && amdgpu_asic_need_reset_on_init(adev)) {
4408                 if (adev->gmc.xgmi.num_physical_nodes) {
4409                         dev_info(adev->dev, "Pending hive reset.\n");
4410                         amdgpu_set_init_level(adev,
4411                                               AMDGPU_INIT_LEVEL_MINIMAL_XGMI);
4412                 } else if (amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(13, 0, 10) &&
4413                            !amdgpu_device_has_display_hardware(adev)) {
4414                         r = psp_gpu_reset(adev);
4415                 } else {
4416                         tmp = amdgpu_reset_method;
4417                         /* It should do a default reset when loading or reloading the driver,
4418                          * regardless of the module parameter reset_method.
4419                          */
4420                         amdgpu_reset_method = AMD_RESET_METHOD_NONE;
4421                         r = amdgpu_asic_reset(adev);
4422                         amdgpu_reset_method = tmp;
4423                 }
4424
4425                 if (r) {
4426                         dev_err(adev->dev, "asic reset on init failed\n");
4427                         goto failed;
4428                 }
4429         }
4430
4431         /* Post card if necessary */
4432         if (amdgpu_device_need_post(adev)) {
4433                 if (!adev->bios) {
4434                         dev_err(adev->dev, "no vBIOS found\n");
4435                         r = -EINVAL;
4436                         goto failed;
4437                 }
4438                 DRM_INFO("GPU posting now...\n");
4439                 r = amdgpu_device_asic_init(adev);
4440                 if (r) {
4441                         dev_err(adev->dev, "gpu post error!\n");
4442                         goto failed;
4443                 }
4444         }
4445
4446         if (adev->bios) {
4447                 if (adev->is_atom_fw) {
4448                         /* Initialize clocks */
4449                         r = amdgpu_atomfirmware_get_clock_info(adev);
4450                         if (r) {
4451                                 dev_err(adev->dev, "amdgpu_atomfirmware_get_clock_info failed\n");
4452                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
4453                                 goto failed;
4454                         }
4455                 } else {
4456                         /* Initialize clocks */
4457                         r = amdgpu_atombios_get_clock_info(adev);
4458                         if (r) {
4459                                 dev_err(adev->dev, "amdgpu_atombios_get_clock_info failed\n");
4460                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
4461                                 goto failed;
4462                         }
4463                         /* init i2c buses */
4464                         if (!amdgpu_device_has_dc_support(adev))
4465                                 amdgpu_atombios_i2c_init(adev);
4466                 }
4467         }
4468
4469 fence_driver_init:
4470         /* Fence driver */
4471         r = amdgpu_fence_driver_sw_init(adev);
4472         if (r) {
4473                 dev_err(adev->dev, "amdgpu_fence_driver_sw_init failed\n");
4474                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_FENCE_INIT_FAIL, 0, 0);
4475                 goto failed;
4476         }
4477
4478         /* init the mode config */
4479         drm_mode_config_init(adev_to_drm(adev));
4480
4481         r = amdgpu_device_ip_init(adev);
4482         if (r) {
4483                 dev_err(adev->dev, "amdgpu_device_ip_init failed\n");
4484                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_INIT_FAIL, 0, 0);
4485                 goto release_ras_con;
4486         }
4487
4488         amdgpu_fence_driver_hw_init(adev);
4489
4490         dev_info(adev->dev,
4491                 "SE %d, SH per SE %d, CU per SH %d, active_cu_number %d\n",
4492                         adev->gfx.config.max_shader_engines,
4493                         adev->gfx.config.max_sh_per_se,
4494                         adev->gfx.config.max_cu_per_sh,
4495                         adev->gfx.cu_info.number);
4496
4497         adev->accel_working = true;
4498
4499         amdgpu_vm_check_compute_bug(adev);
4500
4501         /* Initialize the buffer migration limit. */
4502         if (amdgpu_moverate >= 0)
4503                 max_MBps = amdgpu_moverate;
4504         else
4505                 max_MBps = 8; /* Allow 8 MB/s. */
4506         /* Get a log2 for easy divisions. */
4507         adev->mm_stats.log2_max_MBps = ilog2(max(1u, max_MBps));
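     /* e.g. the default 8 MB/s gives log2_max_MBps = 3, so consumers can
      * approximate a division by the rate with a cheap right shift
      * (bytes >> log2_max_MBps) instead of a 64-bit division.
      */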
4508
4509         /*
4510          * Register the gpu instance before amdgpu_device_enable_mgpu_fan_boost.
4511          * Otherwise the mgpu fan boost feature will be skipped because the
4512          * gpu instance count would be too low.
4513          */
4514         amdgpu_register_gpu_instance(adev);
4515
4516         /* enable clockgating, etc. after ib tests, etc. since some blocks require
4517          * explicit gating rather than handling it automatically.
4518          */
4519         if (adev->init_lvl->level != AMDGPU_INIT_LEVEL_MINIMAL_XGMI) {
4520                 r = amdgpu_device_ip_late_init(adev);
4521                 if (r) {
4522                         dev_err(adev->dev, "amdgpu_device_ip_late_init failed\n");
4523                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_LATE_INIT_FAIL, 0, r);
4524                         goto release_ras_con;
4525                 }
4526                 /* must succeed. */
4527                 amdgpu_ras_resume(adev);
4528                 queue_delayed_work(system_wq, &adev->delayed_init_work,
4529                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
4530         }
4531
4532         if (amdgpu_sriov_vf(adev)) {
4533                 amdgpu_virt_release_full_gpu(adev, true);
4534                 flush_delayed_work(&adev->delayed_init_work);
4535         }
4536
4537         /*
4538          * Place the sysfs registration after `late_init`, as some of the
4539          * operations performed in `late_init` might affect the creation
4540          * of the sysfs interfaces.
4541          */
4542         r = amdgpu_atombios_sysfs_init(adev);
4543         if (r)
4544                 drm_err(&adev->ddev,
4545                         "registering atombios sysfs failed (%d).\n", r);
4546
4547         r = amdgpu_pm_sysfs_init(adev);
4548         if (r)
4549                 DRM_ERROR("registering pm sysfs failed (%d).\n", r);
4550
4551         r = amdgpu_ucode_sysfs_init(adev);
4552         if (r) {
4553                 adev->ucode_sysfs_en = false;
4554                 DRM_ERROR("Creating firmware sysfs failed (%d).\n", r);
4555         } else
4556                 adev->ucode_sysfs_en = true;
4557
4558         r = sysfs_create_files(&adev->dev->kobj, amdgpu_dev_attributes);
4559         if (r)
4560                 dev_err(adev->dev, "Could not create amdgpu device attr\n");
4561
4562         r = devm_device_add_group(adev->dev, &amdgpu_board_attrs_group);
4563         if (r)
4564                 dev_err(adev->dev,
4565                         "Could not create amdgpu board attributes\n");
4566
4567         amdgpu_fru_sysfs_init(adev);
4568         amdgpu_reg_state_sysfs_init(adev);
4569         amdgpu_xcp_cfg_sysfs_init(adev);
4570
4571         r = IS_ENABLED(CONFIG_PERF_EVENTS) ? amdgpu_pmu_init(adev) : 0;
4572
4573         if (r)
4574                 dev_err(adev->dev, "amdgpu_pmu_init failed\n");
4575
4576         /* Keep the stored PCI config space at hand for restore after a sudden PCI error */
4577         if (amdgpu_device_cache_pci_state(adev->pdev))
4578                 pci_restore_state(pdev);
4579
4580         /* if we have more than one VGA card, disable the amdgpu VGA resources */
4581         /* this will fail for cards that aren't VGA class devices, just
4582          * ignore it
4583          */
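     /* pdev->class packs base class, subclass and prog-if; shifting off the
      * low prog-if byte leaves the 16-bit pair that PCI_CLASS_DISPLAY_VGA
      * (0x0300) is compared against.
      */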
4584         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4585                 vga_client_register(adev->pdev, amdgpu_device_vga_set_decode);
4586
4587         px = amdgpu_device_supports_px(ddev);
4588
4589         if (px || (!dev_is_removable(&adev->pdev->dev) &&
4590                                 apple_gmux_detect(NULL, NULL)))
4591                 vga_switcheroo_register_client(adev->pdev,
4592                                                &amdgpu_switcheroo_ops, px);
4593
4594         if (px)
4595                 vga_switcheroo_init_domain_pm_ops(adev->dev, &adev->vga_pm_domain);
4596
4597         if (adev->init_lvl->level == AMDGPU_INIT_LEVEL_MINIMAL_XGMI)
4598                 amdgpu_xgmi_reset_on_init(adev);
4599
4600         amdgpu_device_check_iommu_direct_map(adev);
4601
4602         return 0;
4603
4604 release_ras_con:
4605         if (amdgpu_sriov_vf(adev))
4606                 amdgpu_virt_release_full_gpu(adev, true);
4607
4608         /* failed in exclusive mode due to timeout */
4609         if (amdgpu_sriov_vf(adev) &&
4610                 !amdgpu_sriov_runtime(adev) &&
4611                 amdgpu_virt_mmio_blocked(adev) &&
4612                 !amdgpu_virt_wait_reset(adev)) {
4613                 dev_err(adev->dev, "VF exclusive mode timeout\n");
4614                 /* Don't send request since VF is inactive. */
4615                 adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
4616                 adev->virt.ops = NULL;
4617                 r = -EAGAIN;
4618         }
4619         amdgpu_release_ras_context(adev);
4620
4621 failed:
4622         amdgpu_vf_error_trans_all(adev);
4623
4624         return r;
4625 }
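
     /*
      * Illustrative sketch, not part of the driver: a stand-alone ratelimit
      * with the same parameters as adev->throttling_logging_rs above (one
      * message per 59s window, giving the 60s effective logging period
      * described in amdgpu_device_init()). The function and names here are
      * hypothetical.
      */
     static void __maybe_unused example_throttling_log(void)
     {
             static DEFINE_RATELIMIT_STATE(example_rs, (60 - 1) * HZ, 1);

             /* only one message per 59s window actually reaches the log */
             if (__ratelimit(&example_rs))
                     pr_warn("thermal throttling event\n");
     }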
4626
4627 static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
4628 {
4629
4630         /* Clear all CPU mappings pointing to this device */
4631         unmap_mapping_range(adev->ddev.anon_inode->i_mapping, 0, 0, 1);
4632
4633         /* Unmap all mapped bars - Doorbell, registers and VRAM */
4634         amdgpu_doorbell_fini(adev);
4635
4636         iounmap(adev->rmmio);
4637         adev->rmmio = NULL;
4638         if (adev->mman.aper_base_kaddr)
4639                 iounmap(adev->mman.aper_base_kaddr);
4640         adev->mman.aper_base_kaddr = NULL;
4641
4642         /* Memory manager related */
4643         if (!adev->gmc.xgmi.connected_to_cpu && !adev->gmc.is_app_apu) {
4644                 arch_phys_wc_del(adev->gmc.vram_mtrr);
4645                 arch_io_free_memtype_wc(adev->gmc.aper_base, adev->gmc.aper_size);
4646         }
4647 }
4648
4649 /**
4650  * amdgpu_device_fini_hw - tear down the driver
4651  *
4652  * @adev: amdgpu_device pointer
4653  *
4654  * Tear down the driver info (all asics).
4655  * Called at driver shutdown.
4656  */
4657 void amdgpu_device_fini_hw(struct amdgpu_device *adev)
4658 {
4659         dev_info(adev->dev, "amdgpu: finishing device.\n");
4660         flush_delayed_work(&adev->delayed_init_work);
4661
4662         if (adev->mman.initialized)
4663                 drain_workqueue(adev->mman.bdev.wq);
4664         adev->shutdown = true;
4665
4666         /* make sure IB test finished before entering exclusive mode
4667          * to avoid preemption on IB test
4668          */
4669         if (amdgpu_sriov_vf(adev)) {
4670                 amdgpu_virt_request_full_gpu(adev, false);
4671                 amdgpu_virt_fini_data_exchange(adev);
4672         }
4673
4674         /* disable all interrupts */
4675         amdgpu_irq_disable_all(adev);
4676         if (adev->mode_info.mode_config_initialized) {
4677                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(adev)))
4678                         drm_helper_force_disable_all(adev_to_drm(adev));
4679                 else
4680                         drm_atomic_helper_shutdown(adev_to_drm(adev));
4681         }
4682         amdgpu_fence_driver_hw_fini(adev);
4683
4684         if (adev->pm.sysfs_initialized)
4685                 amdgpu_pm_sysfs_fini(adev);
4686         if (adev->ucode_sysfs_en)
4687                 amdgpu_ucode_sysfs_fini(adev);
4688         sysfs_remove_files(&adev->dev->kobj, amdgpu_dev_attributes);
4689         amdgpu_fru_sysfs_fini(adev);
4690
4691         amdgpu_reg_state_sysfs_fini(adev);
4692         amdgpu_xcp_cfg_sysfs_fini(adev);
4693
4694         /* RAS features must be disabled before hw fini */
4695         amdgpu_ras_pre_fini(adev);
4696
4697         amdgpu_ttm_set_buffer_funcs_status(adev, false);
4698
4699         amdgpu_device_ip_fini_early(adev);
4700
4701         amdgpu_irq_fini_hw(adev);
4702
4703         if (adev->mman.initialized)
4704                 ttm_device_clear_dma_mappings(&adev->mman.bdev);
4705
4706         amdgpu_gart_dummy_page_fini(adev);
4707
4708         if (drm_dev_is_unplugged(adev_to_drm(adev)))
4709                 amdgpu_device_unmap_mmio(adev);
4710
4711 }
4712
4713 void amdgpu_device_fini_sw(struct amdgpu_device *adev)
4714 {
4715         int idx;
4716         bool px;
4717
4718         amdgpu_device_ip_fini(adev);
4719         amdgpu_fence_driver_sw_fini(adev);
4720         amdgpu_ucode_release(&adev->firmware.gpu_info_fw);
4721         adev->accel_working = false;
4722         dma_fence_put(rcu_dereference_protected(adev->gang_submit, true));
4723
4724         amdgpu_reset_fini(adev);
4725
4726         /* free i2c buses */
4727         if (!amdgpu_device_has_dc_support(adev))
4728                 amdgpu_i2c_fini(adev);
4729
4730         if (amdgpu_emu_mode != 1)
4731                 amdgpu_atombios_fini(adev);
4732
4733         kfree(adev->bios);
4734         adev->bios = NULL;
4735
4736         kfree(adev->fru_info);
4737         adev->fru_info = NULL;
4738
4739         px = amdgpu_device_supports_px(adev_to_drm(adev));
4740
4741         if (px || (!dev_is_removable(&adev->pdev->dev) &&
4742                                 apple_gmux_detect(NULL, NULL)))
4743                 vga_switcheroo_unregister_client(adev->pdev);
4744
4745         if (px)
4746                 vga_switcheroo_fini_domain_pm_ops(adev->dev);
4747
4748         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4749                 vga_client_unregister(adev->pdev);
4750
4751         if (drm_dev_enter(adev_to_drm(adev), &idx)) {
4752
4753                 iounmap(adev->rmmio);
4754                 adev->rmmio = NULL;
4755                 amdgpu_doorbell_fini(adev);
4756                 drm_dev_exit(idx);
4757         }
4758
4759         if (IS_ENABLED(CONFIG_PERF_EVENTS))
4760                 amdgpu_pmu_fini(adev);
4761         if (adev->mman.discovery_bin)
4762                 amdgpu_discovery_fini(adev);
4763
4764         amdgpu_reset_put_reset_domain(adev->reset_domain);
4765         adev->reset_domain = NULL;
4766
4767         kfree(adev->pci_state);
4768
4769 }
4770
4771 /**
4772  * amdgpu_device_evict_resources - evict device resources
4773  * @adev: amdgpu device object
4774  *
4775  * Evicts all ttm device resources (vram BOs, gart table) from the lru list
4776  * of the vram memory type. Mainly used for evicting device resources
4777  * at suspend time.
4778  *
4779  */
4780 static int amdgpu_device_evict_resources(struct amdgpu_device *adev)
4781 {
4782         int ret;
4783
4784         /* No need to evict vram on APUs for suspend to ram or s2idle */
4785         if ((adev->in_s3 || adev->in_s0ix) && (adev->flags & AMD_IS_APU))
4786                 return 0;
4787
4788         ret = amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM);
4789         if (ret)
4790                 DRM_WARN("evicting device resources failed\n");
4791         return ret;
4792 }
4793
4794 /*
4795  * Suspend & resume.
4796  */
4797 /**
4798  * amdgpu_device_prepare - prepare for device suspend
4799  *
4800  * @dev: drm dev pointer
4801  *
4802  * Prepare to put the hw in the suspend state (all asics).
4803  * Returns 0 for success or an error on failure.
4804  * Called at driver suspend.
4805  */
4806 int amdgpu_device_prepare(struct drm_device *dev)
4807 {
4808         struct amdgpu_device *adev = drm_to_adev(dev);
4809         int i, r;
4810
4811         amdgpu_choose_low_power_state(adev);
4812
4813         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4814                 return 0;
4815
4816         /* Evict the majority of BOs before starting suspend sequence */
4817         r = amdgpu_device_evict_resources(adev);
4818         if (r)
4819                 goto unprepare;
4820
4821         flush_delayed_work(&adev->gfx.gfx_off_delay_work);
4822
4823         for (i = 0; i < adev->num_ip_blocks; i++) {
4824                 if (!adev->ip_blocks[i].status.valid)
4825                         continue;
4826                 if (!adev->ip_blocks[i].version->funcs->prepare_suspend)
4827                         continue;
4828                 r = adev->ip_blocks[i].version->funcs->prepare_suspend(&adev->ip_blocks[i]);
4829                 if (r)
4830                         goto unprepare;
4831         }
4832
4833         return 0;
4834
4835 unprepare:
4836         adev->in_s0ix = adev->in_s3 = false;
4837
4838         return r;
4839 }
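
     /*
      * Illustrative sketch, not part of the driver: prepare_suspend is one of
      * the optional amd_ip_funcs callbacks walked in amdgpu_device_prepare()
      * above. A minimal implementation for a hypothetical 'foo' IP block
      * (assuming the ip_block->adev back-pointer) just quiesces its own state:
      */
     static int __maybe_unused foo_prepare_suspend(struct amdgpu_ip_block *ip_block)
     {
             struct amdgpu_device *adev = ip_block->adev;

             /* quiesce block-private state here; this sketch has none */
             dev_dbg(adev->dev, "foo: ready for suspend\n");
             return 0;
     }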
4840
4841 /**
4842  * amdgpu_device_suspend - initiate device suspend
4843  *
4844  * @dev: drm dev pointer
4845  * @notify_clients: notify in-kernel DRM clients
4846  *
4847  * Puts the hw in the suspend state (all asics).
4848  * Returns 0 for success or an error on failure.
4849  * Called at driver suspend.
4850  */
4851 int amdgpu_device_suspend(struct drm_device *dev, bool notify_clients)
4852 {
4853         struct amdgpu_device *adev = drm_to_adev(dev);
4854         int r = 0;
4855
4856         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4857                 return 0;
4858
4859         adev->in_suspend = true;
4860
4861         if (amdgpu_sriov_vf(adev)) {
4862                 amdgpu_virt_fini_data_exchange(adev);
4863                 r = amdgpu_virt_request_full_gpu(adev, false);
4864                 if (r)
4865                         return r;
4866         }
4867
4868         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D3))
4869                 DRM_WARN("smart shift update failed\n");
4870
4871         if (notify_clients)
4872                 drm_client_dev_suspend(adev_to_drm(adev), false);
4873
4874         cancel_delayed_work_sync(&adev->delayed_init_work);
4875
4876         amdgpu_ras_suspend(adev);
4877
4878         amdgpu_device_ip_suspend_phase1(adev);
4879
4880         if (!adev->in_s0ix)
4881                 amdgpu_amdkfd_suspend(adev, adev->in_runpm);
4882
4883         r = amdgpu_device_evict_resources(adev);
4884         if (r)
4885                 return r;
4886
4887         amdgpu_ttm_set_buffer_funcs_status(adev, false);
4888
4889         amdgpu_fence_driver_hw_fini(adev);
4890
4891         amdgpu_device_ip_suspend_phase2(adev);
4892
4893         if (amdgpu_sriov_vf(adev))
4894                 amdgpu_virt_release_full_gpu(adev, false);
4895
4896         r = amdgpu_dpm_notify_rlc_state(adev, false);
4897         if (r)
4898                 return r;
4899
4900         return 0;
4901 }
4902
4903 /**
4904  * amdgpu_device_resume - initiate device resume
4905  *
4906  * @dev: drm dev pointer
4907  * @notify_clients: notify in-kernel DRM clients
4908  *
4909  * Bring the hw back to operating state (all asics).
4910  * Returns 0 for success or an error on failure.
4911  * Called at driver resume.
4912  */
4913 int amdgpu_device_resume(struct drm_device *dev, bool notify_clients)
4914 {
4915         struct amdgpu_device *adev = drm_to_adev(dev);
4916         int r = 0;
4917
4918         if (amdgpu_sriov_vf(adev)) {
4919                 r = amdgpu_virt_request_full_gpu(adev, true);
4920                 if (r)
4921                         return r;
4922         }
4923
4924         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4925                 return 0;
4926
4927         if (adev->in_s0ix)
4928                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D0Entry);
4929
4930         /* post card */
4931         if (amdgpu_device_need_post(adev)) {
4932                 r = amdgpu_device_asic_init(adev);
4933                 if (r)
4934                         dev_err(adev->dev, "amdgpu asic init failed\n");
4935         }
4936
4937         r = amdgpu_device_ip_resume(adev);
4938
4939         if (r) {
4940                 dev_err(adev->dev, "amdgpu_device_ip_resume failed (%d).\n", r);
4941                 goto exit;
4942         }
4943
4944         if (!adev->in_s0ix) {
4945                 r = amdgpu_amdkfd_resume(adev, adev->in_runpm);
4946                 if (r)
4947                         goto exit;
4948         }
4949
4950         r = amdgpu_device_ip_late_init(adev);
4951         if (r)
4952                 goto exit;
4953
4954         queue_delayed_work(system_wq, &adev->delayed_init_work,
4955                            msecs_to_jiffies(AMDGPU_RESUME_MS));
4956 exit:
4957         if (amdgpu_sriov_vf(adev)) {
4958                 amdgpu_virt_init_data_exchange(adev);
4959                 amdgpu_virt_release_full_gpu(adev, true);
4960         }
4961
4962         if (r)
4963                 return r;
4964
4965         /* Make sure IB tests flushed */
4966         flush_delayed_work(&adev->delayed_init_work);
4967
4968         if (notify_clients)
4969                 drm_client_dev_resume(adev_to_drm(adev), false);
4970
4971         amdgpu_ras_resume(adev);
4972
4973         if (adev->mode_info.num_crtc) {
4974                 /*
4975                  * Most of the connector probing functions try to acquire runtime pm
4976                  * refs to ensure that the GPU is powered on when connector polling is
4977                  * performed. Since we're calling this from a runtime PM callback,
4978                  * trying to acquire rpm refs will cause us to deadlock.
4979                  *
4980                  * Since we're guaranteed to be holding the rpm lock, it's safe to
4981                  * temporarily disable the rpm helpers so this doesn't deadlock us.
4982                  */
4983 #ifdef CONFIG_PM
4984                 dev->dev->power.disable_depth++;
4985 #endif
4986                 if (!adev->dc_enabled)
4987                         drm_helper_hpd_irq_event(dev);
4988                 else
4989                         drm_kms_helper_hotplug_event(dev);
4990 #ifdef CONFIG_PM
4991                 dev->dev->power.disable_depth--;
4992 #endif
4993         }
4994         adev->in_suspend = false;
4995
4996         if (adev->enable_mes)
4997                 amdgpu_mes_self_test(adev);
4998
4999         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D0))
5000                 DRM_WARN("smart shift update failed\n");
5001
5002         return 0;
5003 }
5004
5005 /**
5006  * amdgpu_device_ip_check_soft_reset - did soft reset succeed
5007  *
5008  * @adev: amdgpu_device pointer
5009  *
5010  * The list of all the hardware IPs that make up the asic is walked and
5011  * the check_soft_reset callbacks are run.  check_soft_reset determines
5012  * if the asic is still hung or not.
5013  * Returns true if any of the IPs are still in a hung state, false if not.
5014  */
5015 static bool amdgpu_device_ip_check_soft_reset(struct amdgpu_device *adev)
5016 {
5017         int i;
5018         bool asic_hang = false;
5019
5020         if (amdgpu_sriov_vf(adev))
5021                 return true;
5022
5023         if (amdgpu_asic_need_full_reset(adev))
5024                 return true;
5025
5026         for (i = 0; i < adev->num_ip_blocks; i++) {
5027                 if (!adev->ip_blocks[i].status.valid)
5028                         continue;
5029                 if (adev->ip_blocks[i].version->funcs->check_soft_reset)
5030                         adev->ip_blocks[i].status.hang =
5031                                 adev->ip_blocks[i].version->funcs->check_soft_reset(
5032                                         &adev->ip_blocks[i]);
5033                 if (adev->ip_blocks[i].status.hang) {
5034                         dev_info(adev->dev, "IP block:%s is hung!\n", adev->ip_blocks[i].version->funcs->name);
5035                         asic_hang = true;
5036                 }
5037         }
5038         return asic_hang;
5039 }
5040
5041 /**
5042  * amdgpu_device_ip_pre_soft_reset - prepare for soft reset
5043  *
5044  * @adev: amdgpu_device pointer
5045  *
5046  * The list of all the hardware IPs that make up the asic is walked and the
5047  * pre_soft_reset callbacks are run if the block is hung.  pre_soft_reset
5048  * handles any IP specific hardware or software state changes that are
5049  * necessary for a soft reset to succeed.
5050  * Returns 0 on success, negative error code on failure.
5051  */
5052 static int amdgpu_device_ip_pre_soft_reset(struct amdgpu_device *adev)
5053 {
5054         int i, r = 0;
5055
5056         for (i = 0; i < adev->num_ip_blocks; i++) {
5057                 if (!adev->ip_blocks[i].status.valid)
5058                         continue;
5059                 if (adev->ip_blocks[i].status.hang &&
5060                     adev->ip_blocks[i].version->funcs->pre_soft_reset) {
5061                         r = adev->ip_blocks[i].version->funcs->pre_soft_reset(&adev->ip_blocks[i]);
5062                         if (r)
5063                                 return r;
5064                 }
5065         }
5066
5067         return 0;
5068 }
5069
5070 /**
5071  * amdgpu_device_ip_need_full_reset - check if a full asic reset is needed
5072  *
5073  * @adev: amdgpu_device pointer
5074  *
5075  * Some hardware IPs cannot be soft reset.  If they are hung, a full gpu
5076  * reset is necessary to recover.
5077  * Returns true if a full asic reset is required, false if not.
5078  */
5079 static bool amdgpu_device_ip_need_full_reset(struct amdgpu_device *adev)
5080 {
5081         int i;
5082
5083         if (amdgpu_asic_need_full_reset(adev))
5084                 return true;
5085
5086         for (i = 0; i < adev->num_ip_blocks; i++) {
5087                 if (!adev->ip_blocks[i].status.valid)
5088                         continue;
5089                 if ((adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) ||
5090                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) ||
5091                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_ACP) ||
5092                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) ||
5093                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
5094                         if (adev->ip_blocks[i].status.hang) {
5095                                 dev_info(adev->dev, "Some blocks need a full reset!\n");
5096                                 return true;
5097                         }
5098                 }
5099         }
5100         return false;
5101 }
5102
5103 /**
5104  * amdgpu_device_ip_soft_reset - do a soft reset
5105  *
5106  * @adev: amdgpu_device pointer
5107  *
5108  * The list of all the hardware IPs that make up the asic is walked and the
5109  * soft_reset callbacks are run if the block is hung.  soft_reset handles any
5110  * IP specific hardware or software state changes that are necessary to soft
5111  * reset the IP.
5112  * Returns 0 on success, negative error code on failure.
5113  */
5114 static int amdgpu_device_ip_soft_reset(struct amdgpu_device *adev)
5115 {
5116         int i, r = 0;
5117
5118         for (i = 0; i < adev->num_ip_blocks; i++) {
5119                 if (!adev->ip_blocks[i].status.valid)
5120                         continue;
5121                 if (adev->ip_blocks[i].status.hang &&
5122                     adev->ip_blocks[i].version->funcs->soft_reset) {
5123                         r = adev->ip_blocks[i].version->funcs->soft_reset(&adev->ip_blocks[i]);
5124                         if (r)
5125                                 return r;
5126                 }
5127         }
5128
5129         return 0;
5130 }
5131
5132 /**
5133  * amdgpu_device_ip_post_soft_reset - clean up from soft reset
5134  *
5135  * @adev: amdgpu_device pointer
5136  *
5137  * The list of all the hardware IPs that make up the asic is walked and the
5138  * post_soft_reset callbacks are run if the asic was hung.  post_soft_reset
5139  * handles any IP specific hardware or software state changes that are
5140  * necessary after the IP has been soft reset.
5141  * Returns 0 on success, negative error code on failure.
5142  */
5143 static int amdgpu_device_ip_post_soft_reset(struct amdgpu_device *adev)
5144 {
5145         int i, r = 0;
5146
5147         for (i = 0; i < adev->num_ip_blocks; i++) {
5148                 if (!adev->ip_blocks[i].status.valid)
5149                         continue;
5150                 if (adev->ip_blocks[i].status.hang &&
5151                     adev->ip_blocks[i].version->funcs->post_soft_reset)
5152                         r = adev->ip_blocks[i].version->funcs->post_soft_reset(&adev->ip_blocks[i]);
5153                 if (r)
5154                         return r;
5155         }
5156
5157         return 0;
5158 }
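
     /*
      * Illustrative sketch, not part of the driver: the walkers above drive
      * the per-IP soft-reset callbacks. For a hypothetical 'foo' block,
      * check_soft_reset reports the hang state that gates the other
      * callbacks, and soft_reset performs the block-local reset:
      */
     static bool __maybe_unused foo_check_soft_reset(struct amdgpu_ip_block *ip_block)
     {
             /* normally read block status registers; pretend nothing hung */
             return false;
     }

     static int __maybe_unused foo_soft_reset(struct amdgpu_ip_block *ip_block)
     {
             /* normally toggle the block's reset bit and wait for it to clear */
             return 0;
     }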
5159
5160 /**
5161  * amdgpu_device_reset_sriov - reset ASIC for SR-IOV vf
5162  *
5163  * @adev: amdgpu_device pointer
5164  * @reset_context: amdgpu reset context pointer
5165  *
5166  * Do a VF FLR and reinitialize the ASIC.
5167  * Returns 0 on success, negative error code on failure.
5168  */
5169 static int amdgpu_device_reset_sriov(struct amdgpu_device *adev,
5170                                      struct amdgpu_reset_context *reset_context)
5171 {
5172         int r;
5173         struct amdgpu_hive_info *hive = NULL;
5174
5175         if (test_bit(AMDGPU_HOST_FLR, &reset_context->flags)) {
5176                 if (!amdgpu_ras_get_fed_status(adev))
5177                         amdgpu_virt_ready_to_reset(adev);
5178                 amdgpu_virt_wait_reset(adev);
5179                 clear_bit(AMDGPU_HOST_FLR, &reset_context->flags);
5180                 r = amdgpu_virt_request_full_gpu(adev, true);
5181         } else {
5182                 r = amdgpu_virt_reset_gpu(adev);
5183         }
5184         if (r)
5185                 return r;
5186
5187         amdgpu_ras_set_fed(adev, false);
5188         amdgpu_irq_gpu_reset_resume_helper(adev);
5189
5190         /* some SW cleanup the VF needs to do before recovery */
5191         amdgpu_virt_post_reset(adev);
5192
5193         /* Resume IP prior to SMC */
5194         r = amdgpu_device_ip_reinit_early_sriov(adev);
5195         if (r)
5196                 return r;
5197
5198         amdgpu_virt_init_data_exchange(adev);
5199
5200         r = amdgpu_device_fw_loading(adev);
5201         if (r)
5202                 return r;
5203
5204         /* now we are okay to resume SMC/CP/SDMA */
5205         r = amdgpu_device_ip_reinit_late_sriov(adev);
5206         if (r)
5207                 return r;
5208
5209         hive = amdgpu_get_xgmi_hive(adev);
5210         /* Update PSP FW topology after reset */
5211         if (hive && adev->gmc.xgmi.num_physical_nodes > 1)
5212                 r = amdgpu_xgmi_update_topology(hive, adev);
5213         if (hive)
5214                 amdgpu_put_xgmi_hive(hive);
5215         if (r)
5216                 return r;
5217
5218         r = amdgpu_ib_ring_tests(adev);
5219         if (r)
5220                 return r;
5221
5222         if (adev->virt.gim_feature & AMDGIM_FEATURE_GIM_FLR_VRAMLOST)
5223                 amdgpu_inc_vram_lost(adev);
5224
5225         /* this needs to be called during full access, so we can't do it
5226          * later like bare-metal does.
5227          */
5228         amdgpu_amdkfd_post_reset(adev);
5229         amdgpu_virt_release_full_gpu(adev, true);
5230
5231         /* Aldebaran and gfx_11_0_3 support RAS in SR-IOV, so RAS needs to be resumed during reset */
5232         if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 2) ||
5233             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
5234             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4) ||
5235             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(11, 0, 3))
5236                 amdgpu_ras_resume(adev);
5237
5238         amdgpu_virt_ras_telemetry_post_reset(adev);
5239
5240         return 0;
5241 }
5242
5243 /**
5244  * amdgpu_device_has_job_running - check if there is any job in the pending list
5245  *
5246  * @adev: amdgpu_device pointer
5247  *
5248  * check if there is any job in the pending list
5249  */
5250 bool amdgpu_device_has_job_running(struct amdgpu_device *adev)
5251 {
5252         int i;
5253         struct drm_sched_job *job;
5254
5255         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5256                 struct amdgpu_ring *ring = adev->rings[i];
5257
5258                 if (!amdgpu_ring_sched_ready(ring))
5259                         continue;
5260
5261                 spin_lock(&ring->sched.job_list_lock);
5262                 job = list_first_entry_or_null(&ring->sched.pending_list,
5263                                                struct drm_sched_job, list);
5264                 spin_unlock(&ring->sched.job_list_lock);
5265                 if (job)
5266                         return true;
5267         }
5268         return false;
5269 }
5270
5271 /**
5272  * amdgpu_device_should_recover_gpu - check if we should try GPU recovery
5273  *
5274  * @adev: amdgpu_device pointer
5275  *
5276  * Check amdgpu_gpu_recovery and SRIOV status to see if we should try to recover
5277  * a hung GPU.
5278  */
5279 bool amdgpu_device_should_recover_gpu(struct amdgpu_device *adev)
5280 {
5281
5282         if (amdgpu_gpu_recovery == 0)
5283                 goto disabled;
5284
5285         /* Skip soft reset check in fatal error mode */
5286         if (!amdgpu_ras_is_poison_mode_supported(adev))
5287                 return true;
5288
5289         if (amdgpu_sriov_vf(adev))
5290                 return true;
5291
5292         if (amdgpu_gpu_recovery == -1) {
5293                 switch (adev->asic_type) {
5294 #ifdef CONFIG_DRM_AMDGPU_SI
5295                 case CHIP_VERDE:
5296                 case CHIP_TAHITI:
5297                 case CHIP_PITCAIRN:
5298                 case CHIP_OLAND:
5299                 case CHIP_HAINAN:
5300 #endif
5301 #ifdef CONFIG_DRM_AMDGPU_CIK
5302                 case CHIP_KAVERI:
5303                 case CHIP_KABINI:
5304                 case CHIP_MULLINS:
5305 #endif
5306                 case CHIP_CARRIZO:
5307                 case CHIP_STONEY:
5308                 case CHIP_CYAN_SKILLFISH:
5309                         goto disabled;
5310                 default:
5311                         break;
5312                 }
5313         }
5314
5315         return true;
5316
5317 disabled:
5318         dev_info(adev->dev, "GPU recovery disabled.\n");
5319         return false;
5320 }
5321
5322 int amdgpu_device_mode1_reset(struct amdgpu_device *adev)
5323 {
5324         u32 i;
5325         int ret = 0;
5326
5327         amdgpu_atombios_scratch_regs_engine_hung(adev, true);
5328
5329         dev_info(adev->dev, "GPU mode1 reset\n");
5330
5331         /* Cache the state before bus master disable. The saved config space
5332          * values are used in other cases like restore after mode-2 reset.
5333          */
5334         amdgpu_device_cache_pci_state(adev->pdev);
5335
5336         /* disable BM */
5337         pci_clear_master(adev->pdev);
5338
5339         if (amdgpu_dpm_is_mode1_reset_supported(adev)) {
5340                 dev_info(adev->dev, "GPU smu mode1 reset\n");
5341                 ret = amdgpu_dpm_mode1_reset(adev);
5342         } else {
5343                 dev_info(adev->dev, "GPU psp mode1 reset\n");
5344                 ret = psp_gpu_reset(adev);
5345         }
5346
5347         if (ret)
5348                 goto mode1_reset_failed;
5349
5350         amdgpu_device_load_pci_state(adev->pdev);
5351         ret = amdgpu_psp_wait_for_bootloader(adev);
5352         if (ret)
5353                 goto mode1_reset_failed;
5354
5355         /* wait for asic to come out of reset */
5356         for (i = 0; i < adev->usec_timeout; i++) {
5357                 u32 memsize = adev->nbio.funcs->get_memsize(adev);
5358
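                     /* an all-ones readback means the register aperture is
                      * not accessible yet, i.e. the ASIC is still in reset
                      */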
5359                 if (memsize != 0xffffffff)
5360                         break;
5361                 udelay(1);
5362         }
5363
5364         if (i >= adev->usec_timeout) {
5365                 ret = -ETIMEDOUT;
5366                 goto mode1_reset_failed;
5367         }
5368
5369         amdgpu_atombios_scratch_regs_engine_hung(adev, false);
5370
5371         return 0;
5372
5373 mode1_reset_failed:
5374         dev_err(adev->dev, "GPU mode1 reset failed\n");
5375         return ret;
5376 }
5377
5378 int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev,
5379                                  struct amdgpu_reset_context *reset_context)
5380 {
5381         int i, r = 0;
5382         struct amdgpu_job *job = NULL;
5383         struct amdgpu_device *tmp_adev = reset_context->reset_req_dev;
5384         bool need_full_reset =
5385                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5386
5387         if (reset_context->reset_req_dev == adev)
5388                 job = reset_context->job;
5389
5390         if (amdgpu_sriov_vf(adev))
5391                 amdgpu_virt_pre_reset(adev);
5392
5393         amdgpu_fence_driver_isr_toggle(adev, true);
5394
5395         /* block all schedulers and reset given job's ring */
5396         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5397                 struct amdgpu_ring *ring = adev->rings[i];
5398
5399                 if (!amdgpu_ring_sched_ready(ring))
5400                         continue;
5401
5402                 /* Clear job fences from the fence drv to avoid force_completion
5403                  * leaving NULL and vm flush fences in the fence drv
5404                  */
5405                 amdgpu_fence_driver_clear_job_fences(ring);
5406
5407                 /* after all hw jobs are reset, hw fence is meaningless, so force_completion */
5408                 amdgpu_fence_driver_force_completion(ring);
5409         }
5410
5411         amdgpu_fence_driver_isr_toggle(adev, false);
5412
5413         if (job && job->vm)
5414                 drm_sched_increase_karma(&job->base);
5415
5416         r = amdgpu_reset_prepare_hwcontext(adev, reset_context);
5417         /* If reset handler not implemented, continue; otherwise return */
5418         if (r == -EOPNOTSUPP)
5419                 r = 0;
5420         else
5421                 return r;
5422
5423         /* Don't suspend on bare metal if we are not going to HW reset the ASIC */
5424         if (!amdgpu_sriov_vf(adev)) {
5425
5426                 if (!need_full_reset)
5427                         need_full_reset = amdgpu_device_ip_need_full_reset(adev);
5428
5429                 if (!need_full_reset && amdgpu_gpu_recovery &&
5430                     amdgpu_device_ip_check_soft_reset(adev)) {
5431                         amdgpu_device_ip_pre_soft_reset(adev);
5432                         r = amdgpu_device_ip_soft_reset(adev);
5433                         amdgpu_device_ip_post_soft_reset(adev);
5434                         if (r || amdgpu_device_ip_check_soft_reset(adev)) {
5435                                 dev_info(adev->dev, "soft reset failed, will fallback to full reset!\n");
5436                                 need_full_reset = true;
5437                         }
5438                 }
5439
5440                 if (!test_bit(AMDGPU_SKIP_COREDUMP, &reset_context->flags)) {
5441                         dev_info(tmp_adev->dev, "Dumping IP State\n");
5442                         /* Trigger ip dump before we reset the asic */
5443                         for (i = 0; i < tmp_adev->num_ip_blocks; i++)
5444                                 if (tmp_adev->ip_blocks[i].version->funcs->dump_ip_state)
5445                                         tmp_adev->ip_blocks[i].version->funcs
5446                                                 ->dump_ip_state((void *)&tmp_adev->ip_blocks[i]);
5447                         dev_info(tmp_adev->dev, "Dumping IP State Completed\n");
5448                 }
5449
5450                 if (need_full_reset) {
5451                         r = amdgpu_device_ip_suspend(adev);
5452                         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5453                 } else {
5454                         clear_bit(AMDGPU_NEED_FULL_RESET,
5455                                   &reset_context->flags);
5456                 }
5457         }
5458
5459         return r;
5460 }
5461
5462 int amdgpu_device_reinit_after_reset(struct amdgpu_reset_context *reset_context)
5463 {
5464         struct list_head *device_list_handle;
5465         bool full_reset, vram_lost = false;
5466         struct amdgpu_device *tmp_adev;
5467         int r, init_level;
5468
5469         device_list_handle = reset_context->reset_device_list;
5470
5471         if (!device_list_handle)
5472                 return -EINVAL;
5473
5474         full_reset = test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5475
5476         /*
5477          * If it's a reset on init, use the default init level; otherwise
5478          * keep the level as the recovery level.
5479          */
5480         if (reset_context->method == AMD_RESET_METHOD_ON_INIT)
5481                 init_level = AMDGPU_INIT_LEVEL_DEFAULT;
5482         else
5483                 init_level = AMDGPU_INIT_LEVEL_RESET_RECOVERY;
5484
5485         r = 0;
5486         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5487                 amdgpu_set_init_level(tmp_adev, init_level);
5488                 if (full_reset) {
5489                         /* post card */
5490                         amdgpu_ras_set_fed(tmp_adev, false);
5491                         r = amdgpu_device_asic_init(tmp_adev);
5492                         if (r) {
5493                                 dev_warn(tmp_adev->dev, "asic atom init failed!");
5494                         } else {
5495                                 dev_info(tmp_adev->dev, "GPU reset succeeded, trying to resume\n");
5496
5497                                 r = amdgpu_device_ip_resume_phase1(tmp_adev);
5498                                 if (r)
5499                                         goto out;
5500
5501                                 vram_lost = amdgpu_device_check_vram_lost(tmp_adev);
5502
5503                                 if (!test_bit(AMDGPU_SKIP_COREDUMP, &reset_context->flags))
5504                                         amdgpu_coredump(tmp_adev, false, vram_lost, reset_context->job);
5505
5506                                 if (vram_lost) {
5507                                         DRM_INFO("VRAM is lost due to GPU reset!\n");
5508                                         amdgpu_inc_vram_lost(tmp_adev);
5509                                 }
5510
5511                                 r = amdgpu_device_fw_loading(tmp_adev);
5512                                 if (r)
5513                                         return r;
5514
5515                                 r = amdgpu_xcp_restore_partition_mode(
5516                                         tmp_adev->xcp_mgr);
5517                                 if (r)
5518                                         goto out;
5519
5520                                 r = amdgpu_device_ip_resume_phase2(tmp_adev);
5521                                 if (r)
5522                                         goto out;
5523
5524                                 if (tmp_adev->mman.buffer_funcs_ring->sched.ready)
5525                                         amdgpu_ttm_set_buffer_funcs_status(tmp_adev, true);
5526
5527                                 r = amdgpu_device_ip_resume_phase3(tmp_adev);
5528                                 if (r)
5529                                         goto out;
5530
5531                                 if (vram_lost)
5532                                         amdgpu_device_fill_reset_magic(tmp_adev);
5533
5534                                 /*
5535                                  * Add this ASIC back as tracked since the
5536                                  * reset already completed successfully.
5537                                  */
5538                                 amdgpu_register_gpu_instance(tmp_adev);
5539
5540                                 if (!reset_context->hive &&
5541                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
5542                                         amdgpu_xgmi_add_device(tmp_adev);
5543
5544                                 r = amdgpu_device_ip_late_init(tmp_adev);
5545                                 if (r)
5546                                         goto out;
5547
5548                                 drm_client_dev_resume(adev_to_drm(tmp_adev), false);
5549
5550                                 /*
5551                                  * The GPU enters a bad state once the number
5552                                  * of faulty pages detected by ECC reaches the
5553                                  * threshold, and RAS recovery is scheduled next.
5554                                  * So add a check here to break recovery if the
5555                                  * bad page threshold is indeed exceeded, and
5556                                  * remind the user to retire this GPU or set a
5557                                  * bigger bad_page_threshold value to fix this
5558                                  * the next time the driver is probed.
5559                                  */
5560                                 if (!amdgpu_ras_is_rma(tmp_adev)) {
5561                                         /* must succeed. */
5562                                         amdgpu_ras_resume(tmp_adev);
5563                                 } else {
5564                                         r = -EINVAL;
5565                                         goto out;
5566                                 }
5567
5568                                 /* Update PSP FW topology after reset */
5569                                 if (reset_context->hive &&
5570                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
5571                                         r = amdgpu_xgmi_update_topology(
5572                                                 reset_context->hive, tmp_adev);
5573                         }
5574                 }
5575
5576 out:
5577                 if (!r) {
5578                         /* IP init is complete now, set level as default */
5579                         amdgpu_set_init_level(tmp_adev,
5580                                               AMDGPU_INIT_LEVEL_DEFAULT);
5581                         amdgpu_irq_gpu_reset_resume_helper(tmp_adev);
5582                         r = amdgpu_ib_ring_tests(tmp_adev);
5583                         if (r) {
5584                                 dev_err(tmp_adev->dev, "ib ring test failed (%d).\n", r);
5585                                 r = -EAGAIN;
5586                                 goto end;
5587                         }
5588                 }
5589
5590                 if (r)
5591                         tmp_adev->asic_reset_res = r;
5592         }
5593
5594 end:
5595         return r;
5596 }
5597
5598 int amdgpu_do_asic_reset(struct list_head *device_list_handle,
5599                          struct amdgpu_reset_context *reset_context)
5600 {
5601         struct amdgpu_device *tmp_adev = NULL;
5602         bool need_full_reset, skip_hw_reset;
5603         int r = 0;
5604
5605         /* Try reset handler method first */
5606         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5607                                     reset_list);
5608
5609         reset_context->reset_device_list = device_list_handle;
5610         r = amdgpu_reset_perform_reset(tmp_adev, reset_context);
5611         /* If reset handler not implemented, continue; otherwise return */
5612         if (r == -EOPNOTSUPP)
5613                 r = 0;
5614         else
5615                 return r;
5616
5617         /* Reset handler not implemented, use the default method */
5618         need_full_reset =
5619                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5620         skip_hw_reset = test_bit(AMDGPU_SKIP_HW_RESET, &reset_context->flags);
5621
5622         /*
5623          * ASIC reset has to be done on all XGMI hive nodes ASAP
5624          * to allow proper link negotiation in FW (within 1 sec)
5625          */
5626         if (!skip_hw_reset && need_full_reset) {
5627                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5628                         /* For XGMI run all resets in parallel to speed up the process */
5629                         if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
5630                                 if (!queue_work(system_unbound_wq,
5631                                                 &tmp_adev->xgmi_reset_work))
5632                                         r = -EALREADY;
5633                         } else
5634                                 r = amdgpu_asic_reset(tmp_adev);
5635
5636                         if (r) {
5637                                 dev_err(tmp_adev->dev,
5638                                         "ASIC reset failed with error %d for drm dev %s",
5639                                         r, adev_to_drm(tmp_adev)->unique);
5640                                 goto out;
5641                         }
5642                 }
5643
5644                 /* For XGMI wait for all resets to complete before proceed */
5645                 if (!r) {
5646                         list_for_each_entry(tmp_adev, device_list_handle,
5647                                             reset_list) {
5648                                 if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
5649                                         flush_work(&tmp_adev->xgmi_reset_work);
5650                                         r = tmp_adev->asic_reset_res;
5651                                         if (r)
5652                                                 break;
5653                                 }
5654                         }
5655                 }
5656         }
5657
5658         if (!r && amdgpu_ras_intr_triggered()) {
5659                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5660                         amdgpu_ras_reset_error_count(tmp_adev,
5661                                                      AMDGPU_RAS_BLOCK__MMHUB);
5662                 }
5663
5664                 amdgpu_ras_intr_cleared();
5665         }
5666
5667         r = amdgpu_device_reinit_after_reset(reset_context);
5668         if (r == -EAGAIN)
5669                 set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5670         else
5671                 clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5672
5673 out:
5674         return r;
5675 }
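
/*
 * Editor's note: a minimal, hypothetical sketch (not a driver entry point)
 * of how a caller can drive amdgpu_do_asic_reset() for a single device,
 * mirroring the reset-context setup used by the PCI slot-reset path later
 * in this file.
 */
static int amdgpu_example_single_dev_reset(struct amdgpu_device *adev)
{
        struct amdgpu_reset_context reset_context;
        struct list_head device_list;

        memset(&reset_context, 0, sizeof(reset_context));
        INIT_LIST_HEAD(&device_list);
        list_add_tail(&adev->reset_list, &device_list);

        reset_context.method = AMD_RESET_METHOD_NONE; /* let the handler pick */
        reset_context.reset_req_dev = adev;
        set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);

        return amdgpu_do_asic_reset(&device_list, &reset_context);
}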
5676
5677 static void amdgpu_device_set_mp1_state(struct amdgpu_device *adev)
5678 {
5679
5680         switch (amdgpu_asic_reset_method(adev)) {
5681         case AMD_RESET_METHOD_MODE1:
5682                 adev->mp1_state = PP_MP1_STATE_SHUTDOWN;
5683                 break;
5684         case AMD_RESET_METHOD_MODE2:
5685                 adev->mp1_state = PP_MP1_STATE_RESET;
5686                 break;
5687         default:
5688                 adev->mp1_state = PP_MP1_STATE_NONE;
5689                 break;
5690         }
5691 }
5692
5693 static void amdgpu_device_unset_mp1_state(struct amdgpu_device *adev)
5694 {
5695         amdgpu_vf_error_trans_all(adev);
5696         adev->mp1_state = PP_MP1_STATE_NONE;
5697 }
5698
5699 static void amdgpu_device_resume_display_audio(struct amdgpu_device *adev)
5700 {
5701         struct pci_dev *p = NULL;
5702
5703         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5704                         adev->pdev->bus->number, 1);
5705         if (p) {
5706                 pm_runtime_enable(&(p->dev));
5707                 pm_runtime_resume(&(p->dev));
5708         }
5709
5710         pci_dev_put(p);
5711 }
5712
5713 static int amdgpu_device_suspend_display_audio(struct amdgpu_device *adev)
5714 {
5715         enum amd_reset_method reset_method;
5716         struct pci_dev *p = NULL;
5717         u64 expires;
5718
5719         /*
5720          * For now, only BACO and mode1 reset are confirmed
5721          * to suffer from the audio issue when not properly suspended.
5722          */
5723         reset_method = amdgpu_asic_reset_method(adev);
5724         if ((reset_method != AMD_RESET_METHOD_BACO) &&
5725              (reset_method != AMD_RESET_METHOD_MODE1))
5726                 return -EINVAL;
5727
5728         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5729                         adev->pdev->bus->number, 1);
5730         if (!p)
5731                 return -ENODEV;
5732
5733         expires = pm_runtime_autosuspend_expiration(&(p->dev));
5734         if (!expires)
5735                 /*
5736                  * If we cannot get the audio device autosuspend delay,
5737                  * fall back to a fixed 4s interval. Since 3s is the
5738                  * audio controller's default autosuspend delay, 4s is
5739                  * guaranteed to cover it.
5740                  */
5741                 expires = ktime_get_mono_fast_ns() + NSEC_PER_SEC * 4ULL;
5742
5743         while (!pm_runtime_status_suspended(&(p->dev))) {
5744                 if (!pm_runtime_suspend(&(p->dev)))
5745                         break;
5746
5747                 if (expires < ktime_get_mono_fast_ns()) {
5748                         dev_warn(adev->dev, "failed to suspend display audio\n");
5749                         pci_dev_put(p);
5750                         /* TODO: abort the succeeding gpu reset? */
5751                         return -ETIMEDOUT;
5752                 }
5753         }
5754
5755         pm_runtime_disable(&(p->dev));
5756
5757         pci_dev_put(p);
5758         return 0;
5759 }
5760
5761 static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev)
5762 {
5763         struct amdgpu_ras *con = amdgpu_ras_get_context(adev);
5764
5765 #if defined(CONFIG_DEBUG_FS)
5766         if (!amdgpu_sriov_vf(adev))
5767                 cancel_work(&adev->reset_work);
5768 #endif
5769
5770         if (adev->kfd.dev)
5771                 cancel_work(&adev->kfd.reset_work);
5772
5773         if (amdgpu_sriov_vf(adev))
5774                 cancel_work(&adev->virt.flr_work);
5775
5776         if (con && adev->ras_enabled)
5777                 cancel_work(&con->recovery_work);
5778
5779 }
5780
5781 static int amdgpu_device_health_check(struct list_head *device_list_handle)
5782 {
5783         struct amdgpu_device *tmp_adev;
5784         int ret = 0;
5785         u32 status;
5786
5787         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5788                 pci_read_config_dword(tmp_adev->pdev, PCI_COMMAND, &status);
5789                 if (PCI_POSSIBLE_ERROR(status)) {
5790                         dev_err(tmp_adev->dev, "device lost from bus!");
5791                         ret = -ENODEV;
5792                 }
5793         }
5794
5795         return ret;
5796 }
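
/*
 * Editor's note: PCI_POSSIBLE_ERROR() is true when a config-space read
 * returns all ones, which is what the fabric returns once a device has
 * dropped off the bus. A hypothetical single-device variant of the check
 * above:
 */
static bool amdgpu_example_device_present(struct amdgpu_device *adev)
{
        u32 status;

        pci_read_config_dword(adev->pdev, PCI_COMMAND, &status);
        return !PCI_POSSIBLE_ERROR(status);
}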
5797
5798 /**
5799  * amdgpu_device_gpu_recover - reset the asic and recover scheduler
5800  *
5801  * @adev: amdgpu_device pointer
5802  * @job: the job that triggered the hang
5803  * @reset_context: amdgpu reset context pointer
5804  *
5805  * Attempt to reset the GPU if it has hung (all ASICs),
5806  * doing a soft or full reset and reinitializing the ASIC.
5807  * Returns 0 for success or an error on failure.
5808  */
5809
5810 int amdgpu_device_gpu_recover(struct amdgpu_device *adev,
5811                               struct amdgpu_job *job,
5812                               struct amdgpu_reset_context *reset_context)
5813 {
5814         struct list_head device_list, *device_list_handle = NULL;
5815         bool job_signaled = false;
5816         struct amdgpu_hive_info *hive = NULL;
5817         struct amdgpu_device *tmp_adev = NULL;
5818         int i, r = 0;
5819         bool need_emergency_restart = false;
5820         bool audio_suspended = false;
5821         int retry_limit = AMDGPU_MAX_RETRY_LIMIT;
5822
5823         /*
5824          * Special case: RAS triggered and full reset isn't supported
5825          */
5826         need_emergency_restart = amdgpu_ras_need_emergency_restart(adev);
5827
5828         /*
5829          * Flush RAM to disk so that after reboot
5830          * the user can read log and see why the system rebooted.
5831          */
5832         if (need_emergency_restart && amdgpu_ras_get_context(adev) &&
5833                 amdgpu_ras_get_context(adev)->reboot) {
5834                 DRM_WARN("Emergency reboot.");
5835
5836                 ksys_sync_helper();
5837                 emergency_restart();
5838         }
5839
5840         dev_info(adev->dev, "GPU %s begin!\n",
5841                 need_emergency_restart ? "jobs stop" : "reset");
5842
5843         if (!amdgpu_sriov_vf(adev))
5844                 hive = amdgpu_get_xgmi_hive(adev);
5845         if (hive)
5846                 mutex_lock(&hive->hive_lock);
5847
5848         reset_context->job = job;
5849         reset_context->hive = hive;
5850         /*
5851          * Build list of devices to reset.
5852          * In case we are in XGMI hive mode, re-sort the device list
5853          * so that adev is in the 1st position.
5854          */
5855         INIT_LIST_HEAD(&device_list);
5856         if (!amdgpu_sriov_vf(adev) && (adev->gmc.xgmi.num_physical_nodes > 1) && hive) {
5857                 list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head) {
5858                         list_add_tail(&tmp_adev->reset_list, &device_list);
5859                         if (adev->shutdown)
5860                                 tmp_adev->shutdown = true;
5861                 }
5862                 if (!list_is_first(&adev->reset_list, &device_list))
5863                         list_rotate_to_front(&adev->reset_list, &device_list);
5864                 device_list_handle = &device_list;
5865         } else {
5866                 list_add_tail(&adev->reset_list, &device_list);
5867                 device_list_handle = &device_list;
5868         }
5869
5870         if (!amdgpu_sriov_vf(adev)) {
5871                 r = amdgpu_device_health_check(device_list_handle);
5872                 if (r)
5873                         goto end_reset;
5874         }
5875
5876         /* We need to lock reset domain only once both for XGMI and single device */
5877         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5878                                     reset_list);
5879         amdgpu_device_lock_reset_domain(tmp_adev->reset_domain);
5880
5881         /* block all schedulers and reset given job's ring */
5882         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5883
5884                 amdgpu_device_set_mp1_state(tmp_adev);
5885
5886                 /*
5887                  * Try to put the audio codec into a suspended
5888                  * state before the GPU reset starts.
5889                  *
5890                  * The graphics device shares a power domain with
5891                  * the AZ (audio) power domain. Without this, we
5892                  * may change the audio hardware behind the audio
5893                  * driver's back, which would trigger audio codec
5894                  * errors.
5895                  */
5896                 if (!amdgpu_device_suspend_display_audio(tmp_adev))
5897                         audio_suspended = true;
5898
5899                 amdgpu_ras_set_error_query_ready(tmp_adev, false);
5900
5901                 cancel_delayed_work_sync(&tmp_adev->delayed_init_work);
5902
5903                 amdgpu_amdkfd_pre_reset(tmp_adev, reset_context);
5904
5905                 /*
5906                  * Mark the ASICs to be reset as untracked first,
5907                  * and add them back after the reset completes.
5908                  */
5909                 amdgpu_unregister_gpu_instance(tmp_adev);
5910
5911                 drm_client_dev_suspend(adev_to_drm(tmp_adev), false);
5912
5913                 /* disable ras on ALL IPs */
5914                 if (!need_emergency_restart &&
5915                       amdgpu_device_ip_need_full_reset(tmp_adev))
5916                         amdgpu_ras_suspend(tmp_adev);
5917
5918                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5919                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5920
5921                         if (!amdgpu_ring_sched_ready(ring))
5922                                 continue;
5923
5924                         drm_sched_stop(&ring->sched, job ? &job->base : NULL);
5925
5926                         if (need_emergency_restart)
5927                                 amdgpu_job_stop_all_jobs_on_sched(&ring->sched);
5928                 }
5929                 atomic_inc(&tmp_adev->gpu_reset_counter);
5930         }
5931
5932         if (need_emergency_restart)
5933                 goto skip_sched_resume;
5934
5935         /*
5936          * Must check guilty signal here since after this point all old
5937          * HW fences are force signaled.
5938          *
5939          * job->base holds a reference to parent fence
5940          */
5941         if (job && dma_fence_is_signaled(&job->hw_fence)) {
5942                 job_signaled = true;
5943                 dev_info(adev->dev, "Guilty job already signaled, skipping HW reset");
5944                 goto skip_hw_reset;
5945         }
5946
5947 retry:  /* pre-ASIC reset for the remaining adevs in the XGMI hive */
5948         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5949                 r = amdgpu_device_pre_asic_reset(tmp_adev, reset_context);
5950                 /* TODO: should we stop? */
5951                 if (r) {
5952                         dev_err(tmp_adev->dev, "GPU pre-asic reset failed with error %d for drm dev %s",
5953                                   r, adev_to_drm(tmp_adev)->unique);
5954                         tmp_adev->asic_reset_res = r;
5955                 }
5956         }
5957
5958         /* Actual ASIC resets if needed. */
5959         /* Host driver will handle XGMI hive reset for SRIOV */
5960         if (amdgpu_sriov_vf(adev)) {
5961                 if (amdgpu_ras_get_fed_status(adev) || amdgpu_virt_rcvd_ras_interrupt(adev)) {
5962                         dev_dbg(adev->dev, "Detected RAS error, wait for FLR completion\n");
5963                         amdgpu_ras_set_fed(adev, true);
5964                         set_bit(AMDGPU_HOST_FLR, &reset_context->flags);
5965                 }
5966
5967                 r = amdgpu_device_reset_sriov(adev, reset_context);
5968                 if (AMDGPU_RETRY_SRIOV_RESET(r) && (retry_limit--) > 0) {
5969                         amdgpu_virt_release_full_gpu(adev, true);
5970                         goto retry;
5971                 }
5972                 if (r)
5973                         adev->asic_reset_res = r;
5974         } else {
5975                 r = amdgpu_do_asic_reset(device_list_handle, reset_context);
5976                 if (r == -EAGAIN)
5977                         goto retry;
5978         }
5979
5980         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5981                 /*
5982                  * Drop any pending non-scheduler resets queued before the reset is done.
5983                  * Any reset scheduled after this point would be valid. Scheduler resets
5984                  * were already dropped during drm_sched_stop and no new ones can come
5985                  * in before drm_sched_start.
5986                  */
5987                 amdgpu_device_stop_pending_resets(tmp_adev);
5988         }
5989
5990 skip_hw_reset:
5991
5992         /* Post ASIC reset for all devs. */
5993         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5994
5995                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5996                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5997
5998                         if (!amdgpu_ring_sched_ready(ring))
5999                                 continue;
6000
6001                         drm_sched_start(&ring->sched, 0);
6002                 }
6003
6004                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(tmp_adev)) && !job_signaled)
6005                         drm_helper_resume_force_mode(adev_to_drm(tmp_adev));
6006
6007                 if (tmp_adev->asic_reset_res)
6008                         r = tmp_adev->asic_reset_res;
6009
6010                 tmp_adev->asic_reset_res = 0;
6011
6012                 if (r) {
6013                         /* Bad news: how do we tell this to userspace?
6014                          * For a RAS error, report GPU-bad status instead
6015                          * of a reset failure.
6016                          */
6017                         if (reset_context->src != AMDGPU_RESET_SRC_RAS ||
6018                             !amdgpu_ras_eeprom_check_err_threshold(tmp_adev))
6019                                 dev_info(tmp_adev->dev, "GPU reset(%d) failed\n",
6020                                         atomic_read(&tmp_adev->gpu_reset_counter));
6021                         amdgpu_vf_error_put(tmp_adev, AMDGIM_ERROR_VF_GPU_RESET_FAIL, 0, r);
6022                 } else {
6023                         dev_info(tmp_adev->dev, "GPU reset(%d) succeeded!\n", atomic_read(&tmp_adev->gpu_reset_counter));
6024                         if (amdgpu_acpi_smart_shift_update(adev_to_drm(tmp_adev), AMDGPU_SS_DEV_D0))
6025                                 DRM_WARN("smart shift update failed\n");
6026                 }
6027         }
6028
6029 skip_sched_resume:
6030         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
6031                 /* unlock kfd: SRIOV would do it separately */
6032                 if (!need_emergency_restart && !amdgpu_sriov_vf(tmp_adev))
6033                         amdgpu_amdkfd_post_reset(tmp_adev);
6034
6035                 /* kfd_post_reset will do nothing if the kfd device is not initialized;
6036                  * bring up kfd here if it was not initialized before the reset.
6037                  */
6038                 if (!adev->kfd.init_complete)
6039                         amdgpu_amdkfd_device_init(adev);
6040
6041                 if (audio_suspended)
6042                         amdgpu_device_resume_display_audio(tmp_adev);
6043
6044                 amdgpu_device_unset_mp1_state(tmp_adev);
6045
6046                 amdgpu_ras_set_error_query_ready(tmp_adev, true);
6047         }
6048
6049         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
6050                                             reset_list);
6051         amdgpu_device_unlock_reset_domain(tmp_adev->reset_domain);
6052
6053 end_reset:
6054         if (hive) {
6055                 mutex_unlock(&hive->hive_lock);
6056                 amdgpu_put_xgmi_hive(hive);
6057         }
6058
6059         if (r)
6060                 dev_info(adev->dev, "GPU reset end with ret = %d\n", r);
6061
6062         atomic_set(&adev->reset_domain->reset_res, r);
6063         return r;
6064 }
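
/*
 * Editor's note: a hedged sketch of a typical caller. A ring timeout
 * handler fills in a reset context and hands the hung job to
 * amdgpu_device_gpu_recover(); the exact fields the real amdgpu_job.c
 * handler sets may differ from this illustration.
 */
static void amdgpu_example_handle_timeout(struct amdgpu_ring *ring,
                                          struct amdgpu_job *job)
{
        struct amdgpu_device *adev = ring->adev;
        struct amdgpu_reset_context reset_context;

        memset(&reset_context, 0, sizeof(reset_context));
        reset_context.method = AMD_RESET_METHOD_NONE;
        reset_context.reset_req_dev = adev;
        clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);

        if (amdgpu_device_should_recover_gpu(adev))
                amdgpu_device_gpu_recover(adev, job, &reset_context);
}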
6065
6066 /**
6067  * amdgpu_device_partner_bandwidth - find the bandwidth of the appropriate partner
6068  *
6069  * @adev: amdgpu_device pointer
6070  * @speed: pointer to the speed of the link
6071  * @width: pointer to the width of the link
6072  *
6073  * Evaluate the hierarchy to find the speed and bandwidth capabilities of the
6074  * first physical partner to an AMD dGPU.
6075  * This will exclude any virtual switches and links.
6076  */
6077 static void amdgpu_device_partner_bandwidth(struct amdgpu_device *adev,
6078                                             enum pci_bus_speed *speed,
6079                                             enum pcie_link_width *width)
6080 {
6081         struct pci_dev *parent = adev->pdev;
6082
6083         if (!speed || !width)
6084                 return;
6085
6086         *speed = PCI_SPEED_UNKNOWN;
6087         *width = PCIE_LNK_WIDTH_UNKNOWN;
6088
6089         if (amdgpu_device_pcie_dynamic_switching_supported(adev)) {
6090                 while ((parent = pci_upstream_bridge(parent))) {
6091                         /* skip upstream/downstream switches internal to the dGPU */
6092                         if (parent->vendor == PCI_VENDOR_ID_ATI)
6093                                 continue;
6094                         *speed = pcie_get_speed_cap(parent);
6095                         *width = pcie_get_width_cap(parent);
6096                         break;
6097                 }
6098         } else {
6099                 /* use the current speeds rather than max if switching is not supported */
6100                 pcie_bandwidth_available(adev->pdev, NULL, speed, width);
6101         }
6102 }
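
/*
 * Editor's note: hypothetical usage of the helper above -- query the
 * partner link and log it. pcie_get_speed_cap()/pcie_get_width_cap()
 * return PCI_SPEED_UNKNOWN/PCIE_LNK_WIDTH_UNKNOWN when nothing usable
 * is found, so callers must handle those sentinels.
 */
static void amdgpu_example_log_partner_link(struct amdgpu_device *adev)
{
        enum pci_bus_speed speed;
        enum pcie_link_width width;

        amdgpu_device_partner_bandwidth(adev, &speed, &width);
        if (speed != PCI_SPEED_UNKNOWN && width != PCIE_LNK_WIDTH_UNKNOWN)
                dev_info(adev->dev, "partner link: speed id %d, x%d\n",
                         speed, width);
}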
6103
6104 /**
6105  * amdgpu_device_get_pcie_info - fetch pcie info about the PCIE slot
6106  *
6107  * @adev: amdgpu_device pointer
6108  *
6109  * Fetches and stores in the driver the PCIE capabilities (gen speed
6110  * and lanes) of the slot the device is in. Handles APUs and
6111  * virtualized environments where PCIE config space may not be available.
6112  */
6113 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev)
6114 {
6115         struct pci_dev *pdev;
6116         enum pci_bus_speed speed_cap, platform_speed_cap;
6117         enum pcie_link_width platform_link_width;
6118
6119         if (amdgpu_pcie_gen_cap)
6120                 adev->pm.pcie_gen_mask = amdgpu_pcie_gen_cap;
6121
6122         if (amdgpu_pcie_lane_cap)
6123                 adev->pm.pcie_mlw_mask = amdgpu_pcie_lane_cap;
6124
6125         /* covers APUs as well */
6126         if (pci_is_root_bus(adev->pdev->bus) && !amdgpu_passthrough(adev)) {
6127                 if (adev->pm.pcie_gen_mask == 0)
6128                         adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
6129                 if (adev->pm.pcie_mlw_mask == 0)
6130                         adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
6131                 return;
6132         }
6133
6134         if (adev->pm.pcie_gen_mask && adev->pm.pcie_mlw_mask)
6135                 return;
6136
6137         amdgpu_device_partner_bandwidth(adev, &platform_speed_cap,
6138                                         &platform_link_width);
6139
6140         if (adev->pm.pcie_gen_mask == 0) {
6141                 /* asic caps */
6142                 pdev = adev->pdev;
6143                 speed_cap = pcie_get_speed_cap(pdev);
6144                 if (speed_cap == PCI_SPEED_UNKNOWN) {
6145                         adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6146                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6147                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
6148                 } else {
6149                         if (speed_cap == PCIE_SPEED_32_0GT)
6150                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6151                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6152                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6153                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4 |
6154                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN5);
6155                         else if (speed_cap == PCIE_SPEED_16_0GT)
6156                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6157                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6158                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6159                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4);
6160                         else if (speed_cap == PCIE_SPEED_8_0GT)
6161                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6162                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6163                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
6164                         else if (speed_cap == PCIE_SPEED_5_0GT)
6165                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6166                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2);
6167                         else
6168                                 adev->pm.pcie_gen_mask |= CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1;
6169                 }
6170                 /* platform caps */
6171                 if (platform_speed_cap == PCI_SPEED_UNKNOWN) {
6172                         adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6173                                                    CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
6174                 } else {
6175                         if (platform_speed_cap == PCIE_SPEED_32_0GT)
6176                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6177                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6178                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6179                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4 |
6180                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN5);
6181                         else if (platform_speed_cap == PCIE_SPEED_16_0GT)
6182                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6183                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6184                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6185                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4);
6186                         else if (platform_speed_cap == PCIE_SPEED_8_0GT)
6187                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6188                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6189                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3);
6190                         else if (platform_speed_cap == PCIE_SPEED_5_0GT)
6191                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6192                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
6193                         else
6194                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1;
6195
6196                 }
6197         }
6198         if (adev->pm.pcie_mlw_mask == 0) {
6199                 if (platform_link_width == PCIE_LNK_WIDTH_UNKNOWN) {
6200                         adev->pm.pcie_mlw_mask |= AMDGPU_DEFAULT_PCIE_MLW_MASK;
6201                 } else {
6202                         switch (platform_link_width) {
6203                         case PCIE_LNK_X32:
6204                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X32 |
6205                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
6206                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6207                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6208                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6209                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6210                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6211                                 break;
6212                         case PCIE_LNK_X16:
6213                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
6214                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6215                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6216                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6217                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6218                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6219                                 break;
6220                         case PCIE_LNK_X12:
6221                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6222                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6223                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6224                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6225                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6226                                 break;
6227                         case PCIE_LNK_X8:
6228                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6229                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6230                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6231                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6232                                 break;
6233                         case PCIE_LNK_X4:
6234                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6235                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6236                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6237                                 break;
6238                         case PCIE_LNK_X2:
6239                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6240                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6241                                 break;
6242                         case PCIE_LNK_X1:
6243                                 adev->pm.pcie_mlw_mask = CAIL_PCIE_LINK_WIDTH_SUPPORT_X1;
6244                                 break;
6245                         default:
6246                                 break;
6247                         }
6248                 }
6249         }
6250 }
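
/*
 * Editor's note: the masks built above are consumed by the power-management
 * code when selecting link speeds. A hypothetical helper (not part of the
 * driver) showing how a platform capability bit could be tested:
 */
static bool amdgpu_example_platform_has_gen4(struct amdgpu_device *adev)
{
        return !!(adev->pm.pcie_gen_mask & CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4);
}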
6251
6252 /**
6253  * amdgpu_device_is_peer_accessible - Check peer access through PCIe BAR
6254  *
6255  * @adev: amdgpu_device pointer
6256  * @peer_adev: amdgpu_device pointer for peer device trying to access @adev
6257  *
6258  * Return true if @peer_adev can access (DMA) @adev through the PCIe
6259  * BAR, i.e. @adev is "large BAR" and the BAR matches the DMA mask of
6260  * @peer_adev.
6261  */
6262 bool amdgpu_device_is_peer_accessible(struct amdgpu_device *adev,
6263                                       struct amdgpu_device *peer_adev)
6264 {
6265 #ifdef CONFIG_HSA_AMD_P2P
6266         bool p2p_access =
6267                 !adev->gmc.xgmi.connected_to_cpu &&
6268                 !(pci_p2pdma_distance(adev->pdev, peer_adev->dev, false) < 0);
6269         if (!p2p_access)
6270                 dev_info(adev->dev, "PCIe P2P access from peer device %s is not supported by the chipset\n",
6271                         pci_name(peer_adev->pdev));
6272
6273         bool is_large_bar = adev->gmc.visible_vram_size &&
6274                 adev->gmc.real_vram_size == adev->gmc.visible_vram_size;
6275         bool p2p_addressable = amdgpu_device_check_iommu_remap(peer_adev);
6276
6277         if (!p2p_addressable) {
6278                 uint64_t address_mask = peer_adev->dev->dma_mask ?
6279                         ~*peer_adev->dev->dma_mask : ~((1ULL << 32) - 1);
6280                 resource_size_t aper_limit =
6281                         adev->gmc.aper_base + adev->gmc.aper_size - 1;
6282
6283                 p2p_addressable = !(adev->gmc.aper_base & address_mask ||
6284                                      aper_limit & address_mask);
6285         }
6286         return pcie_p2p && is_large_bar && p2p_access && p2p_addressable;
6287 #else
6288         return false;
6289 #endif
6290 }
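
/*
 * Editor's note: peer access is directional, so a hypothetical caller
 * setting up bidirectional DMA between two GPUs would check both
 * directions:
 */
static bool amdgpu_example_can_p2p_both_ways(struct amdgpu_device *a,
                                             struct amdgpu_device *b)
{
        return amdgpu_device_is_peer_accessible(a, b) &&
               amdgpu_device_is_peer_accessible(b, a);
}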
6291
6292 int amdgpu_device_baco_enter(struct drm_device *dev)
6293 {
6294         struct amdgpu_device *adev = drm_to_adev(dev);
6295         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
6296
6297         if (!amdgpu_device_supports_baco(dev))
6298                 return -ENOTSUPP;
6299
6300         if (ras && adev->ras_enabled &&
6301             adev->nbio.funcs->enable_doorbell_interrupt)
6302                 adev->nbio.funcs->enable_doorbell_interrupt(adev, false);
6303
6304         return amdgpu_dpm_baco_enter(adev);
6305 }
6306
6307 int amdgpu_device_baco_exit(struct drm_device *dev)
6308 {
6309         struct amdgpu_device *adev = drm_to_adev(dev);
6310         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
6311         int ret = 0;
6312
6313         if (!amdgpu_device_supports_baco(dev))
6314                 return -ENOTSUPP;
6315
6316         ret = amdgpu_dpm_baco_exit(adev);
6317         if (ret)
6318                 return ret;
6319
6320         if (ras && adev->ras_enabled &&
6321             adev->nbio.funcs->enable_doorbell_interrupt)
6322                 adev->nbio.funcs->enable_doorbell_interrupt(adev, true);
6323
6324         if (amdgpu_passthrough(adev) && adev->nbio.funcs &&
6325             adev->nbio.funcs->clear_doorbell_interrupt)
6326                 adev->nbio.funcs->clear_doorbell_interrupt(adev);
6327
6328         return 0;
6329 }
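
/*
 * Editor's note: BACO enter/exit are meant to be used as a pair around a
 * low-power window, e.g. from the runtime-PM callbacks. A hedged sketch:
 */
static int amdgpu_example_baco_cycle(struct drm_device *dev)
{
        int r;

        r = amdgpu_device_baco_enter(dev);
        if (r)
                return r;

        /* ... device sits in BACO until a wake event ... */

        return amdgpu_device_baco_exit(dev);
}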
6330
6331 /**
6332  * amdgpu_pci_error_detected - Called when a PCI error is detected.
6333  * @pdev: PCI device struct
6334  * @state: PCI channel state
6335  *
6336  * Description: Called when a PCI error is detected.
6337  *
6338  * Return: PCI_ERS_RESULT_NEED_RESET or PCI_ERS_RESULT_DISCONNECT.
6339  */
6340 pci_ers_result_t amdgpu_pci_error_detected(struct pci_dev *pdev, pci_channel_state_t state)
6341 {
6342         struct drm_device *dev = pci_get_drvdata(pdev);
6343         struct amdgpu_device *adev = drm_to_adev(dev);
6344         int i;
6345
6346         DRM_INFO("PCI error: detected callback, state(%d)!!\n", state);
6347
6348         if (adev->gmc.xgmi.num_physical_nodes > 1) {
6349                 DRM_WARN("No support for XGMI hive yet...");
6350                 return PCI_ERS_RESULT_DISCONNECT;
6351         }
6352
6353         adev->pci_channel_state = state;
6354
6355         switch (state) {
6356         case pci_channel_io_normal:
6357                 return PCI_ERS_RESULT_CAN_RECOVER;
6358         /* Fatal error, prepare for slot reset */
6359         case pci_channel_io_frozen:
6360                 /*
6361                  * Locking adev->reset_domain->sem will prevent any external access
6362                  * to GPU during PCI error recovery
6363                  */
6364                 amdgpu_device_lock_reset_domain(adev->reset_domain);
6365                 amdgpu_device_set_mp1_state(adev);
6366
6367                 /*
6368                  * Block any work scheduling as we do for regular GPU reset
6369                  * for the duration of the recovery
6370                  */
6371                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
6372                         struct amdgpu_ring *ring = adev->rings[i];
6373
6374                         if (!amdgpu_ring_sched_ready(ring))
6375                                 continue;
6376
6377                         drm_sched_stop(&ring->sched, NULL);
6378                 }
6379                 atomic_inc(&adev->gpu_reset_counter);
6380                 return PCI_ERS_RESULT_NEED_RESET;
6381         case pci_channel_io_perm_failure:
6382                 /* Permanent error, prepare for device removal */
6383                 return PCI_ERS_RESULT_DISCONNECT;
6384         }
6385
6386         return PCI_ERS_RESULT_NEED_RESET;
6387 }
6388
6389 /**
6390  * amdgpu_pci_mmio_enabled - Enable MMIO and dump debug registers
6391  * @pdev: pointer to PCI device
6392  */
6393 pci_ers_result_t amdgpu_pci_mmio_enabled(struct pci_dev *pdev)
6394 {
6395
6396         DRM_INFO("PCI error: mmio enabled callback!!\n");
6397
6398         /* TODO - dump whatever for debugging purposes */
6399
6400         /* This is called only if amdgpu_pci_error_detected returns
6401          * PCI_ERS_RESULT_CAN_RECOVER. Read/write to the device still
6402          * works, no need to reset slot.
6403          */
6404
6405         return PCI_ERS_RESULT_RECOVERED;
6406 }
6407
6408 /**
6409  * amdgpu_pci_slot_reset - Called when PCI slot has been reset.
6410  * @pdev: PCI device struct
6411  *
6412  * Description: This routine is called by the pci error recovery
6413  * code after the PCI slot has been reset, just before we
6414  * should resume normal operations.
6415  */
6416 pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
6417 {
6418         struct drm_device *dev = pci_get_drvdata(pdev);
6419         struct amdgpu_device *adev = drm_to_adev(dev);
6420         int r, i;
6421         struct amdgpu_reset_context reset_context;
6422         u32 memsize;
6423         struct list_head device_list;
6424
6425         /* PCI error slot reset should be skipped during RAS recovery */
6426         if ((amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
6427             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4)) &&
6428             amdgpu_ras_in_recovery(adev))
6429                 return PCI_ERS_RESULT_RECOVERED;
6430
6431         DRM_INFO("PCI error: slot reset callback!!\n");
6432
6433         memset(&reset_context, 0, sizeof(reset_context));
6434
6435         INIT_LIST_HEAD(&device_list);
6436         list_add_tail(&adev->reset_list, &device_list);
6437
6438         /* wait for asic to come out of reset */
6439         msleep(500);
6440
6441         /* Restore PCI config space */
6442         amdgpu_device_load_pci_state(pdev);
6443
6444         /* confirm the ASIC came out of reset */
6445         for (i = 0; i < adev->usec_timeout; i++) {
6446                 memsize = amdgpu_asic_get_config_memsize(adev);
6447
6448                 if (memsize != 0xffffffff)
6449                         break;
6450                 udelay(1);
6451         }
6452         if (memsize == 0xffffffff) {
6453                 r = -ETIME;
6454                 goto out;
6455         }
6456
6457         reset_context.method = AMD_RESET_METHOD_NONE;
6458         reset_context.reset_req_dev = adev;
6459         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
6460         set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
6461
6462         adev->no_hw_access = true;
6463         r = amdgpu_device_pre_asic_reset(adev, &reset_context);
6464         adev->no_hw_access = false;
6465         if (r)
6466                 goto out;
6467
6468         r = amdgpu_do_asic_reset(&device_list, &reset_context);
6469
6470 out:
6471         if (!r) {
6472                 if (amdgpu_device_cache_pci_state(adev->pdev))
6473                         pci_restore_state(adev->pdev);
6474
6475                 DRM_INFO("PCIe error recovery succeeded\n");
6476         } else {
6477                 DRM_ERROR("PCIe error recovery failed, err:%d", r);
6478                 amdgpu_device_unset_mp1_state(adev);
6479                 amdgpu_device_unlock_reset_domain(adev->reset_domain);
6480         }
6481
6482         return r ? PCI_ERS_RESULT_DISCONNECT : PCI_ERS_RESULT_RECOVERED;
6483 }
6484
6485 /**
6486  * amdgpu_pci_resume() - resume normal ops after PCI reset
6487  * @pdev: pointer to PCI device
6488  *
6489  * Called when the error recovery driver tells us that it's
6490  * OK to resume normal operation.
6491  */
6492 void amdgpu_pci_resume(struct pci_dev *pdev)
6493 {
6494         struct drm_device *dev = pci_get_drvdata(pdev);
6495         struct amdgpu_device *adev = drm_to_adev(dev);
6496         int i;
6497
6498
6499         DRM_INFO("PCI error: resume callback!!\n");
6500
6501         /* Only continue execution for the case of pci_channel_io_frozen */
6502         if (adev->pci_channel_state != pci_channel_io_frozen)
6503                 return;
6504
6505         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
6506                 struct amdgpu_ring *ring = adev->rings[i];
6507
6508                 if (!amdgpu_ring_sched_ready(ring))
6509                         continue;
6510
6511                 drm_sched_start(&ring->sched, 0);
6512         }
6513
6514         amdgpu_device_unset_mp1_state(adev);
6515         amdgpu_device_unlock_reset_domain(adev->reset_domain);
6516 }
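
/*
 * Editor's note: the four callbacks above are handed to the PCI core via
 * a struct pci_error_handlers attached to the pci_driver (amdgpu does this
 * in amdgpu_drv.c); sketched here to show the expected hookup.
 */
static const struct pci_error_handlers amdgpu_example_pci_err_handlers = {
        .error_detected = amdgpu_pci_error_detected,
        .mmio_enabled   = amdgpu_pci_mmio_enabled,
        .slot_reset     = amdgpu_pci_slot_reset,
        .resume         = amdgpu_pci_resume,
};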
6517
6518 bool amdgpu_device_cache_pci_state(struct pci_dev *pdev)
6519 {
6520         struct drm_device *dev = pci_get_drvdata(pdev);
6521         struct amdgpu_device *adev = drm_to_adev(dev);
6522         int r;
6523
6524         if (amdgpu_sriov_vf(adev))
6525                 return false;
6526
6527         r = pci_save_state(pdev);
6528         if (!r) {
6529                 kfree(adev->pci_state);
6530
6531                 adev->pci_state = pci_store_saved_state(pdev);
6532
6533                 if (!adev->pci_state) {
6534                         DRM_ERROR("Failed to store PCI saved state");
6535                         return false;
6536                 }
6537         } else {
6538                 DRM_WARN("Failed to save PCI state, err:%d\n", r);
6539                 return false;
6540         }
6541
6542         return true;
6543 }
6544
6545 bool amdgpu_device_load_pci_state(struct pci_dev *pdev)
6546 {
6547         struct drm_device *dev = pci_get_drvdata(pdev);
6548         struct amdgpu_device *adev = drm_to_adev(dev);
6549         int r;
6550
6551         if (!adev->pci_state)
6552                 return false;
6553
6554         r = pci_load_saved_state(pdev, adev->pci_state);
6555
6556         if (!r) {
6557                 pci_restore_state(pdev);
6558         } else {
6559                 DRM_WARN("Failed to load PCI state, err:%d\n", r);
6560                 return false;
6561         }
6562
6563         return true;
6564 }
6565
6566 void amdgpu_device_flush_hdp(struct amdgpu_device *adev,
6567                 struct amdgpu_ring *ring)
6568 {
6569 #ifdef CONFIG_X86_64
6570         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
6571                 return;
6572 #endif
6573         if (adev->gmc.xgmi.connected_to_cpu)
6574                 return;
6575
6576         if (ring && ring->funcs->emit_hdp_flush)
6577                 amdgpu_ring_emit_hdp_flush(ring);
6578         else
6579                 amdgpu_asic_flush_hdp(adev, ring);
6580 }
6581
6582 void amdgpu_device_invalidate_hdp(struct amdgpu_device *adev,
6583                 struct amdgpu_ring *ring)
6584 {
6585 #ifdef CONFIG_X86_64
6586         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
6587                 return;
6588 #endif
6589         if (adev->gmc.xgmi.connected_to_cpu)
6590                 return;
6591
6592         amdgpu_asic_invalidate_hdp(adev, ring);
6593 }
6594
6595 int amdgpu_in_reset(struct amdgpu_device *adev)
6596 {
6597         return atomic_read(&adev->reset_domain->in_gpu_reset);
6598 }
6599
6600 /**
6601  * amdgpu_device_halt() - bring hardware to some kind of halt state
6602  *
6603  * @adev: amdgpu_device pointer
6604  *
6605  * Bring hardware to some kind of halt state so that no one can touch it
6606  * any more. This helps preserve the error context when an error occurs.
6607  * Compared to a simple hang, the system stays stable enough for at least
6608  * SSH access, so it is trivial to inspect the hardware state and
6609  * see what's going on. Implemented as follows:
6610  *
6611  * 1. drm_dev_unplug() makes the device inaccessible to user space (IOCTLs, etc.),
6612  *    clears all CPU mappings to the device, disallows remappings through page faults
6613  * 2. amdgpu_irq_disable_all() disables all interrupts
6614  * 3. amdgpu_fence_driver_hw_fini() signals all HW fences
6615  * 4. set adev->no_hw_access to avoid potential crashes after step 5
6616  * 5. amdgpu_device_unmap_mmio() clears all MMIO mappings
6617  * 6. pci_disable_device() and pci_wait_for_pending_transaction()
6618  *    flush any in-flight DMA operations
6619  */
6620 void amdgpu_device_halt(struct amdgpu_device *adev)
6621 {
6622         struct pci_dev *pdev = adev->pdev;
6623         struct drm_device *ddev = adev_to_drm(adev);
6624
6625         amdgpu_xcp_dev_unplug(adev);
6626         drm_dev_unplug(ddev);
6627
6628         amdgpu_irq_disable_all(adev);
6629
6630         amdgpu_fence_driver_hw_fini(adev);
6631
6632         adev->no_hw_access = true;
6633
6634         amdgpu_device_unmap_mmio(adev);
6635
6636         pci_disable_device(pdev);
6637         pci_wait_for_pending_transaction(pdev);
6638 }
6639
6640 u32 amdgpu_device_pcie_port_rreg(struct amdgpu_device *adev,
6641                                 u32 reg)
6642 {
6643         unsigned long flags, address, data;
6644         u32 r;
6645
6646         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
6647         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
6648
6649         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
6650         WREG32(address, reg * 4);
6651         (void)RREG32(address);
6652         r = RREG32(data);
6653         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
6654         return r;
6655 }
6656
6657 void amdgpu_device_pcie_port_wreg(struct amdgpu_device *adev,
6658                                 u32 reg, u32 v)
6659 {
6660         unsigned long flags, address, data;
6661
6662         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
6663         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
6664
6665         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
6666         WREG32(address, reg * 4);
6667         (void)RREG32(address);
6668         WREG32(data, v);
6669         (void)RREG32(data);
6670         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
6671 }
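
/*
 * Editor's note: a hypothetical read-modify-write helper built on the two
 * accessors above. Note that the pcie_idx_lock is dropped between the read
 * and the write, so concurrent updates would need external serialization.
 */
static void amdgpu_example_pcie_port_update(struct amdgpu_device *adev,
                                            u32 reg, u32 clr, u32 set)
{
        u32 v = amdgpu_device_pcie_port_rreg(adev, reg);

        v = (v & ~clr) | set;
        amdgpu_device_pcie_port_wreg(adev, reg, v);
}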
6672
6673 /**
6674  * amdgpu_device_get_gang - return a reference to the current gang
6675  * @adev: amdgpu_device pointer
6676  *
6677  * Returns: A new reference to the current gang leader.
6678  */
6679 struct dma_fence *amdgpu_device_get_gang(struct amdgpu_device *adev)
6680 {
6681         struct dma_fence *fence;
6682
6683         rcu_read_lock();
6684         fence = dma_fence_get_rcu_safe(&adev->gang_submit);
6685         rcu_read_unlock();
6686         return fence;
6687 }
6688
6689 /**
6690  * amdgpu_device_switch_gang - switch to a new gang
6691  * @adev: amdgpu_device pointer
6692  * @gang: the gang to switch to
6693  *
6694  * Try to switch to a new gang.
6695  * Returns: NULL if we switched to the new gang or a reference to the current
6696  * gang leader.
6697  */
6698 struct dma_fence *amdgpu_device_switch_gang(struct amdgpu_device *adev,
6699                                             struct dma_fence *gang)
6700 {
6701         struct dma_fence *old = NULL;
6702
6703         do {
6704                 dma_fence_put(old);
6705                 old = amdgpu_device_get_gang(adev);
6706                 if (old == gang)
6707                         break;
6708
6709                 if (!dma_fence_is_signaled(old))
6710                         return old;
6711
6712         } while (cmpxchg((struct dma_fence __force **)&adev->gang_submit,
6713                          old, gang) != old);
6714
6715         dma_fence_put(old);
6716         return NULL;
6717 }
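
/*
 * Editor's note: a hedged sketch of how a submitter could use
 * amdgpu_device_switch_gang() -- wait out the previous gang leader until
 * the cmpxchg in the helper above succeeds. Whether the real submission
 * path waits synchronously like this is an assumption.
 */
static long amdgpu_example_become_gang(struct amdgpu_device *adev,
                                       struct dma_fence *gang)
{
        struct dma_fence *old;
        long r;

        while ((old = amdgpu_device_switch_gang(adev, gang))) {
                r = dma_fence_wait(old, false);
                dma_fence_put(old);
                if (r)
                        return r;
        }
        return 0;
}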
6718
6719 bool amdgpu_device_has_display_hardware(struct amdgpu_device *adev)
6720 {
6721         switch (adev->asic_type) {
6722 #ifdef CONFIG_DRM_AMDGPU_SI
6723         case CHIP_HAINAN:
6724 #endif
6725         case CHIP_TOPAZ:
6726                 /* chips with no display hardware */
6727                 return false;
6728 #ifdef CONFIG_DRM_AMDGPU_SI
6729         case CHIP_TAHITI:
6730         case CHIP_PITCAIRN:
6731         case CHIP_VERDE:
6732         case CHIP_OLAND:
6733 #endif
6734 #ifdef CONFIG_DRM_AMDGPU_CIK
6735         case CHIP_BONAIRE:
6736         case CHIP_HAWAII:
6737         case CHIP_KAVERI:
6738         case CHIP_KABINI:
6739         case CHIP_MULLINS:
6740 #endif
6741         case CHIP_TONGA:
6742         case CHIP_FIJI:
6743         case CHIP_POLARIS10:
6744         case CHIP_POLARIS11:
6745         case CHIP_POLARIS12:
6746         case CHIP_VEGAM:
6747         case CHIP_CARRIZO:
6748         case CHIP_STONEY:
6749                 /* chips with display hardware */
6750                 return true;
6751         default:
6752                 /* IP discovery */
6753                 if (!amdgpu_ip_version(adev, DCE_HWIP, 0) ||
6754                     (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
6755                         return false;
6756                 return true;
6757         }
6758 }
6759
6760 uint32_t amdgpu_device_wait_on_rreg(struct amdgpu_device *adev,
6761                 uint32_t inst, uint32_t reg_addr, char reg_name[],
6762                 uint32_t expected_value, uint32_t mask)
6763 {
6764         uint32_t ret = 0;
6765         uint32_t old_ = 0;
6766         uint32_t tmp_ = RREG32(reg_addr);
6767         uint32_t loop = adev->usec_timeout;
6768
6769         while ((tmp_ & (mask)) != (expected_value)) {
6770                 if (old_ != tmp_) {
6771                         loop = adev->usec_timeout;
6772                         old_ = tmp_;
6773                 } else
6774                         udelay(1);
6775                 tmp_ = RREG32(reg_addr);
6776                 loop--;
6777                 if (!loop) {
6778                         DRM_WARN("Register(%d) [%s] failed to reach value 0x%08x != 0x%08x\n",
6779                                   inst, reg_name, (uint32_t)expected_value,
6780                                   (uint32_t)(tmp_ & (mask)));
6781                         ret = -ETIMEDOUT;
6782                         break;
6783                 }
6784         }
6785         return ret;
6786 }
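
/*
 * Editor's note: hypothetical usage -- poll a status register until an
 * assumed "idle" bit is set, with timeout handling done by the helper
 * above. The register offset and bit position are made up for
 * illustration.
 */
static int amdgpu_example_wait_block_idle(struct amdgpu_device *adev,
                                          uint32_t status_reg)
{
        const uint32_t idle_bit = BIT(0); /* assumed bit position */

        return amdgpu_device_wait_on_rreg(adev, 0, status_reg, "BLOCK_STATUS",
                                          idle_bit, idle_bit);
}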
6787
6788 ssize_t amdgpu_get_soft_full_reset_mask(struct amdgpu_ring *ring)
6789 {
6790         ssize_t size = 0;
6791
6792         if (!ring || !ring->adev)
6793                 return size;
6794
6795         if (amdgpu_device_should_recover_gpu(ring->adev))
6796                 size |= AMDGPU_RESET_TYPE_FULL;
6797
6798         if (unlikely(!ring->adev->debug_disable_soft_recovery) &&
6799             !amdgpu_sriov_vf(ring->adev) && ring->funcs->soft_recovery)
6800                 size |= AMDGPU_RESET_TYPE_SOFT_RESET;
6801
6802         return size;
6803 }
6804
6805 ssize_t amdgpu_show_reset_mask(char *buf, uint32_t supported_reset)
6806 {
6807         ssize_t size = 0;
6808
6809         if (supported_reset == 0) {
6810                 size += sysfs_emit_at(buf, size, "unsupported\n");
6811                 return size;
6814         }
6815
6816         if (supported_reset & AMDGPU_RESET_TYPE_SOFT_RESET)
6817                 size += sysfs_emit_at(buf, size, "soft ");
6818
6819         if (supported_reset & AMDGPU_RESET_TYPE_PER_QUEUE)
6820                 size += sysfs_emit_at(buf, size, "queue ");
6821
6822         if (supported_reset & AMDGPU_RESET_TYPE_PER_PIPE)
6823                 size += sysfs_emit_at(buf, size, "pipe ");
6824
6825         if (supported_reset & AMDGPU_RESET_TYPE_FULL)
6826                 size += sysfs_emit_at(buf, size, "full ");
6827
6828         size += sysfs_emit_at(buf, size, "\n");
6829         return size;
6830 }
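
/*
 * Editor's note: amdgpu_show_reset_mask() is a formatting helper for sysfs
 * show callbacks. A hedged sketch of one such callback; the
 * gfx_supported_reset field used here is assumed for illustration.
 */
static ssize_t amdgpu_example_reset_mask_show(struct device *dev,
                                              struct device_attribute *attr,
                                              char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);

        return amdgpu_show_reset_mask(buf, adev->gfx.gfx_supported_reset);
}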