/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 *          Alex Deucher
 *          Jerome Glisse
 */

#include <linux/aperture.h>
#include <linux/power_supply.h>
#include <linux/kthread.h>
#include <linux/module.h>
#include <linux/console.h>
#include <linux/slab.h>
#include <linux/iommu.h>
#include <linux/pci.h>
#include <linux/pci-p2pdma.h>
#include <linux/apple-gmux.h>

#include <drm/drm_atomic_helper.h>
#include <drm/drm_client_event.h>
#include <drm/drm_crtc_helper.h>
#include <drm/drm_probe_helper.h>
#include <drm/amdgpu_drm.h>
#include <linux/device.h>
#include <linux/vgaarb.h>
#include <linux/vga_switcheroo.h>
#include <linux/efi.h>
#include "amdgpu.h"
#include "amdgpu_trace.h"
#include "amdgpu_i2c.h"
#include "atom.h"
#include "amdgpu_atombios.h"
#include "amdgpu_atomfirmware.h"
#include "amd_pcie.h"
#ifdef CONFIG_DRM_AMDGPU_SI
#include "si.h"
#endif
#ifdef CONFIG_DRM_AMDGPU_CIK
#include "cik.h"
#endif
#include "vi.h"
#include "soc15.h"
#include "nv.h"
#include "bif/bif_4_1_d.h"
#include <linux/firmware.h>
#include "amdgpu_vf_error.h"

#include "amdgpu_amdkfd.h"
#include "amdgpu_pm.h"

#include "amdgpu_xgmi.h"
#include "amdgpu_ras.h"
#include "amdgpu_pmu.h"
#include "amdgpu_fru_eeprom.h"
#include "amdgpu_reset.h"
#include "amdgpu_virt.h"
#include "amdgpu_dev_coredump.h"

#include <linux/suspend.h>
#include <drm/task_barrier.h>
#include <linux/pm_runtime.h>

#include <drm/drm_drv.h>

#if IS_ENABLED(CONFIG_X86)
#include <asm/intel-family.h>
#endif

MODULE_FIRMWARE("amdgpu/vega10_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/vega12_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/raven_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/picasso_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/raven2_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/arcturus_gpu_info.bin");
MODULE_FIRMWARE("amdgpu/navi12_gpu_info.bin");

#define AMDGPU_RESUME_MS                2000
#define AMDGPU_MAX_RETRY_LIMIT          2
#define AMDGPU_RETRY_SRIOV_RESET(r) ((r) == -EBUSY || (r) == -ETIMEDOUT || (r) == -EINVAL)
#define AMDGPU_PCIE_INDEX_FALLBACK (0x38 >> 2)
#define AMDGPU_PCIE_INDEX_HI_FALLBACK (0x44 >> 2)
#define AMDGPU_PCIE_DATA_FALLBACK (0x3C >> 2)

static const struct drm_driver amdgpu_kms_driver;

const char *amdgpu_asic_name[] = {
        "TAHITI",
        "PITCAIRN",
        "VERDE",
        "OLAND",
        "HAINAN",
        "BONAIRE",
        "KAVERI",
        "KABINI",
        "HAWAII",
        "MULLINS",
        "TOPAZ",
        "TONGA",
        "FIJI",
        "CARRIZO",
        "STONEY",
        "POLARIS10",
        "POLARIS11",
        "POLARIS12",
        "VEGAM",
        "VEGA10",
        "VEGA12",
        "VEGA20",
        "RAVEN",
        "ARCTURUS",
        "RENOIR",
        "ALDEBARAN",
        "NAVI10",
        "CYAN_SKILLFISH",
        "NAVI14",
        "NAVI12",
        "SIENNA_CICHLID",
        "NAVY_FLOUNDER",
        "VANGOGH",
        "DIMGREY_CAVEFISH",
        "BEIGE_GOBY",
        "YELLOW_CARP",
        "IP DISCOVERY",
        "LAST",
};

#define AMDGPU_IP_BLK_MASK_ALL GENMASK(AMD_IP_BLOCK_TYPE_NUM - 1, 0)
/*
 * Default init level where all blocks are expected to be initialized. This is
 * the level of initialization expected by default and also after a full reset
 * of the device.
 */
struct amdgpu_init_level amdgpu_init_default = {
        .level = AMDGPU_INIT_LEVEL_DEFAULT,
        .hwini_ip_block_mask = AMDGPU_IP_BLK_MASK_ALL,
};

struct amdgpu_init_level amdgpu_init_recovery = {
        .level = AMDGPU_INIT_LEVEL_RESET_RECOVERY,
        .hwini_ip_block_mask = AMDGPU_IP_BLK_MASK_ALL,
};

/*
 * Minimal blocks needed to be initialized before an XGMI hive can be reset.
 * This is used for cases like reset on initialization where the entire hive
 * needs to be reset before first use.
 */
struct amdgpu_init_level amdgpu_init_minimal_xgmi = {
        .level = AMDGPU_INIT_LEVEL_MINIMAL_XGMI,
        .hwini_ip_block_mask =
                BIT(AMD_IP_BLOCK_TYPE_GMC) | BIT(AMD_IP_BLOCK_TYPE_SMC) |
                BIT(AMD_IP_BLOCK_TYPE_COMMON) | BIT(AMD_IP_BLOCK_TYPE_IH) |
                BIT(AMD_IP_BLOCK_TYPE_PSP)
};

static inline bool amdgpu_ip_member_of_hwini(struct amdgpu_device *adev,
                                             enum amd_ip_block_type block)
{
        return (adev->init_lvl->hwini_ip_block_mask & (1U << block)) != 0;
}

void amdgpu_set_init_level(struct amdgpu_device *adev,
                           enum amdgpu_init_lvl_id lvl)
{
        switch (lvl) {
        case AMDGPU_INIT_LEVEL_MINIMAL_XGMI:
                adev->init_lvl = &amdgpu_init_minimal_xgmi;
                break;
        case AMDGPU_INIT_LEVEL_RESET_RECOVERY:
                adev->init_lvl = &amdgpu_init_recovery;
                break;
        case AMDGPU_INIT_LEVEL_DEFAULT:
                fallthrough;
        default:
                adev->init_lvl = &amdgpu_init_default;
                break;
        }
}
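
/*
 * Usage sketch (illustrative, not part of the driver): a reset-on-init of a
 * whole XGMI hive would typically drop to the minimal level first and restore
 * the default level once the hive reset completes:
 *
 *   amdgpu_set_init_level(adev, AMDGPU_INIT_LEVEL_MINIMAL_XGMI);
 *   ...reset the hive...
 *   amdgpu_set_init_level(adev, AMDGPU_INIT_LEVEL_DEFAULT);
 */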

static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev);
static int amdgpu_device_pm_notifier(struct notifier_block *nb, unsigned long mode,
                                     void *data);

/**
 * DOC: pcie_replay_count
 *
 * The amdgpu driver provides a sysfs API for reporting the total number
 * of PCIe replays (NAKs).
 * The file pcie_replay_count is used for this and returns the total
 * number of replays as a sum of the NAKs generated and NAKs received.
 */

static ssize_t amdgpu_device_get_pcie_replay_count(struct device *dev,
                struct device_attribute *attr, char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);
        uint64_t cnt = amdgpu_asic_get_pcie_replay_count(adev);

        return sysfs_emit(buf, "%llu\n", cnt);
}

static DEVICE_ATTR(pcie_replay_count, 0444,
                amdgpu_device_get_pcie_replay_count, NULL);
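
/*
 * Userspace sketch (illustrative; the sysfs path shown is the usual DRM
 * layout, not guaranteed for every system): the attribute is a plain text
 * file readable like any other sysfs node:
 *
 *   unsigned long long replays = 0;
 *   FILE *f = fopen("/sys/class/drm/card0/device/pcie_replay_count", "r");
 *
 *   if (f) {
 *           if (fscanf(f, "%llu", &replays) == 1)
 *                   printf("PCIe replays: %llu\n", replays);
 *           fclose(f);
 *   }
 */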

static ssize_t amdgpu_sysfs_reg_state_get(struct file *f, struct kobject *kobj,
                                          struct bin_attribute *attr, char *buf,
                                          loff_t ppos, size_t count)
{
        struct device *dev = kobj_to_dev(kobj);
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);
        ssize_t bytes_read;

        switch (ppos) {
        case AMDGPU_SYS_REG_STATE_XGMI:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_XGMI, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_WAFL:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_WAFL, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_PCIE:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_PCIE, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_USR:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_USR, buf, count);
                break;
        case AMDGPU_SYS_REG_STATE_USR_1:
                bytes_read = amdgpu_asic_get_reg_state(
                        adev, AMDGPU_REG_STATE_TYPE_USR_1, buf, count);
                break;
        default:
                return -EINVAL;
        }

        return bytes_read;
}

BIN_ATTR(reg_state, 0444, amdgpu_sysfs_reg_state_get, NULL,
         AMDGPU_SYS_REG_STATE_END);
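
/*
 * Userspace sketch (illustrative; the sysfs path shown is the usual DRM
 * layout, not guaranteed): @ppos acts as a selector rather than a byte
 * offset, so a reader seeks to one of the AMDGPU_SYS_REG_STATE_* values,
 * e.g. with pread():
 *
 *   char buf[4096];
 *   int fd = open("/sys/class/drm/card0/device/reg_state", O_RDONLY);
 *   ssize_t n = pread(fd, buf, sizeof(buf), AMDGPU_SYS_REG_STATE_PCIE);
 */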

int amdgpu_reg_state_sysfs_init(struct amdgpu_device *adev)
{
        int ret;

        if (!amdgpu_asic_get_reg_state_supported(adev))
                return 0;

        ret = sysfs_create_bin_file(&adev->dev->kobj, &bin_attr_reg_state);

        return ret;
}

void amdgpu_reg_state_sysfs_fini(struct amdgpu_device *adev)
{
        if (!amdgpu_asic_get_reg_state_supported(adev))
                return;
        sysfs_remove_bin_file(&adev->dev->kobj, &bin_attr_reg_state);
}

int amdgpu_ip_block_suspend(struct amdgpu_ip_block *ip_block)
{
        int r;

        if (ip_block->version->funcs->suspend) {
                r = ip_block->version->funcs->suspend(ip_block);
                if (r) {
                        dev_err(ip_block->adev->dev,
                                "suspend of IP block <%s> failed %d\n",
                                ip_block->version->funcs->name, r);
                        return r;
                }
        }

        ip_block->status.hw = false;
        return 0;
}

int amdgpu_ip_block_resume(struct amdgpu_ip_block *ip_block)
{
        int r;

        if (ip_block->version->funcs->resume) {
                r = ip_block->version->funcs->resume(ip_block);
                if (r) {
                        dev_err(ip_block->adev->dev,
                                "resume of IP block <%s> failed %d\n",
                                ip_block->version->funcs->name, r);
                        return r;
                }
        }

        ip_block->status.hw = true;
        return 0;
}
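
/*
 * Usage sketch (illustrative): callers typically walk the IP block array,
 * suspending in reverse init order and resuming in init order:
 *
 *   for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
 *           r = amdgpu_ip_block_suspend(&adev->ip_blocks[i]);
 *           if (r)
 *                   return r;
 *   }
 */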

/**
 * DOC: board_info
 *
 * The amdgpu driver provides a sysfs API for giving board related information.
 * It provides the form factor information in the format
 *
 *   type : form factor
 *
 * Possible form factor values
 *
 * - "cem"              - PCIe CEM card
 * - "oam"              - Open Compute Accelerator Module
 * - "unknown"          - Not known
 *
 */

static ssize_t amdgpu_device_get_board_info(struct device *dev,
                                            struct device_attribute *attr,
                                            char *buf)
{
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);
        enum amdgpu_pkg_type pkg_type = AMDGPU_PKG_TYPE_CEM;
        const char *pkg;

        if (adev->smuio.funcs && adev->smuio.funcs->get_pkg_type)
                pkg_type = adev->smuio.funcs->get_pkg_type(adev);

        switch (pkg_type) {
        case AMDGPU_PKG_TYPE_CEM:
                pkg = "cem";
                break;
        case AMDGPU_PKG_TYPE_OAM:
                pkg = "oam";
                break;
        default:
                pkg = "unknown";
                break;
        }

        return sysfs_emit(buf, "%s : %s\n", "type", pkg);
}

static DEVICE_ATTR(board_info, 0444, amdgpu_device_get_board_info, NULL);

static struct attribute *amdgpu_board_attrs[] = {
        &dev_attr_board_info.attr,
        NULL,
};

static umode_t amdgpu_board_attrs_is_visible(struct kobject *kobj,
                                             struct attribute *attr, int n)
{
        struct device *dev = kobj_to_dev(kobj);
        struct drm_device *ddev = dev_get_drvdata(dev);
        struct amdgpu_device *adev = drm_to_adev(ddev);

        if (adev->flags & AMD_IS_APU)
                return 0;

        return attr->mode;
}

static const struct attribute_group amdgpu_board_attrs_group = {
        .attrs = amdgpu_board_attrs,
        .is_visible = amdgpu_board_attrs_is_visible
};

static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev);


/**
 * amdgpu_device_supports_px - Is the device a dGPU with ATPX power control
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with ATPX power control,
 * otherwise returns false.
 */
bool amdgpu_device_supports_px(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        if ((adev->flags & AMD_IS_PX) && !amdgpu_is_atpx_hybrid())
                return true;
        return false;
}

/**
 * amdgpu_device_supports_boco - Is the device a dGPU with ACPI power resources
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with ACPI power control,
 * otherwise returns false.
 */
bool amdgpu_device_supports_boco(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        if (!IS_ENABLED(CONFIG_HOTPLUG_PCI_PCIE))
                return false;

        if (adev->has_pr3 ||
            ((adev->flags & AMD_IS_PX) && amdgpu_is_atpx_hybrid()))
                return true;
        return false;
}

/**
 * amdgpu_device_supports_baco - Does the device support BACO
 *
 * @dev: drm_device pointer
 *
 * Return:
 * 1 if the device supports BACO;
 * 3 if the device supports MACO (which only works if BACO is supported);
 * otherwise 0.
 */
int amdgpu_device_supports_baco(struct drm_device *dev)
{
        struct amdgpu_device *adev = drm_to_adev(dev);

        return amdgpu_asic_supports_baco(adev);
}

void amdgpu_device_detect_runtime_pm_mode(struct amdgpu_device *adev)
{
        struct drm_device *dev;
        int bamaco_support;

        dev = adev_to_drm(adev);

        adev->pm.rpm_mode = AMDGPU_RUNPM_NONE;
        bamaco_support = amdgpu_device_supports_baco(dev);

        switch (amdgpu_runtime_pm) {
        case 2:
                if (bamaco_support & MACO_SUPPORT) {
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BAMACO;
                        dev_info(adev->dev, "Forcing BAMACO for runtime pm\n");
                } else if (bamaco_support == BACO_SUPPORT) {
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                        dev_info(adev->dev, "Requested mode BAMACO not available, falling back to BACO\n");
                }
                break;
        case 1:
                if (bamaco_support & BACO_SUPPORT) {
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                        dev_info(adev->dev, "Forcing BACO for runtime pm\n");
                }
                break;
        case -1:
        case -2:
                if (amdgpu_device_supports_px(dev)) { /* enable PX as runtime mode */
                        adev->pm.rpm_mode = AMDGPU_RUNPM_PX;
                        dev_info(adev->dev, "Using ATPX for runtime pm\n");
                } else if (amdgpu_device_supports_boco(dev)) { /* enable boco as runtime mode */
                        adev->pm.rpm_mode = AMDGPU_RUNPM_BOCO;
                        dev_info(adev->dev, "Using BOCO for runtime pm\n");
                } else {
                        if (!bamaco_support)
                                goto no_runtime_pm;

                        switch (adev->asic_type) {
                        case CHIP_VEGA20:
                        case CHIP_ARCTURUS:
                                /* BACO is not supported on vega20 and arcturus */
                                break;
                        case CHIP_VEGA10:
                                /* enable BACO as runpm mode if noretry=0 */
                                if (!adev->gmc.noretry)
                                        adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                                break;
                        default:
                                /* enable BACO as runpm mode on CI+ */
                                adev->pm.rpm_mode = AMDGPU_RUNPM_BACO;
                                break;
                        }

                        if (adev->pm.rpm_mode == AMDGPU_RUNPM_BACO) {
                                if (bamaco_support & MACO_SUPPORT) {
                                        adev->pm.rpm_mode = AMDGPU_RUNPM_BAMACO;
                                        dev_info(adev->dev, "Using BAMACO for runtime pm\n");
                                } else {
                                        dev_info(adev->dev, "Using BACO for runtime pm\n");
                                }
                        }
                }
                break;
        case 0:
                dev_info(adev->dev, "runtime pm is manually disabled\n");
                break;
        default:
                break;
        }

no_runtime_pm:
        if (adev->pm.rpm_mode == AMDGPU_RUNPM_NONE)
                dev_info(adev->dev, "Runtime PM not available\n");
}
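
/*
 * Note (illustrative): amdgpu_runtime_pm above is backed by the "runpm"
 * module parameter, so the cases handled above correspond to e.g.:
 *
 *   modprobe amdgpu runpm=2     (force BAMACO where supported)
 *   modprobe amdgpu runpm=1     (force BACO)
 *   modprobe amdgpu runpm=0     (disable runtime pm)
 *   modprobe amdgpu runpm=-1    (automatic selection, the default)
 */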
/**
 * amdgpu_device_supports_smart_shift - Is the device a dGPU with
 * Smart Shift support
 *
 * @dev: drm_device pointer
 *
 * Returns true if the device is a dGPU with Smart Shift support,
 * otherwise returns false.
 */
bool amdgpu_device_supports_smart_shift(struct drm_device *dev)
{
        return (amdgpu_device_supports_boco(dev) &&
                amdgpu_acpi_is_power_shift_control_supported());
}

/*
 * VRAM access helper functions
 */

/**
 * amdgpu_device_mm_access - access vram by MM_INDEX/MM_DATA
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; the buffer at @buf must be at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 */
void amdgpu_device_mm_access(struct amdgpu_device *adev, loff_t pos,
                             void *buf, size_t size, bool write)
{
        unsigned long flags;
        uint32_t hi = ~0, tmp = 0;
        uint32_t *data = buf;
        uint64_t last;
        int idx;

        if (!drm_dev_enter(adev_to_drm(adev), &idx))
                return;

        BUG_ON(!IS_ALIGNED(pos, 4) || !IS_ALIGNED(size, 4));

        spin_lock_irqsave(&adev->mmio_idx_lock, flags);
        for (last = pos + size; pos < last; pos += 4) {
                tmp = pos >> 31;

                WREG32_NO_KIQ(mmMM_INDEX, ((uint32_t)pos) | 0x80000000);
                if (tmp != hi) {
                        WREG32_NO_KIQ(mmMM_INDEX_HI, tmp);
                        hi = tmp;
                }
                if (write)
                        WREG32_NO_KIQ(mmMM_DATA, *data++);
                else
                        *data++ = RREG32_NO_KIQ(mmMM_DATA);
        }

        spin_unlock_irqrestore(&adev->mmio_idx_lock, flags);
        drm_dev_exit(idx);
}

/**
 * amdgpu_device_aper_access - access vram by vram aperture
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; the buffer at @buf must be at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 *
 * Returns the number of bytes transferred.
 */
size_t amdgpu_device_aper_access(struct amdgpu_device *adev, loff_t pos,
                                 void *buf, size_t size, bool write)
{
#ifdef CONFIG_64BIT
        void __iomem *addr;
        size_t count = 0;
        uint64_t last;

        if (!adev->mman.aper_base_kaddr)
                return 0;

        last = min(pos + size, adev->gmc.visible_vram_size);
        if (last > pos) {
                addr = adev->mman.aper_base_kaddr + pos;
                count = last - pos;

                if (write) {
                        memcpy_toio(addr, buf, count);
                        /* Make sure the HDP write cache flush happens without any
                         * reordering after the system memory contents are sent
                         * over the PCIe device
                         */
                        mb();
                        amdgpu_device_flush_hdp(adev, NULL);
                } else {
                        amdgpu_device_invalidate_hdp(adev, NULL);
                        /* Make sure the HDP read cache is invalidated before
                         * issuing a read to the PCIe device
                         */
                        mb();
                        memcpy_fromio(buf, addr, count);
                }

        }

        return count;
#else
        return 0;
#endif
}

/**
 * amdgpu_device_vram_access - read/write a buffer in vram
 *
 * @adev: amdgpu_device pointer
 * @pos: offset of the buffer in vram
 * @buf: virtual address of the buffer in system memory
 * @size: read/write size; the buffer at @buf must be at least @size bytes
 * @write: true - write to vram, otherwise - read from vram
 */
void amdgpu_device_vram_access(struct amdgpu_device *adev, loff_t pos,
                               void *buf, size_t size, bool write)
{
        size_t count;

        /* try to use the vram aperture to access vram first */
        count = amdgpu_device_aper_access(adev, pos, buf, size, write);
        size -= count;
        if (size) {
                /* use MM to access the rest of vram */
                pos += count;
                buf += count;
                amdgpu_device_mm_access(adev, pos, buf, size, write);
        }
}
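
/*
 * Usage sketch (illustrative): reading one dword at a 4-byte-aligned VRAM
 * offset, letting the helper pick the aperture or MM_INDEX/MM_DATA path:
 *
 *   uint32_t val;
 *
 *   amdgpu_device_vram_access(adev, pos, &val, sizeof(val), false);
 */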

/*
 * register access helper functions.
 */

/* Check if hw access should be skipped because of hotplug or device error */
bool amdgpu_device_skip_hw_access(struct amdgpu_device *adev)
{
        if (adev->no_hw_access)
                return true;

#ifdef CONFIG_LOCKDEP
        /*
         * This is a bit complicated to understand, so worth a comment. What we assert
         * here is that the GPU reset is not running on another thread in parallel.
         *
         * For this we trylock the read side of the reset semaphore, if that succeeds
         * we know that the reset is not running in parallel.
         *
         * If the trylock fails we assert that we are either already holding the read
         * side of the lock or are the reset thread itself and hold the write side of
         * the lock.
         */
        if (in_task()) {
                if (down_read_trylock(&adev->reset_domain->sem))
                        up_read(&adev->reset_domain->sem);
                else
                        lockdep_assert_held(&adev->reset_domain->sem);
        }
#endif
        return false;
}

/**
 * amdgpu_device_rreg - read a memory mapped IO or indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @acc_flags: access flags which require special behavior
 *
 * Returns the 32 bit value from the offset specified.
 */
uint32_t amdgpu_device_rreg(struct amdgpu_device *adev,
                            uint32_t reg, uint32_t acc_flags)
{
        uint32_t ret;

        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if ((reg * 4) < adev->rmmio_size) {
                if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        ret = amdgpu_kiq_rreg(adev, reg, 0);
                        up_read(&adev->reset_domain->sem);
                } else {
                        ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                ret = adev->pcie_rreg(adev, reg * 4);
        }

        trace_amdgpu_device_rreg(adev->pdev->device, reg, ret);

        return ret;
}

/*
 * MMIO register read with bytes helper functions
 * @offset: byte offset from MMIO start
 */

/**
 * amdgpu_mm_rreg8 - read a memory mapped IO register
 *
 * @adev: amdgpu_device pointer
 * @offset: byte aligned register offset
 *
 * Returns the 8 bit value from the offset specified.
 */
uint8_t amdgpu_mm_rreg8(struct amdgpu_device *adev, uint32_t offset)
{
        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if (offset < adev->rmmio_size)
                return (readb(adev->rmmio + offset));
        BUG();
}


/**
 * amdgpu_device_xcc_rreg - read a memory mapped IO or indirect register with specific XCC
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @acc_flags: access flags which require special behavior
 * @xcc_id: xcc accelerated compute core id
 *
 * Returns the 32 bit value from the offset specified.
 */
uint32_t amdgpu_device_xcc_rreg(struct amdgpu_device *adev,
                                uint32_t reg, uint32_t acc_flags,
                                uint32_t xcc_id)
{
        uint32_t ret, rlcg_flag;

        if (amdgpu_device_skip_hw_access(adev))
                return 0;

        if ((reg * 4) < adev->rmmio_size) {
                if (amdgpu_sriov_vf(adev) &&
                    !amdgpu_sriov_runtime(adev) &&
                    adev->gfx.rlc.rlcg_reg_access_supported &&
                    amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags,
                                                         GC_HWIP, false,
                                                         &rlcg_flag)) {
                        ret = amdgpu_virt_rlcg_reg_rw(adev, reg, 0, rlcg_flag, GET_INST(GC, xcc_id));
                } else if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        ret = amdgpu_kiq_rreg(adev, reg, xcc_id);
                        up_read(&adev->reset_domain->sem);
                } else {
                        ret = readl(((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                ret = adev->pcie_rreg(adev, reg * 4);
        }

        return ret;
}

/*
 * MMIO register write with bytes helper functions
 * @offset: byte offset from MMIO start
 * @value: the value to be written to the register
 */

/**
 * amdgpu_mm_wreg8 - write a memory mapped IO register
 *
 * @adev: amdgpu_device pointer
 * @offset: byte aligned register offset
 * @value: 8 bit value to write
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_mm_wreg8(struct amdgpu_device *adev, uint32_t offset, uint8_t value)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (offset < adev->rmmio_size)
                writeb(value, adev->rmmio + offset);
        else
                BUG();
}

/**
 * amdgpu_device_wreg - write to a memory mapped IO or indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @v: 32 bit value to write to the register
 * @acc_flags: access flags which require special behavior
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_device_wreg(struct amdgpu_device *adev,
                        uint32_t reg, uint32_t v,
                        uint32_t acc_flags)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if ((reg * 4) < adev->rmmio_size) {
                if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        amdgpu_kiq_wreg(adev, reg, v, 0);
                        up_read(&adev->reset_domain->sem);
                } else {
                        writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                adev->pcie_wreg(adev, reg * 4, v);
        }

        trace_amdgpu_device_wreg(adev->pdev->device, reg, v);
}
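
/*
 * Note (illustrative): most driver code does not call these helpers directly
 * but uses the register macros, which are typically defined along the lines
 * of:
 *
 *   #define RREG32(reg)    amdgpu_device_rreg(adev, (reg), 0)
 *   #define WREG32(reg, v) amdgpu_device_wreg(adev, (reg), (v), 0)
 */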

/**
 * amdgpu_mm_wreg_mmio_rlc -  write register either with direct/indirect mmio or with RLC path if in range
 *
 * @adev: amdgpu_device pointer
 * @reg: mmio/rlc register
 * @v: value to write
 * @xcc_id: xcc accelerated compute core id
 *
 * This function is invoked only for debugfs register access.
 */
void amdgpu_mm_wreg_mmio_rlc(struct amdgpu_device *adev,
                             uint32_t reg, uint32_t v,
                             uint32_t xcc_id)
{
        if (amdgpu_device_skip_hw_access(adev))
                return;

        if (amdgpu_sriov_fullaccess(adev) &&
            adev->gfx.rlc.funcs &&
            adev->gfx.rlc.funcs->is_rlcg_access_range) {
                if (adev->gfx.rlc.funcs->is_rlcg_access_range(adev, reg))
                        return amdgpu_sriov_wreg(adev, reg, v, 0, 0, xcc_id);
        } else if ((reg * 4) >= adev->rmmio_size) {
                adev->pcie_wreg(adev, reg * 4, v);
        } else {
                writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
        }
}

/**
 * amdgpu_device_xcc_wreg - write to a memory mapped IO or indirect register with specific XCC
 *
 * @adev: amdgpu_device pointer
 * @reg: dword aligned register offset
 * @v: 32 bit value to write to the register
 * @acc_flags: access flags which require special behavior
 * @xcc_id: xcc accelerated compute core id
 *
 * Writes the value specified to the offset specified.
 */
void amdgpu_device_xcc_wreg(struct amdgpu_device *adev,
                        uint32_t reg, uint32_t v,
                        uint32_t acc_flags, uint32_t xcc_id)
{
        uint32_t rlcg_flag;

        if (amdgpu_device_skip_hw_access(adev))
                return;

        if ((reg * 4) < adev->rmmio_size) {
                if (amdgpu_sriov_vf(adev) &&
                    !amdgpu_sriov_runtime(adev) &&
                    adev->gfx.rlc.rlcg_reg_access_supported &&
                    amdgpu_virt_get_rlcg_reg_access_flag(adev, acc_flags,
                                                         GC_HWIP, true,
                                                         &rlcg_flag)) {
                        amdgpu_virt_rlcg_reg_rw(adev, reg, v, rlcg_flag, GET_INST(GC, xcc_id));
                } else if (!(acc_flags & AMDGPU_REGS_NO_KIQ) &&
                    amdgpu_sriov_runtime(adev) &&
                    down_read_trylock(&adev->reset_domain->sem)) {
                        amdgpu_kiq_wreg(adev, reg, v, xcc_id);
                        up_read(&adev->reset_domain->sem);
                } else {
                        writel(v, ((void __iomem *)adev->rmmio) + (reg * 4));
                }
        } else {
                adev->pcie_wreg(adev, reg * 4, v);
        }
}

/**
 * amdgpu_device_indirect_rreg - read an indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register address to read from
 *
 * Returns the value of indirect register @reg_addr
 */
u32 amdgpu_device_indirect_rreg(struct amdgpu_device *adev,
                                u32 reg_addr)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;
        u32 r;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        r = readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}
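
/*
 * Note (illustrative; soc_pcie_rreg/soc_pcie_wreg are hypothetical names):
 * ASIC setup code typically routes the adev->pcie_rreg/pcie_wreg callbacks
 * to these index/data-pair helpers, e.g.:
 *
 *   static u32 soc_pcie_rreg(struct amdgpu_device *adev, u32 reg)
 *   {
 *           return amdgpu_device_indirect_rreg(adev, reg);
 *   }
 *   ...
 *   adev->pcie_rreg = &soc_pcie_rreg;
 */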

u32 amdgpu_device_indirect_rreg_ext(struct amdgpu_device *adev,
                                    u64 reg_addr)
{
        unsigned long flags, pcie_index, pcie_index_hi, pcie_data;
        u32 r;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;

        if (unlikely(!adev->nbio.funcs)) {
                pcie_index = AMDGPU_PCIE_INDEX_FALLBACK;
                pcie_data = AMDGPU_PCIE_DATA_FALLBACK;
        } else {
                pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
                pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        }

        if (reg_addr >> 32) {
                if (unlikely(!adev->nbio.funcs))
                        pcie_index_hi = AMDGPU_PCIE_INDEX_HI_FALLBACK;
                else
                        pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
        } else {
                pcie_index_hi = 0;
        }

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                                pcie_index_hi * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        r = readl(pcie_data_offset);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

/**
 * amdgpu_device_indirect_rreg64 - read a 64 bit indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register address to read from
 *
 * Returns the value of indirect register @reg_addr
 */
u64 amdgpu_device_indirect_rreg64(struct amdgpu_device *adev,
                                  u32 reg_addr)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;
        u64 r;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        /* read low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        r = readl(pcie_data_offset);
        /* read high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        r |= ((u64)readl(pcie_data_offset) << 32);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

u64 amdgpu_device_indirect_rreg64_ext(struct amdgpu_device *adev,
                                  u64 reg_addr)
{
        unsigned long flags, pcie_index, pcie_data;
        unsigned long pcie_index_hi = 0;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;
        u64 r;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
                pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                        pcie_index_hi * 4;

        /* read low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        r = readl(pcie_data_offset);
        /* read high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        r |= ((u64)readl(pcie_data_offset) << 32);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);

        return r;
}

/**
 * amdgpu_device_indirect_wreg - write to an indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register offset
 * @reg_data: indirect register data
 *
 */
void amdgpu_device_indirect_wreg(struct amdgpu_device *adev,
                                 u32 reg_addr, u32 reg_data)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        writel(reg_data, pcie_data_offset);
        readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

void amdgpu_device_indirect_wreg_ext(struct amdgpu_device *adev,
                                     u64 reg_addr, u32 reg_data)
{
        unsigned long flags, pcie_index, pcie_index_hi, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
                pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);
        else
                pcie_index_hi = 0;

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                                pcie_index_hi * 4;

        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        writel(reg_data, pcie_data_offset);
        readl(pcie_data_offset);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

/**
 * amdgpu_device_indirect_wreg64 - write to a 64 bit indirect register
 *
 * @adev: amdgpu_device pointer
 * @reg_addr: indirect register offset
 * @reg_data: indirect register data
 *
 */
void amdgpu_device_indirect_wreg64(struct amdgpu_device *adev,
                                   u32 reg_addr, u64 reg_data)
{
        unsigned long flags, pcie_index, pcie_data;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;

        /* write low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
        readl(pcie_data_offset);
        /* write high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        writel((u32)(reg_data >> 32), pcie_data_offset);
        readl(pcie_data_offset);
        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

void amdgpu_device_indirect_wreg64_ext(struct amdgpu_device *adev,
                                   u64 reg_addr, u64 reg_data)
{
        unsigned long flags, pcie_index, pcie_data;
        unsigned long pcie_index_hi = 0;
        void __iomem *pcie_index_offset;
        void __iomem *pcie_index_hi_offset;
        void __iomem *pcie_data_offset;

        pcie_index = adev->nbio.funcs->get_pcie_index_offset(adev);
        pcie_data = adev->nbio.funcs->get_pcie_data_offset(adev);
        if ((reg_addr >> 32) && (adev->nbio.funcs->get_pcie_index_hi_offset))
                pcie_index_hi = adev->nbio.funcs->get_pcie_index_hi_offset(adev);

        spin_lock_irqsave(&adev->pcie_idx_lock, flags);
        pcie_index_offset = (void __iomem *)adev->rmmio + pcie_index * 4;
        pcie_data_offset = (void __iomem *)adev->rmmio + pcie_data * 4;
        if (pcie_index_hi != 0)
                pcie_index_hi_offset = (void __iomem *)adev->rmmio +
                                pcie_index_hi * 4;

        /* write low 32 bits */
        writel(reg_addr, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        writel((u32)(reg_data & 0xffffffffULL), pcie_data_offset);
        readl(pcie_data_offset);
        /* write high 32 bits */
        writel(reg_addr + 4, pcie_index_offset);
        readl(pcie_index_offset);
        if (pcie_index_hi != 0) {
                writel((reg_addr >> 32) & 0xff, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }
        writel((u32)(reg_data >> 32), pcie_data_offset);
        readl(pcie_data_offset);

        /* clear the high bits */
        if (pcie_index_hi != 0) {
                writel(0, pcie_index_hi_offset);
                readl(pcie_index_hi_offset);
        }

        spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
}

/**
 * amdgpu_device_get_rev_id - query device rev_id
 *
 * @adev: amdgpu_device pointer
 *
 * Return device rev_id
 */
u32 amdgpu_device_get_rev_id(struct amdgpu_device *adev)
{
        return adev->nbio.funcs->get_rev_id(adev);
}

/**
 * amdgpu_invalid_rreg - dummy reg read function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint32_t amdgpu_invalid_rreg(struct amdgpu_device *adev, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%04X\n", reg);
        BUG();
        return 0;
}

static uint32_t amdgpu_invalid_rreg_ext(struct amdgpu_device *adev, uint64_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%llX\n", reg);
        BUG();
        return 0;
}

/**
 * amdgpu_invalid_wreg - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_invalid_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
{
        DRM_ERROR("Invalid callback to write register 0x%04X with 0x%08X\n",
                  reg, v);
        BUG();
}

static void amdgpu_invalid_wreg_ext(struct amdgpu_device *adev, uint64_t reg, uint32_t v)
{
        DRM_ERROR("Invalid callback to write register 0x%llX with 0x%08X\n",
                  reg, v);
        BUG();
}

/**
 * amdgpu_invalid_rreg64 - dummy 64 bit reg read function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint64_t amdgpu_invalid_rreg64(struct amdgpu_device *adev, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read 64 bit register 0x%04X\n", reg);
        BUG();
        return 0;
}

static uint64_t amdgpu_invalid_rreg64_ext(struct amdgpu_device *adev, uint64_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%llX\n", reg);
        BUG();
        return 0;
}

/**
 * amdgpu_invalid_wreg64 - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_invalid_wreg64(struct amdgpu_device *adev, uint32_t reg, uint64_t v)
{
        DRM_ERROR("Invalid callback to write 64 bit register 0x%04X with 0x%08llX\n",
                  reg, v);
        BUG();
}

static void amdgpu_invalid_wreg64_ext(struct amdgpu_device *adev, uint64_t reg, uint64_t v)
{
        DRM_ERROR("Invalid callback to write 64 bit register 0x%llX with 0x%08llX\n",
                  reg, v);
        BUG();
}

/**
 * amdgpu_block_invalid_rreg - dummy reg read function
 *
 * @adev: amdgpu_device pointer
 * @block: offset of instance
 * @reg: offset of register
 *
 * Dummy register read function.  Used for register blocks
 * that certain asics don't have (all asics).
 * Returns the value in the register.
 */
static uint32_t amdgpu_block_invalid_rreg(struct amdgpu_device *adev,
                                          uint32_t block, uint32_t reg)
{
        DRM_ERROR("Invalid callback to read register 0x%04X in block 0x%04X\n",
                  reg, block);
        BUG();
        return 0;
}

/**
 * amdgpu_block_invalid_wreg - dummy reg write function
 *
 * @adev: amdgpu_device pointer
 * @block: offset of instance
 * @reg: offset of register
 * @v: value to write to the register
 *
 * Dummy register write function.  Used for register blocks
 * that certain asics don't have (all asics).
 */
static void amdgpu_block_invalid_wreg(struct amdgpu_device *adev,
                                      uint32_t block,
                                      uint32_t reg, uint32_t v)
{
        DRM_ERROR("Invalid block callback to write register 0x%04X in block 0x%04X with 0x%08X\n",
                  reg, block, v);
        BUG();
}

/**
 * amdgpu_device_asic_init - Wrapper for atom asic_init
 *
 * @adev: amdgpu_device pointer
 *
 * Does any asic specific work and then calls atom asic init.
 */
static int amdgpu_device_asic_init(struct amdgpu_device *adev)
{
        int ret;

        amdgpu_asic_pre_asic_init(adev);

        if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
            amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4) ||
            amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 5, 0) ||
            amdgpu_ip_version(adev, GC_HWIP, 0) >= IP_VERSION(11, 0, 0)) {
                amdgpu_psp_wait_for_bootloader(adev);
                ret = amdgpu_atomfirmware_asic_init(adev, true);
                return ret;
        } else {
                return amdgpu_atom_asic_init(adev->mode_info.atom_context);
        }
}

/**
 * amdgpu_device_mem_scratch_init - allocate the VRAM scratch page
 *
 * @adev: amdgpu_device pointer
 *
 * Allocates a scratch page of VRAM for use by various things in the
 * driver.
 */
static int amdgpu_device_mem_scratch_init(struct amdgpu_device *adev)
{
        return amdgpu_bo_create_kernel(adev, AMDGPU_GPU_PAGE_SIZE, PAGE_SIZE,
                                       AMDGPU_GEM_DOMAIN_VRAM |
                                       AMDGPU_GEM_DOMAIN_GTT,
                                       &adev->mem_scratch.robj,
                                       &adev->mem_scratch.gpu_addr,
                                       (void **)&adev->mem_scratch.ptr);
}

/**
 * amdgpu_device_mem_scratch_fini - Free the VRAM scratch page
 *
 * @adev: amdgpu_device pointer
 *
 * Frees the VRAM scratch page.
 */
static void amdgpu_device_mem_scratch_fini(struct amdgpu_device *adev)
{
        amdgpu_bo_free_kernel(&adev->mem_scratch.robj, NULL, NULL);
}

/**
 * amdgpu_device_program_register_sequence - program an array of registers.
 *
 * @adev: amdgpu_device pointer
 * @registers: pointer to the register array
 * @array_size: size of the register array
 *
 * Programs an array of registers with AND/OR masks.
 * This is a helper for setting golden registers.
 */
void amdgpu_device_program_register_sequence(struct amdgpu_device *adev,
                                             const u32 *registers,
                                             const u32 array_size)
{
        u32 tmp, reg, and_mask, or_mask;
        int i;

        if (array_size % 3)
                return;

        for (i = 0; i < array_size; i += 3) {
                reg = registers[i + 0];
                and_mask = registers[i + 1];
                or_mask = registers[i + 2];

                if (and_mask == 0xffffffff) {
                        tmp = or_mask;
                } else {
                        tmp = RREG32(reg);
                        tmp &= ~and_mask;
                        if (adev->family >= AMDGPU_FAMILY_AI)
                                tmp |= (or_mask & and_mask);
                        else
                                tmp |= or_mask;
                }
                WREG32(reg, tmp);
        }
}
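
/*
 * Usage sketch (illustrative; the register names are hypothetical): golden
 * register tables are flat {offset, AND mask, OR mask} triplets, where an
 * AND mask of 0xffffffff means a direct write and anything else a
 * read-modify-write:
 *
 *   static const u32 golden_settings_example[] = {
 *           mmEXAMPLE_REG_A, 0xffffffff, 0x00000100,
 *           mmEXAMPLE_REG_B, 0x0000ff00, 0x00002a00,
 *   };
 *
 *   amdgpu_device_program_register_sequence(adev, golden_settings_example,
 *                                   ARRAY_SIZE(golden_settings_example));
 */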
1487
1488 /**
1489  * amdgpu_device_pci_config_reset - reset the GPU
1490  *
1491  * @adev: amdgpu_device pointer
1492  *
1493  * Resets the GPU using the pci config reset sequence.
1494  * Only applicable to asics prior to vega10.
1495  */
1496 void amdgpu_device_pci_config_reset(struct amdgpu_device *adev)
1497 {
1498         pci_write_config_dword(adev->pdev, 0x7c, AMDGPU_ASIC_RESET_DATA);
1499 }
1500
1501 /**
1502  * amdgpu_device_pci_reset - reset the GPU using generic PCI means
1503  *
1504  * @adev: amdgpu_device pointer
1505  *
1506  * Resets the GPU using generic pci reset interfaces (FLR, SBR, etc.).
1507  */
1508 int amdgpu_device_pci_reset(struct amdgpu_device *adev)
1509 {
1510         return pci_reset_function(adev->pdev);
1511 }
1512
1513 /*
1514  * amdgpu_device_wb_*()
1515  * Writeback is the method by which the GPU updates special pages in memory
1516  * with the status of certain GPU events (fences, ring pointers,etc.).
1517  */
1518
1519 /**
1520  * amdgpu_device_wb_fini - Disable Writeback and free memory
1521  *
1522  * @adev: amdgpu_device pointer
1523  *
1524  * Disables Writeback and frees the Writeback memory (all asics).
1525  * Used at driver shutdown.
1526  */
1527 static void amdgpu_device_wb_fini(struct amdgpu_device *adev)
1528 {
1529         if (adev->wb.wb_obj) {
1530                 amdgpu_bo_free_kernel(&adev->wb.wb_obj,
1531                                       &adev->wb.gpu_addr,
1532                                       (void **)&adev->wb.wb);
1533                 adev->wb.wb_obj = NULL;
1534         }
1535 }
1536
1537 /**
1538  * amdgpu_device_wb_init - Init Writeback driver info and allocate memory
1539  *
1540  * @adev: amdgpu_device pointer
1541  *
1542  * Initializes writeback and allocates writeback memory (all asics).
1543  * Used at driver startup.
1544  * Returns 0 on success or a negative error code on failure.
1545  */
1546 static int amdgpu_device_wb_init(struct amdgpu_device *adev)
1547 {
1548         int r;
1549
1550         if (adev->wb.wb_obj == NULL) {
1551                 /* AMDGPU_MAX_WB * sizeof(uint32_t) * 8 = AMDGPU_MAX_WB 256-bit slots */
1552                 r = amdgpu_bo_create_kernel(adev, AMDGPU_MAX_WB * sizeof(uint32_t) * 8,
1553                                             PAGE_SIZE, AMDGPU_GEM_DOMAIN_GTT,
1554                                             &adev->wb.wb_obj, &adev->wb.gpu_addr,
1555                                             (void **)&adev->wb.wb);
1556                 if (r) {
1557                         dev_warn(adev->dev, "(%d) create WB bo failed\n", r);
1558                         return r;
1559                 }
1560
1561                 adev->wb.num_wb = AMDGPU_MAX_WB;
1562                 memset(&adev->wb.used, 0, sizeof(adev->wb.used));
1563
1564                 /* clear wb memory */
1565                 memset((char *)adev->wb.wb, 0, AMDGPU_MAX_WB * sizeof(uint32_t) * 8);
1566         }
1567
1568         return 0;
1569 }
1570
1571 /**
1572  * amdgpu_device_wb_get - Allocate a wb entry
1573  *
1574  * @adev: amdgpu_device pointer
1575  * @wb: wb index
1576  *
1577  * Allocate a wb slot for use by the driver (all asics).
1578  * Returns 0 on success or -EINVAL on failure.
1579  */
1580 int amdgpu_device_wb_get(struct amdgpu_device *adev, u32 *wb)
1581 {
1582         unsigned long flags, offset;
1583
1584         spin_lock_irqsave(&adev->wb.lock, flags);
1585         offset = find_first_zero_bit(adev->wb.used, adev->wb.num_wb);
1586         if (offset < adev->wb.num_wb) {
1587                 __set_bit(offset, adev->wb.used);
1588                 spin_unlock_irqrestore(&adev->wb.lock, flags);
1589                 *wb = offset << 3; /* convert to dw offset */
1590                 return 0;
1591         } else {
1592                 spin_unlock_irqrestore(&adev->wb.lock, flags);
1593                 return -EINVAL;
1594         }
1595 }
1596
1597 /**
1598  * amdgpu_device_wb_free - Free a wb entry
1599  *
1600  * @adev: amdgpu_device pointer
1601  * @wb: wb index
1602  *
1603  * Free a wb slot allocated for use by the driver (all asics)
1604  */
1605 void amdgpu_device_wb_free(struct amdgpu_device *adev, u32 wb)
1606 {
1607         unsigned long flags;
1608
1609         wb >>= 3;
1610         spin_lock_irqsave(&adev->wb.lock, flags);
1611         if (wb < adev->wb.num_wb)
1612                 __clear_bit(wb, adev->wb.used);
1613         spin_unlock_irqrestore(&adev->wb.lock, flags);
1614 }
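
/*
 * Sketch of the typical writeback slot lifecycle (illustrative; the fence
 * driver fields below stand in for any real consumer). amdgpu_device_wb_get()
 * hands back a dword index into the CPU mapping at adev->wb.wb.
 *
 *   u32 wb;
 *
 *   if (amdgpu_device_wb_get(adev, &wb))
 *           return -EINVAL;                                 // no free 256-bit slot
 *   ring->fence_drv.cpu_addr = &adev->wb.wb[wb];            // CPU reads here
 *   ring->fence_drv.gpu_addr = adev->wb.gpu_addr + wb * 4;  // GPU writes here
 *   ...
 *   amdgpu_device_wb_free(adev, wb);                        // on teardown
 */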
1615
1616 /**
1617  * amdgpu_device_resize_fb_bar - try to resize FB BAR
1618  *
1619  * @adev: amdgpu_device pointer
1620  *
1621  * Try to resize the FB BAR to make all VRAM CPU accessible. We try very hard
1622  * not to fail, but if any of the BARs is not accessible after the resize we
1623  * abort driver loading by returning -ENODEV.
1624  */
1625 int amdgpu_device_resize_fb_bar(struct amdgpu_device *adev)
1626 {
1627         int rbar_size = pci_rebar_bytes_to_size(adev->gmc.real_vram_size);
1628         struct pci_bus *root;
1629         struct resource *res;
1630         unsigned int i;
1631         u16 cmd;
1632         int r;
1633
1634         if (!IS_ENABLED(CONFIG_PHYS_ADDR_T_64BIT))
1635                 return 0;
1636
1637         /* Bypass for VF */
1638         if (amdgpu_sriov_vf(adev))
1639                 return 0;
1640
1641         /* PCI_EXT_CAP_ID_VNDR extended capability is located at 0x100 */
1642         if (!pci_find_ext_capability(adev->pdev, PCI_EXT_CAP_ID_VNDR))
1643                 DRM_WARN("System can't access extended configuration space, please check!\n");
1644
1645         /* skip if the bios has already enabled large BAR */
1646         if (adev->gmc.real_vram_size &&
1647             (pci_resource_len(adev->pdev, 0) >= adev->gmc.real_vram_size))
1648                 return 0;
1649
1650         /* Check if the root BUS has 64-bit memory resources */
1651         root = adev->pdev->bus;
1652         while (root->parent)
1653                 root = root->parent;
1654
1655         pci_bus_for_each_resource(root, res, i) {
1656                 if (res && res->flags & (IORESOURCE_MEM | IORESOURCE_MEM_64) &&
1657                     res->start > 0x100000000ull)
1658                         break;
1659         }
1660
1661         /* Trying to resize is pointless without a root hub window above 4GB */
1662         if (!res)
1663                 return 0;
1664
1665         /* Limit the BAR size to what is available */
1666         rbar_size = min(fls(pci_rebar_get_possible_sizes(adev->pdev, 0)) - 1,
1667                         rbar_size);
1668
1669         /* Disable memory decoding while we change the BAR addresses and size */
1670         pci_read_config_word(adev->pdev, PCI_COMMAND, &cmd);
1671         pci_write_config_word(adev->pdev, PCI_COMMAND,
1672                               cmd & ~PCI_COMMAND_MEMORY);
1673
1674         /* Free the VRAM and doorbell BAR, we most likely need to move both. */
1675         amdgpu_doorbell_fini(adev);
1676         if (adev->asic_type >= CHIP_BONAIRE)
1677                 pci_release_resource(adev->pdev, 2);
1678
1679         pci_release_resource(adev->pdev, 0);
1680
1681         r = pci_resize_resource(adev->pdev, 0, rbar_size);
1682         if (r == -ENOSPC)
1683                 DRM_INFO("Not enough PCI address space for a large BAR.");
1684         else if (r && r != -ENOTSUPP)
1685                 DRM_ERROR("Problem resizing BAR0 (%d).", r);
1686
1687         pci_assign_unassigned_bus_resources(adev->pdev->bus);
1688
1689         /* When the doorbell or fb BAR isn't available we have no chance of
1690          * using the device.
1691          */
1692         r = amdgpu_doorbell_init(adev);
1693         if (r || (pci_resource_flags(adev->pdev, 0) & IORESOURCE_UNSET))
1694                 return -ENODEV;
1695
1696         pci_write_config_word(adev->pdev, PCI_COMMAND, cmd);
1697
1698         return 0;
1699 }
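
/*
 * Worked example (informational): ReBAR sizes are encoded as log2(bytes) - 20,
 * so 8 GB of VRAM yields pci_rebar_bytes_to_size(8ULL << 30) == 13 (2^33
 * bytes), and fls(pci_rebar_get_possible_sizes(pdev, 0)) - 1 is the largest
 * size index the endpoint advertises, which caps the request above.
 */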
1700
1701 static bool amdgpu_device_read_bios(struct amdgpu_device *adev)
1702 {
1703         if (hweight32(adev->aid_mask) && (adev->flags & AMD_IS_APU))
1704                 return false;
1705
1706         return true;
1707 }
1708
1709 /*
1710  * GPU helpers function.
1711  */
1712 /**
1713  * amdgpu_device_need_post - check if the hw needs to be posted or not
1714  *
1715  * @adev: amdgpu_device pointer
1716  *
1717  * Check if the asic has been initialized (all asics) at driver startup,
1718  * or if a post is needed because a hw reset was performed.
1719  * Returns true if a post is needed or false if not.
1720  */
1721 bool amdgpu_device_need_post(struct amdgpu_device *adev)
1722 {
1723         uint32_t reg;
1724
1725         if (amdgpu_sriov_vf(adev))
1726                 return false;
1727
1728         if (!amdgpu_device_read_bios(adev))
1729                 return false;
1730
1731         if (amdgpu_passthrough(adev)) {
1732                 /* for FIJI: in the whole-GPU pass-through virtualization case, after a
1733                  * VM reboot some old SMC firmware still needs the driver to do a vPost,
1734                  * otherwise the GPU hangs. SMC firmware versions 22.15 and above don't
1735                  * have this flaw, so force a vPost for SMC versions below 22.15.
1736                  */
1737                 if (adev->asic_type == CHIP_FIJI) {
1738                         int err;
1739                         uint32_t fw_ver;
1740
1741                         err = request_firmware(&adev->pm.fw, "amdgpu/fiji_smc.bin", adev->dev);
1742                         /* force vPost if error occurred */
1743                         if (err)
1744                                 return true;
1745
1746                         fw_ver = *((uint32_t *)adev->pm.fw->data + 69);
1747                         release_firmware(adev->pm.fw);
1748                         if (fw_ver < 0x00160e00)
1749                                 return true;
1750                 }
1751         }
1752
1753         /* Don't post if we need to reset whole hive on init */
1754         if (adev->init_lvl->level == AMDGPU_INIT_LEVEL_MINIMAL_XGMI)
1755                 return false;
1756
1757         if (adev->has_hw_reset) {
1758                 adev->has_hw_reset = false;
1759                 return true;
1760         }
1761
1762         /* bios scratch used on CIK+ */
1763         if (adev->asic_type >= CHIP_BONAIRE)
1764                 return amdgpu_atombios_scratch_need_asic_init(adev);
1765
1766         /* check MEM_SIZE for older asics */
1767         reg = amdgpu_asic_get_config_memsize(adev);
1768
1769         if ((reg != 0) && (reg != 0xffffffff))
1770                 return false;
1771
1772         return true;
1773 }
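
/*
 * Sketch of the typical caller pattern (illustrative; the real call site is
 * elsewhere in this file):
 *
 *   if (amdgpu_device_need_post(adev)) {
 *           r = amdgpu_device_asic_init(adev);  // execute the vBIOS post
 *           if (r)
 *                   return r;
 *   }
 */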
1774
1775 /*
1776  * Check whether seamless boot is supported.
1777  *
1778  * So far we only support seamless boot on DCE 3.0 or later.
1779  * If users report that it works on older ASICs as well, we may
1780  * loosen this.
1781  */
1782 bool amdgpu_device_seamless_boot_supported(struct amdgpu_device *adev)
1783 {
1784         switch (amdgpu_seamless) {
1785         case -1:
1786                 break;
1787         case 1:
1788                 return true;
1789         case 0:
1790                 return false;
1791         default:
1792                 DRM_ERROR("Invalid value for amdgpu.seamless: %d\n",
1793                           amdgpu_seamless);
1794                 return false;
1795         }
1796
1797         if (!(adev->flags & AMD_IS_APU))
1798                 return false;
1799
1800         if (adev->mman.keep_stolen_vga_memory)
1801                 return false;
1802
1803         return amdgpu_ip_version(adev, DCE_HWIP, 0) >= IP_VERSION(3, 0, 0);
1804 }
1805
1806 /*
1807  * Intel hosts such as Rocket Lake, Alder Lake, Raptor Lake and Sapphire Rapids
1808  * don't support dynamic speed switching. Until we have confirmation from Intel
1809  * that a specific host supports it, it's safer to keep it disabled for all.
1810  *
1811  * https://edc.intel.com/content/www/us/en/design/products/platforms/details/raptor-lake-s/13th-generation-core-processors-datasheet-volume-1-of-2/005/pci-express-support/
1812  * https://gitlab.freedesktop.org/drm/amd/-/issues/2663
1813  */
1814 static bool amdgpu_device_pcie_dynamic_switching_supported(struct amdgpu_device *adev)
1815 {
1816 #if IS_ENABLED(CONFIG_X86)
1817         struct cpuinfo_x86 *c = &cpu_data(0);
1818
1819         /* eGPU change speeds based on USB4 fabric conditions */
1820         if (dev_is_removable(adev->dev))
1821                 return true;
1822
1823         if (c->x86_vendor == X86_VENDOR_INTEL)
1824                 return false;
1825 #endif
1826         return true;
1827 }
1828
1829 /**
1830  * amdgpu_device_should_use_aspm - check if the device should program ASPM
1831  *
1832  * @adev: amdgpu_device pointer
1833  *
1834  * Confirm whether the module parameter and pcie bridge agree that ASPM should
1835  * be set for this device.
1836  *
1837  * Returns true if it should be used or false if not.
1838  */
1839 bool amdgpu_device_should_use_aspm(struct amdgpu_device *adev)
1840 {
1841         switch (amdgpu_aspm) {
1842         case -1:
1843                 break;
1844         case 0:
1845                 return false;
1846         case 1:
1847                 return true;
1848         default:
1849                 return false;
1850         }
1851         if (adev->flags & AMD_IS_APU)
1852                 return false;
1853         if (!(adev->pm.pp_feature & PP_PCIE_DPM_MASK))
1854                 return false;
1855         return pcie_aspm_enabled(adev->pdev);
1856 }
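
/*
 * Illustrative gate for ASPM programming in an ASIC backend (a sketch; the
 * example_program_aspm name is hypothetical, standing in for the per-ASIC
 * ASPM programming hooks):
 *
 *   static void example_program_aspm(struct amdgpu_device *adev)
 *   {
 *           if (!amdgpu_device_should_use_aspm(adev))
 *                   return;
 *           // program the ASPM-related PCIe registers here
 *   }
 */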
1857
1858 /* if we get transitioned to only one device, take VGA back */
1859 /**
1860  * amdgpu_device_vga_set_decode - enable/disable vga decode
1861  *
1862  * @pdev: PCI device pointer
1863  * @state: enable/disable vga decode
1864  *
1865  * Enable/disable vga decode (all asics).
1866  * Returns VGA resource flags.
1867  */
1868 static unsigned int amdgpu_device_vga_set_decode(struct pci_dev *pdev,
1869                 bool state)
1870 {
1871         struct amdgpu_device *adev = drm_to_adev(pci_get_drvdata(pdev));
1872
1873         amdgpu_asic_set_vga_state(adev, state);
1874         if (state)
1875                 return VGA_RSRC_LEGACY_IO | VGA_RSRC_LEGACY_MEM |
1876                        VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1877         else
1878                 return VGA_RSRC_NORMAL_IO | VGA_RSRC_NORMAL_MEM;
1879 }
1880
1881 /**
1882  * amdgpu_device_check_block_size - validate the vm block size
1883  *
1884  * @adev: amdgpu_device pointer
1885  *
1886  * Validates the vm block size specified via module parameter.
1887  * The vm block size defines the number of bits in the page table versus the
1888  * page directory. A page is 4KB, so we have a 12-bit offset, a minimum of 9
1889  * bits in the page table, and the remaining bits in the page directory.
1890  */
1891 static void amdgpu_device_check_block_size(struct amdgpu_device *adev)
1892 {
1893         /* defines the number of bits in the page table versus the page
1894          * directory; a page is 4KB so we have a 12-bit offset, minimum 9
1895          * bits in the page table and the remaining bits in the page directory
1896          */
1897         if (amdgpu_vm_block_size == -1)
1898                 return;
1899
1900         if (amdgpu_vm_block_size < 9) {
1901                 dev_warn(adev->dev, "VM page table size (%d) too small\n",
1902                          amdgpu_vm_block_size);
1903                 amdgpu_vm_block_size = -1;
1904         }
1905 }
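
/*
 * Worked example (informational): with the minimum block size of 9 bits, one
 * page table maps 2^9 pages * 4 KB = 2 MB of address space; the remaining VA
 * bits above the 12-bit page offset select page directory entries.
 */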
1906
1907 /**
1908  * amdgpu_device_check_vm_size - validate the vm size
1909  *
1910  * @adev: amdgpu_device pointer
1911  *
1912  * Validates the vm size in GB specified via module parameter.
1913  * The VM size is the size of the GPU virtual memory space in GB.
1914  */
1915 static void amdgpu_device_check_vm_size(struct amdgpu_device *adev)
1916 {
1917         /* no need to check the default value */
1918         if (amdgpu_vm_size == -1)
1919                 return;
1920
1921         if (amdgpu_vm_size < 1) {
1922                 dev_warn(adev->dev, "VM size (%d) too small, min is 1GB\n",
1923                          amdgpu_vm_size);
1924                 amdgpu_vm_size = -1;
1925         }
1926 }
1927
1928 static void amdgpu_device_check_smu_prv_buffer_size(struct amdgpu_device *adev)
1929 {
1930         struct sysinfo si;
1931         bool is_os_64 = (sizeof(void *) == 8);
1932         uint64_t total_memory;
1933         uint64_t dram_size_seven_GB = 0x1B8000000;
1934         uint64_t dram_size_three_GB = 0xB8000000;
1935
1936         if (amdgpu_smu_memory_pool_size == 0)
1937                 return;
1938
1939         if (!is_os_64) {
1940                 DRM_WARN("Not a 64-bit OS, feature not supported\n");
1941                 goto def_value;
1942         }
1943         si_meminfo(&si);
1944         total_memory = (uint64_t)si.totalram * si.mem_unit;
1945
1946         if ((amdgpu_smu_memory_pool_size == 1) ||
1947                 (amdgpu_smu_memory_pool_size == 2)) {
1948                 if (total_memory < dram_size_three_GB)
1949                         goto def_value1;
1950         } else if ((amdgpu_smu_memory_pool_size == 4) ||
1951                 (amdgpu_smu_memory_pool_size == 8)) {
1952                 if (total_memory < dram_size_seven_GB)
1953                         goto def_value1;
1954         } else {
1955                 DRM_WARN("Smu memory pool size not supported\n");
1956                 goto def_value;
1957         }
1958         adev->pm.smu_prv_buffer_size = amdgpu_smu_memory_pool_size << 28;
1959
1960         return;
1961
1962 def_value1:
1963         DRM_WARN("Not enough system memory\n");
1964 def_value:
1965         adev->pm.smu_prv_buffer_size = 0;
1966 }
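
/*
 * Worked example (informational): amdgpu_smu_memory_pool_size is in units of
 * 256 MB (value << 28 bytes), so the accepted values 1, 2, 4 and 8 request
 * 256 MB to 2 GB, gated on roughly 3 GB or 7 GB of system RAM as checked above.
 */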
1967
1968 static int amdgpu_device_init_apu_flags(struct amdgpu_device *adev)
1969 {
1970         if (!(adev->flags & AMD_IS_APU) ||
1971             adev->asic_type < CHIP_RAVEN)
1972                 return 0;
1973
1974         switch (adev->asic_type) {
1975         case CHIP_RAVEN:
1976                 if (adev->pdev->device == 0x15dd)
1977                         adev->apu_flags |= AMD_APU_IS_RAVEN;
1978                 if (adev->pdev->device == 0x15d8)
1979                         adev->apu_flags |= AMD_APU_IS_PICASSO;
1980                 break;
1981         case CHIP_RENOIR:
1982                 if ((adev->pdev->device == 0x1636) ||
1983                     (adev->pdev->device == 0x164c))
1984                         adev->apu_flags |= AMD_APU_IS_RENOIR;
1985                 else
1986                         adev->apu_flags |= AMD_APU_IS_GREEN_SARDINE;
1987                 break;
1988         case CHIP_VANGOGH:
1989                 adev->apu_flags |= AMD_APU_IS_VANGOGH;
1990                 break;
1991         case CHIP_YELLOW_CARP:
1992                 break;
1993         case CHIP_CYAN_SKILLFISH:
1994                 if ((adev->pdev->device == 0x13FE) ||
1995                     (adev->pdev->device == 0x143F))
1996                         adev->apu_flags |= AMD_APU_IS_CYAN_SKILLFISH2;
1997                 break;
1998         default:
1999                 break;
2000         }
2001
2002         return 0;
2003 }
2004
2005 /**
2006  * amdgpu_device_check_arguments - validate module params
2007  *
2008  * @adev: amdgpu_device pointer
2009  *
2010  * Validates certain module parameters and updates
2011  * the associated values used by the driver (all asics).
2012  */
2013 static int amdgpu_device_check_arguments(struct amdgpu_device *adev)
2014 {
2015         int i;
2016
2017         if (amdgpu_sched_jobs < 4) {
2018                 dev_warn(adev->dev, "sched jobs (%d) must be at least 4\n",
2019                          amdgpu_sched_jobs);
2020                 amdgpu_sched_jobs = 4;
2021         } else if (!is_power_of_2(amdgpu_sched_jobs)) {
2022                 dev_warn(adev->dev, "sched jobs (%d) must be a power of 2\n",
2023                          amdgpu_sched_jobs);
2024                 amdgpu_sched_jobs = roundup_pow_of_two(amdgpu_sched_jobs);
2025         }
2026
2027         if (amdgpu_gart_size != -1 && amdgpu_gart_size < 32) {
2028                 /* gart size must be greater than or equal to 32M */
2029                 dev_warn(adev->dev, "gart size (%d) too small\n",
2030                          amdgpu_gart_size);
2031                 amdgpu_gart_size = -1;
2032         }
2033
2034         if (amdgpu_gtt_size != -1 && amdgpu_gtt_size < 32) {
2035                 /* gtt size must be greater than or equal to 32M */
2036                 dev_warn(adev->dev, "gtt size (%d) too small\n",
2037                                  amdgpu_gtt_size);
2038                 amdgpu_gtt_size = -1;
2039         }
2040
2041         /* valid range is between 4 and 9 inclusive */
2042         if (amdgpu_vm_fragment_size != -1 &&
2043             (amdgpu_vm_fragment_size > 9 || amdgpu_vm_fragment_size < 4)) {
2044                 dev_warn(adev->dev, "valid range is between 4 and 9\n");
2045                 amdgpu_vm_fragment_size = -1;
2046         }
2047
2048         if (amdgpu_sched_hw_submission < 2) {
2049                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be at least 2\n",
2050                          amdgpu_sched_hw_submission);
2051                 amdgpu_sched_hw_submission = 2;
2052         } else if (!is_power_of_2(amdgpu_sched_hw_submission)) {
2053                 dev_warn(adev->dev, "sched hw submission jobs (%d) must be a power of 2\n",
2054                          amdgpu_sched_hw_submission);
2055                 amdgpu_sched_hw_submission = roundup_pow_of_two(amdgpu_sched_hw_submission);
2056         }
2057
2058         if (amdgpu_reset_method < -1 || amdgpu_reset_method > 4) {
2059                 dev_warn(adev->dev, "invalid option for reset method, reverting to default\n");
2060                 amdgpu_reset_method = -1;
2061         }
2062
2063         amdgpu_device_check_smu_prv_buffer_size(adev);
2064
2065         amdgpu_device_check_vm_size(adev);
2066
2067         amdgpu_device_check_block_size(adev);
2068
2069         adev->firmware.load_type = amdgpu_ucode_get_load_type(adev, amdgpu_fw_load_type);
2070
2071         for (i = 0; i < MAX_XCP; i++)
2072                 adev->enforce_isolation[i] = !!enforce_isolation;
2073
2074         return 0;
2075 }
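
/*
 * Example (informational): an amdgpu.sched_jobs of 5 is rounded up to 8 by
 * roundup_pow_of_two() above, while 3 is first raised to the minimum of 4.
 */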
2076
2077 /**
2078  * amdgpu_switcheroo_set_state - set switcheroo state
2079  *
2080  * @pdev: pci dev pointer
2081  * @state: vga_switcheroo state
2082  *
2083  * Callback for the switcheroo driver.  Suspends or resumes the asic
2084  * when it is powered down or up via ACPI methods.
2085  */
2086 static void amdgpu_switcheroo_set_state(struct pci_dev *pdev,
2087                                         enum vga_switcheroo_state state)
2088 {
2089         struct drm_device *dev = pci_get_drvdata(pdev);
2090         int r;
2091
2092         if (amdgpu_device_supports_px(dev) && state == VGA_SWITCHEROO_OFF)
2093                 return;
2094
2095         if (state == VGA_SWITCHEROO_ON) {
2096                 pr_info("switched on\n");
2097                 /* don't suspend or resume card normally */
2098                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
2099
2100                 pci_set_power_state(pdev, PCI_D0);
2101                 amdgpu_device_load_pci_state(pdev);
2102                 r = pci_enable_device(pdev);
2103                 if (r)
2104                         DRM_WARN("pci_enable_device failed (%d)\n", r);
2105                 amdgpu_device_resume(dev, true);
2106
2107                 dev->switch_power_state = DRM_SWITCH_POWER_ON;
2108         } else {
2109                 pr_info("switched off\n");
2110                 dev->switch_power_state = DRM_SWITCH_POWER_CHANGING;
2111                 amdgpu_device_prepare(dev);
2112                 amdgpu_device_suspend(dev, true);
2113                 amdgpu_device_cache_pci_state(pdev);
2114                 /* Shut down the device */
2115                 pci_disable_device(pdev);
2116                 pci_set_power_state(pdev, PCI_D3cold);
2117                 dev->switch_power_state = DRM_SWITCH_POWER_OFF;
2118         }
2119 }
2120
2121 /**
2122  * amdgpu_switcheroo_can_switch - see if switcheroo state can change
2123  *
2124  * @pdev: pci dev pointer
2125  *
2126  * Callback for the switcheroo driver.  Checks if the switcheroo
2127  * state can be changed.
2128  * Returns true if the state can be changed, false if not.
2129  */
2130 static bool amdgpu_switcheroo_can_switch(struct pci_dev *pdev)
2131 {
2132         struct drm_device *dev = pci_get_drvdata(pdev);
2133
2134        /*
2135         * FIXME: open_count is protected by drm_global_mutex but that would lead to
2136         * locking inversion with the driver load path. And the access here is
2137         * completely racy anyway. So don't bother with locking for now.
2138         */
2139         return atomic_read(&dev->open_count) == 0;
2140 }
2141
2142 static const struct vga_switcheroo_client_ops amdgpu_switcheroo_ops = {
2143         .set_gpu_state = amdgpu_switcheroo_set_state,
2144         .reprobe = NULL,
2145         .can_switch = amdgpu_switcheroo_can_switch,
2146 };
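
/*
 * Sketch of how these ops are hooked up (illustrative; the actual
 * registration happens during device init elsewhere in this file):
 *
 *   vga_switcheroo_register_client(adev->pdev, &amdgpu_switcheroo_ops, px);
 *
 * where px indicates whether the device uses PX/ATPX runtime power control.
 */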
2147
2148 /**
2149  * amdgpu_device_ip_set_clockgating_state - set the CG state
2150  *
2151  * @dev: amdgpu_device pointer
2152  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2153  * @state: clockgating state (gate or ungate)
2154  *
2155  * Sets the requested clockgating state for all instances of
2156  * the hardware IP specified.
2157  * Returns the error code from the last instance.
2158  */
2159 int amdgpu_device_ip_set_clockgating_state(void *dev,
2160                                            enum amd_ip_block_type block_type,
2161                                            enum amd_clockgating_state state)
2162 {
2163         struct amdgpu_device *adev = dev;
2164         int i, r = 0;
2165
2166         for (i = 0; i < adev->num_ip_blocks; i++) {
2167                 if (!adev->ip_blocks[i].status.valid)
2168                         continue;
2169                 if (adev->ip_blocks[i].version->type != block_type)
2170                         continue;
2171                 if (!adev->ip_blocks[i].version->funcs->set_clockgating_state)
2172                         continue;
2173                 r = adev->ip_blocks[i].version->funcs->set_clockgating_state(
2174                         &adev->ip_blocks[i], state);
2175                 if (r)
2176                         DRM_ERROR("set_clockgating_state of IP block <%s> failed %d\n",
2177                                   adev->ip_blocks[i].version->funcs->name, r);
2178         }
2179         return r;
2180 }
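
/*
 * Typical usage (illustrative): gate clocks on every GFX IP instance.
 *
 *   amdgpu_device_ip_set_clockgating_state(adev, AMD_IP_BLOCK_TYPE_GFX,
 *                                          AMD_CG_STATE_GATE);
 */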
2181
2182 /**
2183  * amdgpu_device_ip_set_powergating_state - set the PG state
2184  *
2185  * @dev: amdgpu_device pointer
2186  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2187  * @state: powergating state (gate or ungate)
2188  *
2189  * Sets the requested powergating state for all instances of
2190  * the hardware IP specified.
2191  * Returns the error code from the last instance.
2192  */
2193 int amdgpu_device_ip_set_powergating_state(void *dev,
2194                                            enum amd_ip_block_type block_type,
2195                                            enum amd_powergating_state state)
2196 {
2197         struct amdgpu_device *adev = dev;
2198         int i, r = 0;
2199
2200         for (i = 0; i < adev->num_ip_blocks; i++) {
2201                 if (!adev->ip_blocks[i].status.valid)
2202                         continue;
2203                 if (adev->ip_blocks[i].version->type != block_type)
2204                         continue;
2205                 if (!adev->ip_blocks[i].version->funcs->set_powergating_state)
2206                         continue;
2207                 r = adev->ip_blocks[i].version->funcs->set_powergating_state(
2208                         &adev->ip_blocks[i], state);
2209                 if (r)
2210                         DRM_ERROR("set_powergating_state of IP block <%s> failed %d\n",
2211                                   adev->ip_blocks[i].version->funcs->name, r);
2212         }
2213         return r;
2214 }
2215
2216 /**
2217  * amdgpu_device_ip_get_clockgating_state - get the CG state
2218  *
2219  * @adev: amdgpu_device pointer
2220  * @flags: clockgating feature flags
2221  *
2222  * Walks the list of IPs on the device and updates the clockgating
2223  * flags for each IP.
2224  * Updates @flags with the feature flags for each hardware IP where
2225  * clockgating is enabled.
2226  */
2227 void amdgpu_device_ip_get_clockgating_state(struct amdgpu_device *adev,
2228                                             u64 *flags)
2229 {
2230         int i;
2231
2232         for (i = 0; i < adev->num_ip_blocks; i++) {
2233                 if (!adev->ip_blocks[i].status.valid)
2234                         continue;
2235                 if (adev->ip_blocks[i].version->funcs->get_clockgating_state)
2236                         adev->ip_blocks[i].version->funcs->get_clockgating_state((void *)adev, flags);
2237         }
2238 }
2239
2240 /**
2241  * amdgpu_device_ip_wait_for_idle - wait for idle
2242  *
2243  * @adev: amdgpu_device pointer
2244  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2245  *
2246  * Waits for the requested hardware IP to be idle.
2247  * Returns 0 for success or a negative error code on failure.
2248  */
2249 int amdgpu_device_ip_wait_for_idle(struct amdgpu_device *adev,
2250                                    enum amd_ip_block_type block_type)
2251 {
2252         int i, r;
2253
2254         for (i = 0; i < adev->num_ip_blocks; i++) {
2255                 if (!adev->ip_blocks[i].status.valid)
2256                         continue;
2257                 if (adev->ip_blocks[i].version->type == block_type) {
2258                         if (adev->ip_blocks[i].version->funcs->wait_for_idle) {
2259                                 r = adev->ip_blocks[i].version->funcs->wait_for_idle(
2260                                                                 &adev->ip_blocks[i]);
2261                                 if (r)
2262                                         return r;
2263                         }
2264                         break;
2265                 }
2266         }
2267         return 0;
2268
2269 }
2270
2271 /**
2272  * amdgpu_device_ip_is_valid - is the hardware IP enabled
2273  *
2274  * @adev: amdgpu_device pointer
2275  * @block_type: Type of hardware IP (SMU, GFX, UVD, etc.)
2276  *
2277  * Check if the hardware IP is enabled or not.
2278  * Returns true if the IP is enabled, false if not.
2279  */
2280 bool amdgpu_device_ip_is_valid(struct amdgpu_device *adev,
2281                                enum amd_ip_block_type block_type)
2282 {
2283         int i;
2284
2285         for (i = 0; i < adev->num_ip_blocks; i++) {
2286                 if (adev->ip_blocks[i].version->type == block_type)
2287                         return adev->ip_blocks[i].status.valid;
2288         }
2289         return false;
2290
2291 }
2292
2293 /**
2294  * amdgpu_device_ip_get_ip_block - get a hw IP pointer
2295  *
2296  * @adev: amdgpu_device pointer
2297  * @type: Type of hardware IP (SMU, GFX, UVD, etc.)
2298  *
2299  * Returns a pointer to the hardware IP block structure
2300  * if it exists for the asic, otherwise NULL.
2301  */
2302 struct amdgpu_ip_block *
2303 amdgpu_device_ip_get_ip_block(struct amdgpu_device *adev,
2304                               enum amd_ip_block_type type)
2305 {
2306         int i;
2307
2308         for (i = 0; i < adev->num_ip_blocks; i++)
2309                 if (adev->ip_blocks[i].version->type == type)
2310                         return &adev->ip_blocks[i];
2311
2312         return NULL;
2313 }
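
/*
 * Illustrative lookup: check whether this ASIC exposes a VCN block before
 * touching VCN state.
 *
 *   struct amdgpu_ip_block *vcn =
 *           amdgpu_device_ip_get_ip_block(adev, AMD_IP_BLOCK_TYPE_VCN);
 *
 *   if (vcn && vcn->status.valid)
 *           ...
 */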
2314
2315 /**
2316  * amdgpu_device_ip_block_version_cmp
2317  *
2318  * @adev: amdgpu_device pointer
2319  * @type: enum amd_ip_block_type
2320  * @major: major version
2321  * @minor: minor version
2322  *
2323  * Returns 0 if the IP block's version is equal to or greater than the
2324  * given version, or 1 if it is smaller or the ip_block doesn't exist.
2325  */
2326 int amdgpu_device_ip_block_version_cmp(struct amdgpu_device *adev,
2327                                        enum amd_ip_block_type type,
2328                                        u32 major, u32 minor)
2329 {
2330         struct amdgpu_ip_block *ip_block = amdgpu_device_ip_get_ip_block(adev, type);
2331
2332         if (ip_block && ((ip_block->version->major > major) ||
2333                         ((ip_block->version->major == major) &&
2334                         (ip_block->version->minor >= minor))))
2335                 return 0;
2336
2337         return 1;
2338 }
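
/*
 * Illustrative check (note the inverted return convention):
 *
 *   if (amdgpu_device_ip_block_version_cmp(adev, AMD_IP_BLOCK_TYPE_SMC,
 *                                          7, 0) == 0)
 *           ...  // SMC IP is v7.0 or newer
 */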
2339
2340 /**
2341  * amdgpu_device_ip_block_add
2342  *
2343  * @adev: amdgpu_device pointer
2344  * @ip_block_version: pointer to the IP to add
2345  *
2346  * Adds the IP block driver information to the collection of IPs
2347  * on the asic.
2348  */
2349 int amdgpu_device_ip_block_add(struct amdgpu_device *adev,
2350                                const struct amdgpu_ip_block_version *ip_block_version)
2351 {
2352         if (!ip_block_version)
2353                 return -EINVAL;
2354
2355         switch (ip_block_version->type) {
2356         case AMD_IP_BLOCK_TYPE_VCN:
2357                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_VCN_MASK)
2358                         return 0;
2359                 break;
2360         case AMD_IP_BLOCK_TYPE_JPEG:
2361                 if (adev->harvest_ip_mask & AMD_HARVEST_IP_JPEG_MASK)
2362                         return 0;
2363                 break;
2364         default:
2365                 break;
2366         }
2367
2368         DRM_INFO("add ip block number %d <%s>\n", adev->num_ip_blocks,
2369                   ip_block_version->funcs->name);
2370
2371         adev->ip_blocks[adev->num_ip_blocks].adev = adev;
2372
2373         adev->ip_blocks[adev->num_ip_blocks++].version = ip_block_version;
2374
2375         return 0;
2376 }
2377
2378 /**
2379  * amdgpu_device_enable_virtual_display - enable virtual display feature
2380  *
2381  * @adev: amdgpu_device pointer
2382  *
2383  * Enables the virtual display feature if the user has enabled it via
2384  * the module parameter virtual_display.  This feature provides virtual
2385  * display hardware on headless boards or in virtualized environments.
2386  * This function parses and validates the configuration string specified by
2387  * the user and configures the virtual display configuration (number of
2388  * virtual connectors, crtcs, etc.) specified.
2389  */
2390 static void amdgpu_device_enable_virtual_display(struct amdgpu_device *adev)
2391 {
2392         adev->enable_virtual_display = false;
2393
2394         if (amdgpu_virtual_display) {
2395                 const char *pci_address_name = pci_name(adev->pdev);
2396                 char *pciaddstr, *pciaddstr_tmp, *pciaddname_tmp, *pciaddname;
2397
2398                 pciaddstr = kstrdup(amdgpu_virtual_display, GFP_KERNEL);
2399                 pciaddstr_tmp = pciaddstr;
2400                 while ((pciaddname_tmp = strsep(&pciaddstr_tmp, ";"))) {
2401                         pciaddname = strsep(&pciaddname_tmp, ",");
2402                         if (!strcmp("all", pciaddname)
2403                             || !strcmp(pci_address_name, pciaddname)) {
2404                                 long num_crtc;
2405                                 int res = -1;
2406
2407                                 adev->enable_virtual_display = true;
2408
2409                                 if (pciaddname_tmp)
2410                                         res = kstrtol(pciaddname_tmp, 10,
2411                                                       &num_crtc);
2412
2413                                 if (!res) {
2414                                         if (num_crtc < 1)
2415                                                 num_crtc = 1;
2416                                         if (num_crtc > 6)
2417                                                 num_crtc = 6;
2418                                         adev->mode_info.num_crtc = num_crtc;
2419                                 } else {
2420                                         adev->mode_info.num_crtc = 1;
2421                                 }
2422                                 break;
2423                         }
2424                 }
2425
2426                 DRM_INFO("virtual display string:%s, %s:virtual_display:%d, num_crtc:%d\n",
2427                          amdgpu_virtual_display, pci_address_name,
2428                          adev->enable_virtual_display, adev->mode_info.num_crtc);
2429
2430                 kfree(pciaddstr);
2431         }
2432 }
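
/*
 * Example parameter strings (informational; the PCI addresses are
 * placeholders):
 *
 *   amdgpu.virtual_display=0000:02:00.0,2   // 2 virtual crtcs on that device
 *   amdgpu.virtual_display=all,1            // every amdgpu device, 1 crtc
 *
 * Entries are ';'-separated per device, each with an optional ','-separated
 * crtc count that is clamped to 1..6 by the code above.
 */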
2433
2434 void amdgpu_device_set_sriov_virtual_display(struct amdgpu_device *adev)
2435 {
2436         if (amdgpu_sriov_vf(adev) && !adev->enable_virtual_display) {
2437                 adev->mode_info.num_crtc = 1;
2438                 adev->enable_virtual_display = true;
2439                 DRM_INFO("virtual_display:%d, num_crtc:%d\n",
2440                          adev->enable_virtual_display, adev->mode_info.num_crtc);
2441         }
2442 }
2443
2444 /**
2445  * amdgpu_device_parse_gpu_info_fw - parse gpu info firmware
2446  *
2447  * @adev: amdgpu_device pointer
2448  *
2449  * Parses the asic configuration parameters specified in the gpu info
2450  * firmware and makes them available to the driver for use in configuring
2451  * the asic.
2452  * Returns 0 on success, -EINVAL on failure.
2453  */
2454 static int amdgpu_device_parse_gpu_info_fw(struct amdgpu_device *adev)
2455 {
2456         const char *chip_name;
2457         int err;
2458         const struct gpu_info_firmware_header_v1_0 *hdr;
2459
2460         adev->firmware.gpu_info_fw = NULL;
2461
2462         if (adev->mman.discovery_bin)
2463                 return 0;
2464
2465         switch (adev->asic_type) {
2466         default:
2467                 return 0;
2468         case CHIP_VEGA10:
2469                 chip_name = "vega10";
2470                 break;
2471         case CHIP_VEGA12:
2472                 chip_name = "vega12";
2473                 break;
2474         case CHIP_RAVEN:
2475                 if (adev->apu_flags & AMD_APU_IS_RAVEN2)
2476                         chip_name = "raven2";
2477                 else if (adev->apu_flags & AMD_APU_IS_PICASSO)
2478                         chip_name = "picasso";
2479                 else
2480                         chip_name = "raven";
2481                 break;
2482         case CHIP_ARCTURUS:
2483                 chip_name = "arcturus";
2484                 break;
2485         case CHIP_NAVI12:
2486                 chip_name = "navi12";
2487                 break;
2488         }
2489
2490         err = amdgpu_ucode_request(adev, &adev->firmware.gpu_info_fw,
2491                                    AMDGPU_UCODE_OPTIONAL,
2492                                    "amdgpu/%s_gpu_info.bin", chip_name);
2493         if (err) {
2494                 dev_err(adev->dev,
2495                         "Failed to get gpu_info firmware \"%s_gpu_info.bin\"\n",
2496                         chip_name);
2497                 goto out;
2498         }
2499
2500         hdr = (const struct gpu_info_firmware_header_v1_0 *)adev->firmware.gpu_info_fw->data;
2501         amdgpu_ucode_print_gpu_info_hdr(&hdr->header);
2502
2503         switch (hdr->version_major) {
2504         case 1:
2505         {
2506                 const struct gpu_info_firmware_v1_0 *gpu_info_fw =
2507                         (const struct gpu_info_firmware_v1_0 *)(adev->firmware.gpu_info_fw->data +
2508                                                                 le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2509
2510                 /*
2511                  * Should be dropped when DAL no longer needs it.
2512                  */
2513                 if (adev->asic_type == CHIP_NAVI12)
2514                         goto parse_soc_bounding_box;
2515
2516                 adev->gfx.config.max_shader_engines = le32_to_cpu(gpu_info_fw->gc_num_se);
2517                 adev->gfx.config.max_cu_per_sh = le32_to_cpu(gpu_info_fw->gc_num_cu_per_sh);
2518                 adev->gfx.config.max_sh_per_se = le32_to_cpu(gpu_info_fw->gc_num_sh_per_se);
2519                 adev->gfx.config.max_backends_per_se = le32_to_cpu(gpu_info_fw->gc_num_rb_per_se);
2520                 adev->gfx.config.max_texture_channel_caches =
2521                         le32_to_cpu(gpu_info_fw->gc_num_tccs);
2522                 adev->gfx.config.max_gprs = le32_to_cpu(gpu_info_fw->gc_num_gprs);
2523                 adev->gfx.config.max_gs_threads = le32_to_cpu(gpu_info_fw->gc_num_max_gs_thds);
2524                 adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gpu_info_fw->gc_gs_table_depth);
2525                 adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gpu_info_fw->gc_gsprim_buff_depth);
2526                 adev->gfx.config.double_offchip_lds_buf =
2527                         le32_to_cpu(gpu_info_fw->gc_double_offchip_lds_buffer);
2528                 adev->gfx.cu_info.wave_front_size = le32_to_cpu(gpu_info_fw->gc_wave_size);
2529                 adev->gfx.cu_info.max_waves_per_simd =
2530                         le32_to_cpu(gpu_info_fw->gc_max_waves_per_simd);
2531                 adev->gfx.cu_info.max_scratch_slots_per_cu =
2532                         le32_to_cpu(gpu_info_fw->gc_max_scratch_slots_per_cu);
2533                 adev->gfx.cu_info.lds_size = le32_to_cpu(gpu_info_fw->gc_lds_size);
2534                 if (hdr->version_minor >= 1) {
2535                         const struct gpu_info_firmware_v1_1 *gpu_info_fw =
2536                                 (const struct gpu_info_firmware_v1_1 *)(adev->firmware.gpu_info_fw->data +
2537                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2538                         adev->gfx.config.num_sc_per_sh =
2539                                 le32_to_cpu(gpu_info_fw->num_sc_per_sh);
2540                         adev->gfx.config.num_packer_per_sc =
2541                                 le32_to_cpu(gpu_info_fw->num_packer_per_sc);
2542                 }
2543
2544 parse_soc_bounding_box:
2545                 /*
2546                  * soc bounding box info is not integrated in the discovery table,
2547                  * so we always need to parse it from the gpu info firmware.
2548                  */
2549                 if (hdr->version_minor == 2) {
2550                         const struct gpu_info_firmware_v1_2 *gpu_info_fw =
2551                                 (const struct gpu_info_firmware_v1_2 *)(adev->firmware.gpu_info_fw->data +
2552                                                                         le32_to_cpu(hdr->header.ucode_array_offset_bytes));
2553                         adev->dm.soc_bounding_box = &gpu_info_fw->soc_bounding_box;
2554                 }
2555                 break;
2556         }
2557         default:
2558                 dev_err(adev->dev,
2559                         "Unsupported gpu_info table %d\n", hdr->header.ucode_version);
2560                 err = -EINVAL;
2561                 goto out;
2562         }
2563 out:
2564         return err;
2565 }
2566
2567 /**
2568  * amdgpu_device_ip_early_init - run early init for hardware IPs
2569  *
2570  * @adev: amdgpu_device pointer
2571  *
2572  * Early initialization pass for hardware IPs.  The hardware IPs that make
2573  * up each asic are discovered and each IP's early_init callback is run.  This
2574  * is the first stage in initializing the asic.
2575  * Returns 0 on success, negative error code on failure.
2576  */
2577 static int amdgpu_device_ip_early_init(struct amdgpu_device *adev)
2578 {
2579         struct amdgpu_ip_block *ip_block;
2580         struct pci_dev *parent;
2581         int i, r;
2582         bool total;
2583
2584         amdgpu_device_enable_virtual_display(adev);
2585
2586         if (amdgpu_sriov_vf(adev)) {
2587                 r = amdgpu_virt_request_full_gpu(adev, true);
2588                 if (r)
2589                         return r;
2590         }
2591
2592         switch (adev->asic_type) {
2593 #ifdef CONFIG_DRM_AMDGPU_SI
2594         case CHIP_VERDE:
2595         case CHIP_TAHITI:
2596         case CHIP_PITCAIRN:
2597         case CHIP_OLAND:
2598         case CHIP_HAINAN:
2599                 adev->family = AMDGPU_FAMILY_SI;
2600                 r = si_set_ip_blocks(adev);
2601                 if (r)
2602                         return r;
2603                 break;
2604 #endif
2605 #ifdef CONFIG_DRM_AMDGPU_CIK
2606         case CHIP_BONAIRE:
2607         case CHIP_HAWAII:
2608         case CHIP_KAVERI:
2609         case CHIP_KABINI:
2610         case CHIP_MULLINS:
2611                 if (adev->flags & AMD_IS_APU)
2612                         adev->family = AMDGPU_FAMILY_KV;
2613                 else
2614                         adev->family = AMDGPU_FAMILY_CI;
2615
2616                 r = cik_set_ip_blocks(adev);
2617                 if (r)
2618                         return r;
2619                 break;
2620 #endif
2621         case CHIP_TOPAZ:
2622         case CHIP_TONGA:
2623         case CHIP_FIJI:
2624         case CHIP_POLARIS10:
2625         case CHIP_POLARIS11:
2626         case CHIP_POLARIS12:
2627         case CHIP_VEGAM:
2628         case CHIP_CARRIZO:
2629         case CHIP_STONEY:
2630                 if (adev->flags & AMD_IS_APU)
2631                         adev->family = AMDGPU_FAMILY_CZ;
2632                 else
2633                         adev->family = AMDGPU_FAMILY_VI;
2634
2635                 r = vi_set_ip_blocks(adev);
2636                 if (r)
2637                         return r;
2638                 break;
2639         default:
2640                 r = amdgpu_discovery_set_ip_blocks(adev);
2641                 if (r)
2642                         return r;
2643                 break;
2644         }
2645
2646         if (amdgpu_has_atpx() &&
2647             (amdgpu_is_atpx_hybrid() ||
2648              amdgpu_has_atpx_dgpu_power_cntl()) &&
2649             ((adev->flags & AMD_IS_APU) == 0) &&
2650             !dev_is_removable(&adev->pdev->dev))
2651                 adev->flags |= AMD_IS_PX;
2652
2653         if (!(adev->flags & AMD_IS_APU)) {
2654                 parent = pcie_find_root_port(adev->pdev);
2655                 adev->has_pr3 = parent ? pci_pr3_present(parent) : false;
2656         }
2657
2658
2659         adev->pm.pp_feature = amdgpu_pp_feature_mask;
2660         if (amdgpu_sriov_vf(adev) || sched_policy == KFD_SCHED_POLICY_NO_HWS)
2661                 adev->pm.pp_feature &= ~PP_GFXOFF_MASK;
2662         if (amdgpu_sriov_vf(adev) && adev->asic_type == CHIP_SIENNA_CICHLID)
2663                 adev->pm.pp_feature &= ~PP_OVERDRIVE_MASK;
2664         if (!amdgpu_device_pcie_dynamic_switching_supported(adev))
2665                 adev->pm.pp_feature &= ~PP_PCIE_DPM_MASK;
2666
2667         total = true;
2668         for (i = 0; i < adev->num_ip_blocks; i++) {
2669                 ip_block = &adev->ip_blocks[i];
2670
2671                 if ((amdgpu_ip_block_mask & (1 << i)) == 0) {
2672                         DRM_WARN("disabled ip block: %d <%s>\n",
2673                                   i, adev->ip_blocks[i].version->funcs->name);
2674                         adev->ip_blocks[i].status.valid = false;
2675                 } else if (ip_block->version->funcs->early_init) {
2676                         r = ip_block->version->funcs->early_init(ip_block);
2677                         if (r == -ENOENT) {
2678                                 adev->ip_blocks[i].status.valid = false;
2679                         } else if (r) {
2680                                 DRM_ERROR("early_init of IP block <%s> failed %d\n",
2681                                           adev->ip_blocks[i].version->funcs->name, r);
2682                                 total = false;
2683                         } else {
2684                                 adev->ip_blocks[i].status.valid = true;
2685                         }
2686                 } else {
2687                         adev->ip_blocks[i].status.valid = true;
2688                 }
2689                 /* get the vbios after the asic_funcs are set up */
2690                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2691                         r = amdgpu_device_parse_gpu_info_fw(adev);
2692                         if (r)
2693                                 return r;
2694
2695                         /* Read BIOS */
2696                         if (amdgpu_device_read_bios(adev)) {
2697                                 if (!amdgpu_get_bios(adev))
2698                                         return -EINVAL;
2699
2700                                 r = amdgpu_atombios_init(adev);
2701                                 if (r) {
2702                                         dev_err(adev->dev, "amdgpu_atombios_init failed\n");
2703                                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_INIT_FAIL, 0, 0);
2704                                         return r;
2705                                 }
2706                         }
2707
2708                         /* get pf2vf msg info at its earliest time */
2709                         if (amdgpu_sriov_vf(adev))
2710                                 amdgpu_virt_init_data_exchange(adev);
2711
2712                 }
2713         }
2714         if (!total)
2715                 return -ENODEV;
2716
2717         ip_block = amdgpu_device_ip_get_ip_block(adev, AMD_IP_BLOCK_TYPE_GFX);
2718         if (ip_block && ip_block->status.valid)
2719                 amdgpu_amdkfd_device_probe(adev);
2720
2721         adev->cg_flags &= amdgpu_cg_mask;
2722         adev->pg_flags &= amdgpu_pg_mask;
2723
2724         return 0;
2725 }
2726
2727 static int amdgpu_device_ip_hw_init_phase1(struct amdgpu_device *adev)
2728 {
2729         int i, r;
2730
2731         for (i = 0; i < adev->num_ip_blocks; i++) {
2732                 if (!adev->ip_blocks[i].status.sw)
2733                         continue;
2734                 if (adev->ip_blocks[i].status.hw)
2735                         continue;
2736                 if (!amdgpu_ip_member_of_hwini(
2737                             adev, adev->ip_blocks[i].version->type))
2738                         continue;
2739                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
2740                     (amdgpu_sriov_vf(adev) && (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)) ||
2741                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH) {
2742                         r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2743                         if (r) {
2744                                 DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2745                                           adev->ip_blocks[i].version->funcs->name, r);
2746                                 return r;
2747                         }
2748                         adev->ip_blocks[i].status.hw = true;
2749                 }
2750         }
2751
2752         return 0;
2753 }
2754
2755 static int amdgpu_device_ip_hw_init_phase2(struct amdgpu_device *adev)
2756 {
2757         int i, r;
2758
2759         for (i = 0; i < adev->num_ip_blocks; i++) {
2760                 if (!adev->ip_blocks[i].status.sw)
2761                         continue;
2762                 if (adev->ip_blocks[i].status.hw)
2763                         continue;
2764                 if (!amdgpu_ip_member_of_hwini(
2765                             adev, adev->ip_blocks[i].version->type))
2766                         continue;
2767                 r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2768                 if (r) {
2769                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2770                                   adev->ip_blocks[i].version->funcs->name, r);
2771                         return r;
2772                 }
2773                 adev->ip_blocks[i].status.hw = true;
2774         }
2775
2776         return 0;
2777 }
2778
2779 static int amdgpu_device_fw_loading(struct amdgpu_device *adev)
2780 {
2781         int r = 0;
2782         int i;
2783         uint32_t smu_version;
2784
2785         if (adev->asic_type >= CHIP_VEGA10) {
2786                 for (i = 0; i < adev->num_ip_blocks; i++) {
2787                         if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_PSP)
2788                                 continue;
2789
2790                         if (!amdgpu_ip_member_of_hwini(adev,
2791                                                        AMD_IP_BLOCK_TYPE_PSP))
2792                                 break;
2793
2794                         if (!adev->ip_blocks[i].status.sw)
2795                                 continue;
2796
2797                         /* no need to do the fw loading again if already done */
2798                         if (adev->ip_blocks[i].status.hw == true)
2799                                 break;
2800
2801                         if (amdgpu_in_reset(adev) || adev->in_suspend) {
2802                                 r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
2803                                 if (r)
2804                                         return r;
2805                         } else {
2806                                 r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2807                                 if (r) {
2808                                         DRM_ERROR("hw_init of IP block <%s> failed %d\n",
2809                                                           adev->ip_blocks[i].version->funcs->name, r);
2810                                         return r;
2811                                 }
2812                                 adev->ip_blocks[i].status.hw = true;
2813                         }
2814                         break;
2815                 }
2816         }
2817
2818         if (!amdgpu_sriov_vf(adev) || adev->asic_type == CHIP_TONGA)
2819                 r = amdgpu_pm_load_smu_firmware(adev, &smu_version);
2820
2821         return r;
2822 }
2823
2824 static int amdgpu_device_init_schedulers(struct amdgpu_device *adev)
2825 {
2826         long timeout;
2827         int r, i;
2828
2829         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
2830                 struct amdgpu_ring *ring = adev->rings[i];
2831
2832                 /* No need to set up the GPU scheduler for rings that don't need it */
2833                 if (!ring || ring->no_scheduler)
2834                         continue;
2835
2836                 switch (ring->funcs->type) {
2837                 case AMDGPU_RING_TYPE_GFX:
2838                         timeout = adev->gfx_timeout;
2839                         break;
2840                 case AMDGPU_RING_TYPE_COMPUTE:
2841                         timeout = adev->compute_timeout;
2842                         break;
2843                 case AMDGPU_RING_TYPE_SDMA:
2844                         timeout = adev->sdma_timeout;
2845                         break;
2846                 default:
2847                         timeout = adev->video_timeout;
2848                         break;
2849                 }
2850
2851                 r = drm_sched_init(&ring->sched, &amdgpu_sched_ops, NULL,
2852                                    DRM_SCHED_PRIORITY_COUNT,
2853                                    ring->num_hw_submission, 0,
2854                                    timeout, adev->reset_domain->wq,
2855                                    ring->sched_score, ring->name,
2856                                    adev->dev);
2857                 if (r) {
2858                         DRM_ERROR("Failed to create scheduler on ring %s.\n",
2859                                   ring->name);
2860                         return r;
2861                 }
2862                 r = amdgpu_uvd_entity_init(adev, ring);
2863                 if (r) {
2864                         DRM_ERROR("Failed to create UVD scheduling entity on ring %s.\n",
2865                                   ring->name);
2866                         return r;
2867                 }
2868                 r = amdgpu_vce_entity_init(adev, ring);
2869                 if (r) {
2870                         DRM_ERROR("Failed to create VCE scheduling entity on ring %s.\n",
2871                                   ring->name);
2872                         return r;
2873                 }
2874         }
2875
2876         amdgpu_xcp_update_partition_sched_list(adev);
2877
2878         return 0;
2879 }
2880
2881
2882 /**
2883  * amdgpu_device_ip_init - run init for hardware IPs
2884  *
2885  * @adev: amdgpu_device pointer
2886  *
2887  * Main initialization pass for hardware IPs.  The list of all the hardware
2888  * IPs that make up the asic is walked and the sw_init and hw_init callbacks
2889  * are run.  sw_init initializes the software state associated with each IP
2890  * and hw_init initializes the hardware associated with each IP.
2891  * Returns 0 on success, negative error code on failure.
2892  */
2893 static int amdgpu_device_ip_init(struct amdgpu_device *adev)
2894 {
2895         bool init_badpage;
2896         int i, r;
2897
2898         r = amdgpu_ras_init(adev);
2899         if (r)
2900                 return r;
2901
2902         for (i = 0; i < adev->num_ip_blocks; i++) {
2903                 if (!adev->ip_blocks[i].status.valid)
2904                         continue;
2905                 if (adev->ip_blocks[i].version->funcs->sw_init) {
2906                         r = adev->ip_blocks[i].version->funcs->sw_init(&adev->ip_blocks[i]);
2907                         if (r) {
2908                                 DRM_ERROR("sw_init of IP block <%s> failed %d\n",
2909                                           adev->ip_blocks[i].version->funcs->name, r);
2910                                 goto init_failed;
2911                         }
2912                 }
2913                 adev->ip_blocks[i].status.sw = true;
2914
2915                 if (!amdgpu_ip_member_of_hwini(
2916                             adev, adev->ip_blocks[i].version->type))
2917                         continue;
2918
2919                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON) {
2920                         /* need to do common hw init early so everything is set up for gmc */
2921                         r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2922                         if (r) {
2923                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2924                                 goto init_failed;
2925                         }
2926                         adev->ip_blocks[i].status.hw = true;
2927                 } else if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
2928                         /* need to do gmc hw init early so we can allocate gpu mem */
2929                         /* Try to reserve bad pages early */
2930                         if (amdgpu_sriov_vf(adev))
2931                                 amdgpu_virt_exchange_data(adev);
2932
2933                         r = amdgpu_device_mem_scratch_init(adev);
2934                         if (r) {
2935                                 DRM_ERROR("amdgpu_mem_scratch_init failed %d\n", r);
2936                                 goto init_failed;
2937                         }
2938                         r = adev->ip_blocks[i].version->funcs->hw_init(&adev->ip_blocks[i]);
2939                         if (r) {
2940                                 DRM_ERROR("hw_init %d failed %d\n", i, r);
2941                                 goto init_failed;
2942                         }
2943                         r = amdgpu_device_wb_init(adev);
2944                         if (r) {
2945                                 DRM_ERROR("amdgpu_device_wb_init failed %d\n", r);
2946                                 goto init_failed;
2947                         }
2948                         adev->ip_blocks[i].status.hw = true;
2949
2950                         /* right after GMC hw init, we create CSA */
2951                         if (adev->gfx.mcbp) {
2952                                 r = amdgpu_allocate_static_csa(adev, &adev->virt.csa_obj,
2953                                                                AMDGPU_GEM_DOMAIN_VRAM |
2954                                                                AMDGPU_GEM_DOMAIN_GTT,
2955                                                                AMDGPU_CSA_SIZE);
2956                                 if (r) {
2957                                         DRM_ERROR("allocate CSA failed %d\n", r);
2958                                         goto init_failed;
2959                                 }
2960                         }
2961
2962                         r = amdgpu_seq64_init(adev);
2963                         if (r) {
2964                                 DRM_ERROR("allocate seq64 failed %d\n", r);
2965                                 goto init_failed;
2966                         }
2967                 }
2968         }
2969
2970         if (amdgpu_sriov_vf(adev))
2971                 amdgpu_virt_init_data_exchange(adev);
2972
2973         r = amdgpu_ib_pool_init(adev);
2974         if (r) {
2975                 dev_err(adev->dev, "IB initialization failed (%d).\n", r);
2976                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_IB_INIT_FAIL, 0, r);
2977                 goto init_failed;
2978         }
2979
2980         r = amdgpu_ucode_create_bo(adev); /* create ucode BO when sw_init completes */
2981         if (r)
2982                 goto init_failed;
2983
2984         r = amdgpu_device_ip_hw_init_phase1(adev);
2985         if (r)
2986                 goto init_failed;
2987
2988         r = amdgpu_device_fw_loading(adev);
2989         if (r)
2990                 goto init_failed;
2991
2992         r = amdgpu_device_ip_hw_init_phase2(adev);
2993         if (r)
2994                 goto init_failed;
2995
2996         /*
2997          * Retired pages are loaded from eeprom and reserved here. This
2998          * should be called after amdgpu_device_ip_hw_init_phase2, since
2999          * for some ASICs the RAS EEPROM code relies on the SMU being fully
3000          * functional for I2C communication, which is only true at this point.
3001          *
3002          * amdgpu_ras_recovery_init may fail, but the upper layers only care
3003          * about failures caused by a bad gpu, and stop the amdgpu init
3004          * process accordingly. For other failures, it still releases all
3005          * the resources and prints an error message, rather than returning
3006          * a negative value to the upper level.
3007          *
3008          * Note: theoretically, this should be called before all vram
3009          * allocations to protect retired pages from being abused.
3010          */
3011         init_badpage = (adev->init_lvl->level != AMDGPU_INIT_LEVEL_MINIMAL_XGMI);
3012         r = amdgpu_ras_recovery_init(adev, init_badpage);
3013         if (r)
3014                 goto init_failed;
3015
3016         /*
3017          * In the XGMI case, grab an extra reference to the reset domain for this device.
3018          */
3019         if (adev->gmc.xgmi.num_physical_nodes > 1) {
3020                 if (amdgpu_xgmi_add_device(adev) == 0) {
3021                         if (!amdgpu_sriov_vf(adev)) {
3022                                 struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3023
3024                                 if (WARN_ON(!hive)) {
3025                                         r = -ENOENT;
3026                                         goto init_failed;
3027                                 }
3028
3029                                 if (!hive->reset_domain ||
3030                                     !amdgpu_reset_get_reset_domain(hive->reset_domain)) {
3031                                         r = -ENOENT;
3032                                         amdgpu_put_xgmi_hive(hive);
3033                                         goto init_failed;
3034                                 }
3035
3036                                 /* Drop the early temporary reset domain we created for the device */
3037                                 amdgpu_reset_put_reset_domain(adev->reset_domain);
3038                                 adev->reset_domain = hive->reset_domain;
3039                                 amdgpu_put_xgmi_hive(hive);
3040                         }
3041                 }
3042         }
3043
3044         r = amdgpu_device_init_schedulers(adev);
3045         if (r)
3046                 goto init_failed;
3047
3048         if (adev->mman.buffer_funcs_ring->sched.ready)
3049                 amdgpu_ttm_set_buffer_funcs_status(adev, true);
3050
3051         /* Don't init kfd if the whole hive needs to be reset during init */
3052         if (adev->init_lvl->level != AMDGPU_INIT_LEVEL_MINIMAL_XGMI) {
3053                 kgd2kfd_init_zone_device(adev);
3054                 amdgpu_amdkfd_device_init(adev);
3055         }
3056
3057         amdgpu_fru_get_product_info(adev);
3058
3059 init_failed:
3060
3061         return r;
3062 }
3063
3064 /**
3065  * amdgpu_device_fill_reset_magic - writes reset magic to gart pointer
3066  *
3067  * @adev: amdgpu_device pointer
3068  *
3069  * Writes a reset magic value to the gart pointer in VRAM.  The driver calls
3070  * this function before a GPU reset.  If the value is retained after a
3071  * GPU reset, VRAM has not been lost. Some GPU resets may destroy VRAM contents.
3072  */
3073 static void amdgpu_device_fill_reset_magic(struct amdgpu_device *adev)
3074 {
3075         memcpy(adev->reset_magic, adev->gart.ptr, AMDGPU_RESET_MAGIC_NUM);
3076 }
3077
3078 /**
3079  * amdgpu_device_check_vram_lost - check if vram is valid
3080  *
3081  * @adev: amdgpu_device pointer
3082  *
3083  * Checks the reset magic value written to the gart pointer in VRAM.
3084  * The driver calls this after a GPU reset to see if the contents of
3085  * VRAM have been lost or not.
3086  * Returns true if vram is lost, false if not.
3087  */
3088 static bool amdgpu_device_check_vram_lost(struct amdgpu_device *adev)
3089 {
3090         if (memcmp(adev->gart.ptr, adev->reset_magic,
3091                         AMDGPU_RESET_MAGIC_NUM))
3092                 return true;
3093
3094         if (!amdgpu_in_reset(adev))
3095                 return false;
3096
3097         /*
3098          * For all ASICs with baco/mode1 reset, the VRAM is
3099          * always assumed to be lost.
3100          */
3101         switch (amdgpu_asic_reset_method(adev)) {
3102         case AMD_RESET_METHOD_BACO:
3103         case AMD_RESET_METHOD_MODE1:
3104                 return true;
3105         default:
3106                 return false;
3107         }
3108 }
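
/*
 * Illustrative sketch (not driver code): the reset-magic scheme above is
 * "write a known pattern, compare it later".  A stand-alone model over a
 * simulated VRAM buffer (sizes and names here are made up):
 */
#if 0
#include <stdbool.h>
#include <stdio.h>
#include <string.h>

#define RESET_MAGIC_NUM 64

static unsigned char vram[1024];          /* simulated VRAM */
static unsigned char reset_magic[RESET_MAGIC_NUM];

/* Before reset: stash the first bytes of VRAM, like
 * amdgpu_device_fill_reset_magic(). */
static void fill_reset_magic(void)
{
	memcpy(reset_magic, vram, RESET_MAGIC_NUM);
}

/* After reset: if the stashed bytes no longer match, VRAM was lost. */
static bool check_vram_lost(void)
{
	return memcmp(vram, reset_magic, RESET_MAGIC_NUM) != 0;
}

int main(void)
{
	memset(vram, 0xA5, sizeof(vram));
	fill_reset_magic();
	memset(vram, 0, sizeof(vram));   /* simulate a reset clearing VRAM */
	printf("vram lost: %d\n", check_vram_lost());
	return 0;
}
#endif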
3109
3110 /**
3111  * amdgpu_device_set_cg_state - set clockgating for amdgpu device
3112  *
3113  * @adev: amdgpu_device pointer
3114  * @state: clockgating state (gate or ungate)
3115  *
3116  * The list of all the hardware IPs that make up the asic is walked and the
3117  * set_clockgating_state callbacks are run.
3118  * On the late init pass, this enables clockgating for the hardware IPs;
3119  * on the fini or suspend pass, it disables clockgating.
3120  * Returns 0 on success, negative error code on failure.
3121  */
3122
3123 int amdgpu_device_set_cg_state(struct amdgpu_device *adev,
3124                                enum amd_clockgating_state state)
3125 {
3126         int i, j, r;
3127
3128         if (amdgpu_emu_mode == 1)
3129                 return 0;
3130
3131         for (j = 0; j < adev->num_ip_blocks; j++) {
3132                 i = state == AMD_CG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
3133                 if (!adev->ip_blocks[i].status.late_initialized)
3134                         continue;
3135                 /* skip CG for GFX, SDMA on S0ix */
3136                 if (adev->in_s0ix &&
3137                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3138                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SDMA))
3139                         continue;
3140                 /* skip CG for UVD/VCE/VCN/JPEG, they are handled specially */
3141                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
3142                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
3143                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
3144                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
3145                     adev->ip_blocks[i].version->funcs->set_clockgating_state) {
3146                         /* enable clockgating to save power */
3147                         r = adev->ip_blocks[i].version->funcs->set_clockgating_state(&adev->ip_blocks[i],
3148                                                                                      state);
3149                         if (r) {
3150                                 DRM_ERROR("set_clockgating_state(gate) of IP block <%s> failed %d\n",
3151                                           adev->ip_blocks[i].version->funcs->name, r);
3152                                 return r;
3153                         }
3154                 }
3155         }
3156
3157         return 0;
3158 }
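
/*
 * Illustrative sketch (not driver code): the index expression above walks
 * the IP list forward when gating and backward when ungating, so clock
 * gating is undone in the reverse order it was applied.  Stand-alone:
 */
#if 0
#include <stdio.h>

int main(void)
{
	const char *blocks[] = { "common", "gmc", "gfx", "sdma" };
	const int n = sizeof(blocks) / sizeof(blocks[0]);
	int gate, i, j;

	for (gate = 1; gate >= 0; gate--) {
		printf("%s", gate ? "gate:  " : "ungate:");
		for (j = 0; j < n; j++) {
			i = gate ? j : n - j - 1; /* same trick as above */
			printf(" %s", blocks[i]);
		}
		printf("\n");
	}
	return 0;
}
#endif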
3159
3160 int amdgpu_device_set_pg_state(struct amdgpu_device *adev,
3161                                enum amd_powergating_state state)
3162 {
3163         int i, j, r;
3164
3165         if (amdgpu_emu_mode == 1)
3166                 return 0;
3167
3168         for (j = 0; j < adev->num_ip_blocks; j++) {
3169                 i = state == AMD_PG_STATE_GATE ? j : adev->num_ip_blocks - j - 1;
3170                 if (!adev->ip_blocks[i].status.late_initialized)
3171                         continue;
3172                 /* skip PG for GFX, SDMA on S0ix */
3173                 if (adev->in_s0ix &&
3174                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3175                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SDMA))
3176                         continue;
3177                 /* skip PG for UVD/VCE/VCN/JPEG, they are handled specially */
3178                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_UVD &&
3179                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCE &&
3180                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_VCN &&
3181                     adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_JPEG &&
3182                     adev->ip_blocks[i].version->funcs->set_powergating_state) {
3183                         /* enable powergating to save power */
3184                         r = adev->ip_blocks[i].version->funcs->set_powergating_state(&adev->ip_blocks[i],
3185                                                                                         state);
3186                         if (r) {
3187                                 DRM_ERROR("set_powergating_state(gate) of IP block <%s> failed %d\n",
3188                                           adev->ip_blocks[i].version->funcs->name, r);
3189                                 return r;
3190                         }
3191                 }
3192         }
3193         return 0;
3194 }
3195
3196 static int amdgpu_device_enable_mgpu_fan_boost(void)
3197 {
3198         struct amdgpu_gpu_instance *gpu_ins;
3199         struct amdgpu_device *adev;
3200         int i, ret = 0;
3201
3202         mutex_lock(&mgpu_info.mutex);
3203
3204         /*
3205          * MGPU fan boost feature should be enabled
3206          * only when there are two or more dGPUs in
3207          * the system
3208          */
3209         if (mgpu_info.num_dgpu < 2)
3210                 goto out;
3211
3212         for (i = 0; i < mgpu_info.num_dgpu; i++) {
3213                 gpu_ins = &(mgpu_info.gpu_ins[i]);
3214                 adev = gpu_ins->adev;
3215                 if (!(adev->flags & AMD_IS_APU) &&
3216                     !gpu_ins->mgpu_fan_enabled) {
3217                         ret = amdgpu_dpm_enable_mgpu_fan_boost(adev);
3218                         if (ret)
3219                                 break;
3220
3221                         gpu_ins->mgpu_fan_enabled = 1;
3222                 }
3223         }
3224
3225 out:
3226         mutex_unlock(&mgpu_info.mutex);
3227
3228         return ret;
3229 }
3230
3231 /**
3232  * amdgpu_device_ip_late_init - run late init for hardware IPs
3233  *
3234  * @adev: amdgpu_device pointer
3235  *
3236  * Late initialization pass for hardware IPs.  The list of all the hardware
3237  * IPs that make up the asic is walked and the late_init callbacks are run.
3238  * late_init covers any special initialization that an IP requires
3239  * after all of the IPs have been initialized, or anything that needs to happen
3240  * late in the init process.
3241  * Returns 0 on success, negative error code on failure.
3242  */
3243 static int amdgpu_device_ip_late_init(struct amdgpu_device *adev)
3244 {
3245         struct amdgpu_gpu_instance *gpu_instance;
3246         int i = 0, r;
3247
3248         for (i = 0; i < adev->num_ip_blocks; i++) {
3249                 if (!adev->ip_blocks[i].status.hw)
3250                         continue;
3251                 if (adev->ip_blocks[i].version->funcs->late_init) {
3252                         r = adev->ip_blocks[i].version->funcs->late_init(&adev->ip_blocks[i]);
3253                         if (r) {
3254                                 DRM_ERROR("late_init of IP block <%s> failed %d\n",
3255                                           adev->ip_blocks[i].version->funcs->name, r);
3256                                 return r;
3257                         }
3258                 }
3259                 adev->ip_blocks[i].status.late_initialized = true;
3260         }
3261
3262         r = amdgpu_ras_late_init(adev);
3263         if (r) {
3264                 DRM_ERROR("amdgpu_ras_late_init failed %d", r);
3265                 return r;
3266         }
3267
3268         if (!amdgpu_reset_in_recovery(adev))
3269                 amdgpu_ras_set_error_query_ready(adev, true);
3270
3271         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_GATE);
3272         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_GATE);
3273
3274         amdgpu_device_fill_reset_magic(adev);
3275
3276         r = amdgpu_device_enable_mgpu_fan_boost();
3277         if (r)
3278                 DRM_ERROR("enable mgpu fan boost failed (%d).\n", r);
3279
3280         /* For passthrough configuration on arcturus and aldebaran, enable special SBR handling */
3281         if (amdgpu_passthrough(adev) &&
3282             ((adev->asic_type == CHIP_ARCTURUS && adev->gmc.xgmi.num_physical_nodes > 1) ||
3283              adev->asic_type == CHIP_ALDEBARAN))
3284                 amdgpu_dpm_handle_passthrough_sbr(adev, true);
3285
3286         if (adev->gmc.xgmi.num_physical_nodes > 1) {
3287                 mutex_lock(&mgpu_info.mutex);
3288
3289                 /*
3290                  * Reset the device p-state to low, as it was booted with high.
3291                  *
3292                  * This should be performed only after all devices from the same
3293                  * hive have been initialized.
3294                  *
3295                  * However, the number of devices in the hive is not known in
3296                  * advance; it is counted one by one as the devices initialize.
3297                  *
3298                  * So, we wait until all XGMI interlinked devices have initialized.
3299                  * This may introduce some delay, as those devices may come from
3300                  * different hives. But that should be OK.
3301                  */
3302                 if (mgpu_info.num_dgpu == adev->gmc.xgmi.num_physical_nodes) {
3303                         for (i = 0; i < mgpu_info.num_gpu; i++) {
3304                                 gpu_instance = &(mgpu_info.gpu_ins[i]);
3305                                 if (gpu_instance->adev->flags & AMD_IS_APU)
3306                                         continue;
3307
3308                                 r = amdgpu_xgmi_set_pstate(gpu_instance->adev,
3309                                                 AMDGPU_XGMI_PSTATE_MIN);
3310                                 if (r) {
3311                                         DRM_ERROR("pstate setting failed (%d).\n", r);
3312                                         break;
3313                                 }
3314                         }
3315                 }
3316
3317                 mutex_unlock(&mgpu_info.mutex);
3318         }
3319
3320         return 0;
3321 }
3322
3323 static void amdgpu_ip_block_hw_fini(struct amdgpu_ip_block *ip_block)
3324 {
3325         int r;
3326
3327         if (!ip_block->version->funcs->hw_fini) {
3328                 DRM_ERROR("hw_fini of IP block <%s> not defined\n",
3329                           ip_block->version->funcs->name);
3330         } else {
3331                 r = ip_block->version->funcs->hw_fini(ip_block);
3332                 /* XXX handle errors */
3333                 if (r) {
3334                         DRM_DEBUG("hw_fini of IP block <%s> failed %d\n",
3335                                   ip_block->version->funcs->name, r);
3336                 }
3337         }
3338
3339         ip_block->status.hw = false;
3340 }
3341
3342 /**
3343  * amdgpu_device_smu_fini_early - smu hw_fini wrapper
3344  *
3345  * @adev: amdgpu_device pointer
3346  *
3347  * For ASICs that need to disable the SMC first.
3348  */
3349 static void amdgpu_device_smu_fini_early(struct amdgpu_device *adev)
3350 {
3351         int i;
3352
3353         if (amdgpu_ip_version(adev, GC_HWIP, 0) > IP_VERSION(9, 0, 0))
3354                 return;
3355
3356         for (i = 0; i < adev->num_ip_blocks; i++) {
3357                 if (!adev->ip_blocks[i].status.hw)
3358                         continue;
3359                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3360                         amdgpu_ip_block_hw_fini(&adev->ip_blocks[i]);
3361                         break;
3362                 }
3363         }
3364 }
3365
3366 static int amdgpu_device_ip_fini_early(struct amdgpu_device *adev)
3367 {
3368         int i, r;
3369
3370         for (i = 0; i < adev->num_ip_blocks; i++) {
3371                 if (!adev->ip_blocks[i].version->funcs->early_fini)
3372                         continue;
3373
3374                 r = adev->ip_blocks[i].version->funcs->early_fini(&adev->ip_blocks[i]);
3375                 if (r) {
3376                         DRM_DEBUG("early_fini of IP block <%s> failed %d\n",
3377                                   adev->ip_blocks[i].version->funcs->name, r);
3378                 }
3379         }
3380
3381         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
3382         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
3383
3384         amdgpu_amdkfd_suspend(adev, false);
3385
3386         /* Workaround for ASICs that need to disable the SMC first */
3387         amdgpu_device_smu_fini_early(adev);
3388
3389         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3390                 if (!adev->ip_blocks[i].status.hw)
3391                         continue;
3392
3393                 amdgpu_ip_block_hw_fini(&adev->ip_blocks[i]);
3394         }
3395
3396         if (amdgpu_sriov_vf(adev)) {
3397                 if (amdgpu_virt_release_full_gpu(adev, false))
3398                         DRM_ERROR("failed to release exclusive mode on fini\n");
3399         }
3400
3401         return 0;
3402 }
3403
3404 /**
3405  * amdgpu_device_ip_fini - run fini for hardware IPs
3406  *
3407  * @adev: amdgpu_device pointer
3408  *
3409  * Main teardown pass for hardware IPs.  The list of all the hardware
3410  * IPs that make up the asic is walked and the hw_fini and sw_fini callbacks
3411  * are run.  hw_fini tears down the hardware associated with each IP
3412  * and sw_fini tears down any software state associated with each IP.
3413  * Returns 0 on success, negative error code on failure.
3414  */
3415 static int amdgpu_device_ip_fini(struct amdgpu_device *adev)
3416 {
3417         int i, r;
3418
3419         if (amdgpu_sriov_vf(adev) && adev->virt.ras_init_done)
3420                 amdgpu_virt_release_ras_err_handler_data(adev);
3421
3422         if (adev->gmc.xgmi.num_physical_nodes > 1)
3423                 amdgpu_xgmi_remove_device(adev);
3424
3425         amdgpu_amdkfd_device_fini_sw(adev);
3426
3427         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3428                 if (!adev->ip_blocks[i].status.sw)
3429                         continue;
3430
3431                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) {
3432                         amdgpu_ucode_free_bo(adev);
3433                         amdgpu_free_static_csa(&adev->virt.csa_obj);
3434                         amdgpu_device_wb_fini(adev);
3435                         amdgpu_device_mem_scratch_fini(adev);
3436                         amdgpu_ib_pool_fini(adev);
3437                         amdgpu_seq64_fini(adev);
3438                 }
3439                 if (adev->ip_blocks[i].version->funcs->sw_fini) {
3440                         r = adev->ip_blocks[i].version->funcs->sw_fini(&adev->ip_blocks[i]);
3441                         /* XXX handle errors */
3442                         if (r) {
3443                                 DRM_DEBUG("sw_fini of IP block <%s> failed %d\n",
3444                                           adev->ip_blocks[i].version->funcs->name, r);
3445                         }
3446                 }
3447                 adev->ip_blocks[i].status.sw = false;
3448                 adev->ip_blocks[i].status.valid = false;
3449         }
3450
3451         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3452                 if (!adev->ip_blocks[i].status.late_initialized)
3453                         continue;
3454                 if (adev->ip_blocks[i].version->funcs->late_fini)
3455                         adev->ip_blocks[i].version->funcs->late_fini(&adev->ip_blocks[i]);
3456                 adev->ip_blocks[i].status.late_initialized = false;
3457         }
3458
3459         amdgpu_ras_fini(adev);
3460
3461         return 0;
3462 }
3463
3464 /**
3465  * amdgpu_device_delayed_init_work_handler - work handler for IB tests
3466  *
3467  * @work: work_struct.
3468  */
3469 static void amdgpu_device_delayed_init_work_handler(struct work_struct *work)
3470 {
3471         struct amdgpu_device *adev =
3472                 container_of(work, struct amdgpu_device, delayed_init_work.work);
3473         int r;
3474
3475         r = amdgpu_ib_ring_tests(adev);
3476         if (r)
3477                 DRM_ERROR("ib ring test failed (%d).\n", r);
3478 }
3479
3480 static void amdgpu_device_delay_enable_gfx_off(struct work_struct *work)
3481 {
3482         struct amdgpu_device *adev =
3483                 container_of(work, struct amdgpu_device, gfx.gfx_off_delay_work.work);
3484
3485         WARN_ON_ONCE(adev->gfx.gfx_off_state);
3486         WARN_ON_ONCE(adev->gfx.gfx_off_req_count);
3487
3488         if (!amdgpu_dpm_set_powergating_by_smu(adev, AMD_IP_BLOCK_TYPE_GFX, true, 0))
3489                 adev->gfx.gfx_off_state = true;
3490 }
3491
3492 /**
3493  * amdgpu_device_ip_suspend_phase1 - run suspend for hardware IPs (phase 1)
3494  *
3495  * @adev: amdgpu_device pointer
3496  *
3497  * Main suspend function for hardware IPs.  The list of all the hardware
3498  * IPs that make up the asic is walked, clockgating is disabled and the
3499  * suspend callbacks are run.  suspend puts the hardware and software state
3500  * in each IP into a state suitable for suspend.
3501  * Returns 0 on success, negative error code on failure.
3502  */
3503 static int amdgpu_device_ip_suspend_phase1(struct amdgpu_device *adev)
3504 {
3505         int i, r;
3506
3507         amdgpu_device_set_pg_state(adev, AMD_PG_STATE_UNGATE);
3508         amdgpu_device_set_cg_state(adev, AMD_CG_STATE_UNGATE);
3509
3510         /*
3511          * Per the PMFW team's suggestion, the driver needs to disable the
3512          * gfxoff and df cstate features in a gpu reset (e.g. Mode1Reset)
3513          * scenario. Add the missing df cstate disablement here.
3514          */
3515         if (amdgpu_dpm_set_df_cstate(adev, DF_CSTATE_DISALLOW))
3516                 dev_warn(adev->dev, "Failed to disallow df cstate");
3517
3518         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3519                 if (!adev->ip_blocks[i].status.valid)
3520                         continue;
3521
3522                 /* displays are handled separately */
3523                 if (adev->ip_blocks[i].version->type != AMD_IP_BLOCK_TYPE_DCE)
3524                         continue;
3525
3526                 /* XXX handle errors */
3527                 r = amdgpu_ip_block_suspend(&adev->ip_blocks[i]);
3528                 if (r)
3529                         return r;
3530         }
3531
3532         return 0;
3533 }
3534
3535 /**
3536  * amdgpu_device_ip_suspend_phase2 - run suspend for hardware IPs (phase 2)
3537  *
3538  * @adev: amdgpu_device pointer
3539  *
3540  * Main suspend function for hardware IPs.  The list of all the hardware
3541  * IPs that make up the asic is walked, clockgating is disabled and the
3542  * suspend callbacks are run.  suspend puts the hardware and software state
3543  * in each IP into a state suitable for suspend.
3544  * Returns 0 on success, negative error code on failure.
3545  */
3546 static int amdgpu_device_ip_suspend_phase2(struct amdgpu_device *adev)
3547 {
3548         int i, r;
3549
3550         if (adev->in_s0ix)
3551                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D3Entry);
3552
3553         for (i = adev->num_ip_blocks - 1; i >= 0; i--) {
3554                 if (!adev->ip_blocks[i].status.valid)
3555                         continue;
3556                 /* displays are handled in phase1 */
3557                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE)
3558                         continue;
3559                 /* PSP lost connection when err_event_athub occurs */
3560                 if (amdgpu_ras_intr_triggered() &&
3561                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
3562                         adev->ip_blocks[i].status.hw = false;
3563                         continue;
3564                 }
3565
3566                 /* skip unnecessary suspend if we have not initialized them yet */
3567                 if (!amdgpu_ip_member_of_hwini(
3568                             adev, adev->ip_blocks[i].version->type))
3569                         continue;
3570
3571                 /* skip suspend of gfx/mes and psp for S0ix:
3572                  * gfx is in the gfxoff state, so on resume it will exit gfxoff
3573                  * just like at runtime. PSP is also part of the always-on
3574                  * hardware, so there is no need to suspend it.
3575                  */
3576                 if (adev->in_s0ix &&
3577                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP ||
3578                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GFX ||
3579                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_MES))
3580                         continue;
3581
3582                 /* SDMA 5.x+ is part of GFX power domain so it's covered by GFXOFF */
3583                 if (adev->in_s0ix &&
3584                     (amdgpu_ip_version(adev, SDMA0_HWIP, 0) >=
3585                      IP_VERSION(5, 0, 0)) &&
3586                     (adev->ip_blocks[i].version->type ==
3587                      AMD_IP_BLOCK_TYPE_SDMA))
3588                         continue;
3589
3590                 /* During cold boot, swPSP provides the IMU and RLC FW binaries to TOS.
3591                  * These live in the TMR, so PSP-TOS is expected to reload them from
3592                  * that location, and RLC autoload is also triggered from there by the
3593                  * PMFW -> PSP message during the re-init sequence.
3594                  * Therefore, psp suspend & resume should be skipped on IMU-enabled
3595                  * APU ASICs to avoid destroying the TMR and reloading the FWs.
3596                  */
3597                 if (amdgpu_in_reset(adev) &&
3598                     (adev->flags & AMD_IS_APU) && adev->gfx.imu.funcs &&
3599                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3600                         continue;
3601
3602                 /* XXX handle errors */
3603                 r = amdgpu_ip_block_suspend(&adev->ip_blocks[i]);
3604                 adev->ip_blocks[i].status.hw = false;
3605
3606                 /* handle putting the SMC in the appropriate state */
3607                 if (!amdgpu_sriov_vf(adev)) {
3608                         if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) {
3609                                 r = amdgpu_dpm_set_mp1_state(adev, adev->mp1_state);
3610                                 if (r) {
3611                                         DRM_ERROR("SMC failed to set mp1 state %d, %d\n",
3612                                                         adev->mp1_state, r);
3613                                         return r;
3614                                 }
3615                         }
3616                 }
3617         }
3618
3619         return 0;
3620 }
3621
3622 /**
3623  * amdgpu_device_ip_suspend - run suspend for hardware IPs
3624  *
3625  * @adev: amdgpu_device pointer
3626  *
3627  * Main suspend function for hardware IPs.  The list of all the hardware
3628  * IPs that make up the asic is walked, clockgating is disabled and the
3629  * suspend callbacks are run.  suspend puts the hardware and software state
3630  * in each IP into a state suitable for suspend.
3631  * Returns 0 on success, negative error code on failure.
3632  */
3633 int amdgpu_device_ip_suspend(struct amdgpu_device *adev)
3634 {
3635         int r;
3636
3637         if (amdgpu_sriov_vf(adev)) {
3638                 amdgpu_virt_fini_data_exchange(adev);
3639                 amdgpu_virt_request_full_gpu(adev, false);
3640         }
3641
3642         amdgpu_ttm_set_buffer_funcs_status(adev, false);
3643
3644         r = amdgpu_device_ip_suspend_phase1(adev);
3645         if (r)
3646                 return r;
3647         r = amdgpu_device_ip_suspend_phase2(adev);
3648
3649         if (amdgpu_sriov_vf(adev))
3650                 amdgpu_virt_release_full_gpu(adev, false);
3651
3652         return r;
3653 }
3654
3655 static int amdgpu_device_ip_reinit_early_sriov(struct amdgpu_device *adev)
3656 {
3657         int i, r;
3658
3659         static enum amd_ip_block_type ip_order[] = {
3660                 AMD_IP_BLOCK_TYPE_COMMON,
3661                 AMD_IP_BLOCK_TYPE_GMC,
3662                 AMD_IP_BLOCK_TYPE_PSP,
3663                 AMD_IP_BLOCK_TYPE_IH,
3664         };
3665
3666         for (i = 0; i < adev->num_ip_blocks; i++) {
3667                 int j;
3668                 struct amdgpu_ip_block *block;
3669
3670                 block = &adev->ip_blocks[i];
3671                 block->status.hw = false;
3672
3673                 for (j = 0; j < ARRAY_SIZE(ip_order); j++) {
3674
3675                         if (block->version->type != ip_order[j] ||
3676                                 !block->status.valid)
3677                                 continue;
3678
3679                         r = block->version->funcs->hw_init(&adev->ip_blocks[i]);
3680                         if (r) {
3681                                 dev_err(adev->dev, "RE-INIT-early: %s failed\n",
3682                                          block->version->funcs->name);
3683                                 return r;
3684                         }
3685                         block->status.hw = true;
3686                 }
3687         }
3688
3689         return 0;
3690 }
3691
3692 static int amdgpu_device_ip_reinit_late_sriov(struct amdgpu_device *adev)
3693 {
3694         struct amdgpu_ip_block *block;
3695         int i, r = 0;
3696
3697         static enum amd_ip_block_type ip_order[] = {
3698                 AMD_IP_BLOCK_TYPE_SMC,
3699                 AMD_IP_BLOCK_TYPE_DCE,
3700                 AMD_IP_BLOCK_TYPE_GFX,
3701                 AMD_IP_BLOCK_TYPE_SDMA,
3702                 AMD_IP_BLOCK_TYPE_MES,
3703                 AMD_IP_BLOCK_TYPE_UVD,
3704                 AMD_IP_BLOCK_TYPE_VCE,
3705                 AMD_IP_BLOCK_TYPE_VCN,
3706                 AMD_IP_BLOCK_TYPE_JPEG
3707         };
3708
3709         for (i = 0; i < ARRAY_SIZE(ip_order); i++) {
3710                 block = amdgpu_device_ip_get_ip_block(adev, ip_order[i]);
3711
3712                 if (!block)
3713                         continue;
3714
3715                 if (block->status.valid && !block->status.hw) {
3716                         if (block->version->type == AMD_IP_BLOCK_TYPE_SMC) {
3717                                 r = amdgpu_ip_block_resume(block);
3718                         } else {
3719                                 r = block->version->funcs->hw_init(block);
3720                         }
3721
3722                         if (r) {
3723                                 dev_err(adev->dev, "RE-INIT-late: %s failed\n",
3724                                          block->version->funcs->name);
3725                                 break;
3726                         }
3727                         block->status.hw = true;
3728                 }
3729         }
3730
3731         return r;
3732 }
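
/*
 * Illustrative sketch (not driver code): the late SR-IOV re-init above is
 * an ordered pass over an unordered block list, driven by a fixed type
 * table.  A minimal stand-alone model (types and fields are made up):
 */
#if 0
#include <stdbool.h>
#include <stdio.h>

enum blk_type { BLK_SMC, BLK_DCE, BLK_GFX, BLK_SDMA };

struct blk { enum blk_type type; bool valid, hw; };

static struct blk *get_block(struct blk *blks, int n, enum blk_type type)
{
	for (int i = 0; i < n; i++)
		if (blks[i].type == type)
			return &blks[i];
	return NULL;
}

static void reinit_in_order(struct blk *blks, int n)
{
	static const enum blk_type order[] = { BLK_SMC, BLK_DCE, BLK_GFX, BLK_SDMA };

	for (size_t j = 0; j < sizeof(order) / sizeof(order[0]); j++) {
		struct blk *b = get_block(blks, n, order[j]);

		if (b && b->valid && !b->hw)
			b->hw = true; /* hw_init()/resume would run here */
	}
}

int main(void)
{
	struct blk blks[] = { { BLK_GFX, true, false }, { BLK_SMC, true, false } };

	reinit_in_order(blks, 2);
	printf("smc hw=%d gfx hw=%d\n", blks[1].hw, blks[0].hw);
	return 0;
}
#endif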
3733
3734 /**
3735  * amdgpu_device_ip_resume_phase1 - run resume for hardware IPs
3736  *
3737  * @adev: amdgpu_device pointer
3738  *
3739  * First resume function for hardware IPs.  The list of all the hardware
3740  * IPs that make up the asic is walked and the resume callbacks are run for
3741  * COMMON, GMC, and IH.  resume puts the hardware into a functional state
3742  * after a suspend and updates the software state as necessary.  This
3743  * function is also used for restoring the GPU after a GPU reset.
3744  * Returns 0 on success, negative error code on failure.
3745  */
3746 static int amdgpu_device_ip_resume_phase1(struct amdgpu_device *adev)
3747 {
3748         int i, r;
3749
3750         for (i = 0; i < adev->num_ip_blocks; i++) {
3751                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3752                         continue;
3753                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3754                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3755                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3756                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP && amdgpu_sriov_vf(adev))) {
3757
3758                         r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
3759                         if (r)
3760                                 return r;
3761                 }
3762         }
3763
3764         return 0;
3765 }
3766
3767 /**
3768  * amdgpu_device_ip_resume_phase2 - run resume for hardware IPs
3769  *
3770  * @adev: amdgpu_device pointer
3771  *
3772  * Second resume function for hardware IPs.  The list of all the hardware
3773  * IPs that make up the asic is walked and the resume callbacks are run for
3774  * all blocks except COMMON, GMC, and IH.  resume puts the hardware into a
3775  * functional state after a suspend and updates the software state as
3776  * necessary.  This function is also used for restoring the GPU after a GPU
3777  * reset.
3778  * Returns 0 on success, negative error code on failure.
3779  */
3780 static int amdgpu_device_ip_resume_phase2(struct amdgpu_device *adev)
3781 {
3782         int i, r;
3783
3784         for (i = 0; i < adev->num_ip_blocks; i++) {
3785                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3786                         continue;
3787                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_COMMON ||
3788                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC ||
3789                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_IH ||
3790                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE ||
3791                     adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP)
3792                         continue;
3793                 r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
3794                 if (r)
3795                         return r;
3796         }
3797
3798         return 0;
3799 }
3800
3801 /**
3802  * amdgpu_device_ip_resume_phase3 - run resume for hardware IPs
3803  *
3804  * @adev: amdgpu_device pointer
3805  *
3806  * Third resume function for hardware IPs.  The list of all the hardware
3807  * IPs that make up the asic is walked and the resume callbacks are run for
3808  * all DCE.  resume puts the hardware into a functional state after a suspend
3809  * and updates the software state as necessary.  This function is also used
3810  * for restoring the GPU after a GPU reset.
3811  *
3812  * Returns 0 on success, negative error code on failure.
3813  */
3814 static int amdgpu_device_ip_resume_phase3(struct amdgpu_device *adev)
3815 {
3816         int i, r;
3817
3818         for (i = 0; i < adev->num_ip_blocks; i++) {
3819                 if (!adev->ip_blocks[i].status.valid || adev->ip_blocks[i].status.hw)
3820                         continue;
3821                 if (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) {
3822                         r = amdgpu_ip_block_resume(&adev->ip_blocks[i]);
3823                         if (r)
3824                                 return r;
3825                 }
3826         }
3827
3828         return 0;
3829 }
3830
3831 /**
3832  * amdgpu_device_ip_resume - run resume for hardware IPs
3833  *
3834  * @adev: amdgpu_device pointer
3835  *
3836  * Main resume function for hardware IPs.  The hardware IPs
3837  * are split into multiple resume functions because they are
3838  * also used in recovering from a GPU reset and some additional
3839  * steps need to be taken between them.  In this case (S3/S4) they are
3840  * run sequentially.
3841  * Returns 0 on success, negative error code on failure.
3842  */
3843 static int amdgpu_device_ip_resume(struct amdgpu_device *adev)
3844 {
3845         int r;
3846
3847         r = amdgpu_device_ip_resume_phase1(adev);
3848         if (r)
3849                 return r;
3850
3851         r = amdgpu_device_fw_loading(adev);
3852         if (r)
3853                 return r;
3854
3855         r = amdgpu_device_ip_resume_phase2(adev);
3856
3857         if (adev->mman.buffer_funcs_ring->sched.ready)
3858                 amdgpu_ttm_set_buffer_funcs_status(adev, true);
3859
3860         if (r)
3861                 return r;
3862
3863         amdgpu_fence_driver_hw_init(adev);
3864
3865         r = amdgpu_device_ip_resume_phase3(adev);
3866
3867         return r;
3868 }
3869
3870 /**
3871  * amdgpu_device_detect_sriov_bios - determine if the board supports SR-IOV
3872  *
3873  * @adev: amdgpu_device pointer
3874  *
3875  * Query the VBIOS data tables to determine if the board supports SR-IOV.
3876  */
3877 static void amdgpu_device_detect_sriov_bios(struct amdgpu_device *adev)
3878 {
3879         if (amdgpu_sriov_vf(adev)) {
3880                 if (adev->is_atom_fw) {
3881                         if (amdgpu_atomfirmware_gpu_virtualization_supported(adev))
3882                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3883                 } else {
3884                         if (amdgpu_atombios_has_gpu_virtualization_table(adev))
3885                                 adev->virt.caps |= AMDGPU_SRIOV_CAPS_SRIOV_VBIOS;
3886                 }
3887
3888                 if (!(adev->virt.caps & AMDGPU_SRIOV_CAPS_SRIOV_VBIOS))
3889                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_NO_VBIOS, 0, 0);
3890         }
3891 }
3892
3893 /**
3894  * amdgpu_device_asic_has_dc_support - determine if DC supports the asic
3895  *
3896  * @asic_type: AMD asic type
3897  *
3898  * Check if there is DC (new modesetting infrastructure) support for an asic.
3899  * Returns true if DC has support, false if not.
3900  */
3901 bool amdgpu_device_asic_has_dc_support(enum amd_asic_type asic_type)
3902 {
3903         switch (asic_type) {
3904 #ifdef CONFIG_DRM_AMDGPU_SI
3905         case CHIP_HAINAN:
3906 #endif
3907         case CHIP_TOPAZ:
3908                 /* chips with no display hardware */
3909                 return false;
3910 #if defined(CONFIG_DRM_AMD_DC)
3911         case CHIP_TAHITI:
3912         case CHIP_PITCAIRN:
3913         case CHIP_VERDE:
3914         case CHIP_OLAND:
3915                 /*
3916                  * We have systems in the wild with these ASICs that require
3917                  * LVDS and VGA support which is not supported with DC.
3918                  *
3919                  * Fallback to the non-DC driver here by default so as not to
3920                  * cause regressions.
3921                  */
3922 #if defined(CONFIG_DRM_AMD_DC_SI)
3923                 return amdgpu_dc > 0;
3924 #else
3925                 return false;
3926 #endif
3927         case CHIP_BONAIRE:
3928         case CHIP_KAVERI:
3929         case CHIP_KABINI:
3930         case CHIP_MULLINS:
3931                 /*
3932                  * We have systems in the wild with these ASICs that require
3933                  * VGA support which is not supported with DC.
3934                  *
3935                  * Fallback to the non-DC driver here by default so as not to
3936                  * cause regressions.
3937                  */
3938                 return amdgpu_dc > 0;
3939         default:
3940                 return amdgpu_dc != 0;
3941 #else
3942         default:
3943                 if (amdgpu_dc > 0)
3944                         DRM_INFO_ONCE("Display Core has been requested via kernel parameter but isn't supported by ASIC, ignoring\n");
3945                 return false;
3946 #endif
3947         }
3948 }
3949
3950 /**
3951  * amdgpu_device_has_dc_support - check if dc is supported
3952  *
3953  * @adev: amdgpu_device pointer
3954  *
3955  * Returns true for supported, false for not supported
3956  */
3957 bool amdgpu_device_has_dc_support(struct amdgpu_device *adev)
3958 {
3959         if (adev->enable_virtual_display ||
3960             (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
3961                 return false;
3962
3963         return amdgpu_device_asic_has_dc_support(adev->asic_type);
3964 }
3965
3966 static void amdgpu_device_xgmi_reset_func(struct work_struct *__work)
3967 {
3968         struct amdgpu_device *adev =
3969                 container_of(__work, struct amdgpu_device, xgmi_reset_work);
3970         struct amdgpu_hive_info *hive = amdgpu_get_xgmi_hive(adev);
3971
3972         /* It's a bug to not have a hive within this function */
3973         if (WARN_ON(!hive))
3974                 return;
3975
3976         /*
3977          * Use task barrier to synchronize all xgmi reset works across the
3978          * hive. task_barrier_enter and task_barrier_exit will block
3979          * until all the threads running the xgmi reset works reach
3980          * those points. task_barrier_full will do both blocks.
3981          */
3982         if (amdgpu_asic_reset_method(adev) == AMD_RESET_METHOD_BACO) {
3983
3984                 task_barrier_enter(&hive->tb);
3985                 adev->asic_reset_res = amdgpu_device_baco_enter(adev_to_drm(adev));
3986
3987                 if (adev->asic_reset_res)
3988                         goto fail;
3989
3990                 task_barrier_exit(&hive->tb);
3991                 adev->asic_reset_res = amdgpu_device_baco_exit(adev_to_drm(adev));
3992
3993                 if (adev->asic_reset_res)
3994                         goto fail;
3995
3996                 amdgpu_ras_reset_error_count(adev, AMDGPU_RAS_BLOCK__MMHUB);
3997         } else {
3998
3999                 task_barrier_full(&hive->tb);
4000                 adev->asic_reset_res =  amdgpu_asic_reset(adev);
4001         }
4002
4003 fail:
4004         if (adev->asic_reset_res)
4005                 DRM_WARN("ASIC reset failed with error, %d for drm dev, %s",
4006                          adev->asic_reset_res, adev_to_drm(adev)->unique);
4007         amdgpu_put_xgmi_hive(hive);
4008 }
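
/*
 * Illustrative sketch (not driver code): task_barrier_enter/exit above make
 * every device in the hive rendezvous before and after the BACO steps.  The
 * same rendezvous can be modeled with a plain POSIX barrier, assuming a
 * hypothetical two-device hive (build with -lpthread):
 */
#if 0
#define _POSIX_C_SOURCE 200809L
#include <pthread.h>
#include <stdio.h>

#define NUM_DEVICES 2

static pthread_barrier_t tb;

static void *xgmi_reset_work(void *arg)
{
	int dev = *(int *)arg;

	pthread_barrier_wait(&tb);          /* ~ task_barrier_enter() */
	printf("dev %d: enter baco\n", dev);

	pthread_barrier_wait(&tb);          /* ~ task_barrier_exit() */
	printf("dev %d: exit baco\n", dev);
	return NULL;
}

int main(void)
{
	pthread_t th[NUM_DEVICES];
	int ids[NUM_DEVICES] = { 0, 1 };
	int i;

	pthread_barrier_init(&tb, NULL, NUM_DEVICES);
	for (i = 0; i < NUM_DEVICES; i++)
		pthread_create(&th[i], NULL, xgmi_reset_work, &ids[i]);
	for (i = 0; i < NUM_DEVICES; i++)
		pthread_join(th[i], NULL);
	pthread_barrier_destroy(&tb);
	return 0;
}
#endif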
4009
4010 static int amdgpu_device_get_job_timeout_settings(struct amdgpu_device *adev)
4011 {
4012         char *input = amdgpu_lockup_timeout;
4013         char *timeout_setting = NULL;
4014         int index = 0;
4015         long timeout;
4016         int ret = 0;
4017
4018         /*
4019          * By default the timeout for non-compute jobs is 10000 ms
4020          * and 60000 ms for compute jobs.
4021          * In SR-IOV or passthrough mode, the timeout for compute
4022          * jobs is 60000 ms by default.
4023          */
4024         adev->gfx_timeout = msecs_to_jiffies(10000);
4025         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
4026         if (amdgpu_sriov_vf(adev))
4027                 adev->compute_timeout = amdgpu_sriov_is_pp_one_vf(adev) ?
4028                                         msecs_to_jiffies(60000) : msecs_to_jiffies(10000);
4029         else
4030                 adev->compute_timeout =  msecs_to_jiffies(60000);
4031
4032         if (strnlen(input, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
4033                 while ((timeout_setting = strsep(&input, ",")) &&
4034                                 strnlen(timeout_setting, AMDGPU_MAX_TIMEOUT_PARAM_LENGTH)) {
4035                         ret = kstrtol(timeout_setting, 0, &timeout);
4036                         if (ret)
4037                                 return ret;
4038
4039                         if (timeout == 0) {
4040                                 index++;
4041                                 continue;
4042                         } else if (timeout < 0) {
4043                                 timeout = MAX_SCHEDULE_TIMEOUT;
4044                                 dev_warn(adev->dev, "lockup timeout disabled");
4045                                 add_taint(TAINT_SOFTLOCKUP, LOCKDEP_STILL_OK);
4046                         } else {
4047                                 timeout = msecs_to_jiffies(timeout);
4048                         }
4049
4050                         switch (index++) {
4051                         case 0:
4052                                 adev->gfx_timeout = timeout;
4053                                 break;
4054                         case 1:
4055                                 adev->compute_timeout = timeout;
4056                                 break;
4057                         case 2:
4058                                 adev->sdma_timeout = timeout;
4059                                 break;
4060                         case 3:
4061                                 adev->video_timeout = timeout;
4062                                 break;
4063                         default:
4064                                 break;
4065                         }
4066                 }
4067                 /*
4068                  * There is only one value specified and
4069                  * it should apply to all non-compute jobs.
4070                  */
4071                 if (index == 1) {
4072                         adev->sdma_timeout = adev->video_timeout = adev->gfx_timeout;
4073                         if (amdgpu_sriov_vf(adev) || amdgpu_passthrough(adev))
4074                                 adev->compute_timeout = adev->gfx_timeout;
4075                 }
4076         }
4077
4078         return ret;
4079 }
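
/*
 * Illustrative sketch (not driver code): the lockup-timeout string above is
 * "gfx[,compute[,sdma[,video]]]", where 0 keeps the default and a negative
 * value disables the timeout.  A stand-alone parser of the same shape,
 * assuming plain libc (strsep/strtol in place of kstrtol):
 */
#if 0
#define _DEFAULT_SOURCE
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

int main(void)
{
	char input[] = "1000,0,50000";  /* gfx, compute (keep default), sdma */
	long t[4] = { 10000, 60000, 10000, 10000 }; /* gfx, compute, sdma, video */
	char *s, *p = input;
	int index = 0;

	/* Like the loop above: stop at the first empty token. */
	while ((s = strsep(&p, ",")) && *s && index < 4) {
		long v = strtol(s, NULL, 0);

		if (v < 0)
			v = -1;          /* stand-in for MAX_SCHEDULE_TIMEOUT */
		if (v != 0)
			t[index] = v;    /* 0 keeps the default */
		index++;
	}

	printf("gfx=%ld compute=%ld sdma=%ld video=%ld\n",
	       t[0], t[1], t[2], t[3]);
	return 0;
}
#endif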
4080
4081 /**
4082  * amdgpu_device_check_iommu_direct_map - check if RAM direct mapped to GPU
4083  *
4084  * @adev: amdgpu_device pointer
4085  *
4086  * RAM is direct mapped to the GPU if the IOMMU is not enabled or is in passthrough mode.
4087  */
4088 static void amdgpu_device_check_iommu_direct_map(struct amdgpu_device *adev)
4089 {
4090         struct iommu_domain *domain;
4091
4092         domain = iommu_get_domain_for_dev(adev->dev);
4093         if (!domain || domain->type == IOMMU_DOMAIN_IDENTITY)
4094                 adev->ram_is_direct_mapped = true;
4095 }
4096
4097 #if defined(CONFIG_HSA_AMD_P2P)
4098 /**
4099  * amdgpu_device_check_iommu_remap - Check if DMA remapping is enabled.
4100  *
4101  * @adev: amdgpu_device pointer
4102  *
4103  * Returns true if the IOMMU is remapping the BAR address, false otherwise.
4104  */
4105 static bool amdgpu_device_check_iommu_remap(struct amdgpu_device *adev)
4106 {
4107         struct iommu_domain *domain;
4108
4109         domain = iommu_get_domain_for_dev(adev->dev);
4110         if (domain && (domain->type == IOMMU_DOMAIN_DMA ||
4111                 domain->type == IOMMU_DOMAIN_DMA_FQ))
4112                 return true;
4113
4114         return false;
4115 }
4116 #endif
4117
4118 static const struct attribute *amdgpu_dev_attributes[] = {
4119         &dev_attr_pcie_replay_count.attr,
4120         NULL
4121 };
4122
4123 static void amdgpu_device_set_mcbp(struct amdgpu_device *adev)
4124 {
4125         if (amdgpu_mcbp == 1)
4126                 adev->gfx.mcbp = true;
4127         else if (amdgpu_mcbp == 0)
4128                 adev->gfx.mcbp = false;
4129
4130         if (amdgpu_sriov_vf(adev))
4131                 adev->gfx.mcbp = true;
4132
4133         if (adev->gfx.mcbp)
4134                 DRM_INFO("MCBP is enabled\n");
4135 }
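
/*
 * Illustrative sketch (not driver code): amdgpu_mcbp is a tri-state module
 * parameter (-1 auto, 0 off, 1 on), and SR-IOV VFs force it on.  The
 * resolution above reduces to the following (names here are made up):
 */
#if 0
#include <stdbool.h>
#include <stdio.h>

static bool resolve_mcbp(int param, bool auto_default, bool is_sriov_vf)
{
	bool mcbp = auto_default;       /* whatever earlier init chose */

	if (param == 1)
		mcbp = true;
	else if (param == 0)
		mcbp = false;

	return is_sriov_vf ? true : mcbp;
}

int main(void)
{
	/* A VF stays on even when the parameter asks for off. */
	printf("vf, param=0 -> %d\n", resolve_mcbp(0, false, true));
	return 0;
}
#endif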
4136
4137 /**
4138  * amdgpu_device_init - initialize the driver
4139  *
4140  * @adev: amdgpu_device pointer
4141  * @flags: driver flags
4142  *
4143  * Initializes the driver info and hw (all asics).
4144  * Returns 0 for success or an error on failure.
4145  * Called at driver startup.
4146  */
4147 int amdgpu_device_init(struct amdgpu_device *adev,
4148                        uint32_t flags)
4149 {
4150         struct drm_device *ddev = adev_to_drm(adev);
4151         struct pci_dev *pdev = adev->pdev;
4152         int r, i;
4153         bool px = false;
4154         u32 max_MBps;
4155         int tmp;
4156
4157         adev->shutdown = false;
4158         adev->flags = flags;
4159
4160         if (amdgpu_force_asic_type >= 0 && amdgpu_force_asic_type < CHIP_LAST)
4161                 adev->asic_type = amdgpu_force_asic_type;
4162         else
4163                 adev->asic_type = flags & AMD_ASIC_MASK;
4164
4165         adev->usec_timeout = AMDGPU_MAX_USEC_TIMEOUT;
4166         if (amdgpu_emu_mode == 1)
4167                 adev->usec_timeout *= 10;
4168         adev->gmc.gart_size = 512 * 1024 * 1024;
4169         adev->accel_working = false;
4170         adev->num_rings = 0;
4171         RCU_INIT_POINTER(adev->gang_submit, dma_fence_get_stub());
4172         adev->mman.buffer_funcs = NULL;
4173         adev->mman.buffer_funcs_ring = NULL;
4174         adev->vm_manager.vm_pte_funcs = NULL;
4175         adev->vm_manager.vm_pte_num_scheds = 0;
4176         adev->gmc.gmc_funcs = NULL;
4177         adev->harvest_ip_mask = 0x0;
4178         adev->fence_context = dma_fence_context_alloc(AMDGPU_MAX_RINGS);
4179         bitmap_zero(adev->gfx.pipe_reserve_bitmap, AMDGPU_MAX_COMPUTE_QUEUES);
4180
4181         adev->smc_rreg = &amdgpu_invalid_rreg;
4182         adev->smc_wreg = &amdgpu_invalid_wreg;
4183         adev->pcie_rreg = &amdgpu_invalid_rreg;
4184         adev->pcie_wreg = &amdgpu_invalid_wreg;
4185         adev->pcie_rreg_ext = &amdgpu_invalid_rreg_ext;
4186         adev->pcie_wreg_ext = &amdgpu_invalid_wreg_ext;
4187         adev->pciep_rreg = &amdgpu_invalid_rreg;
4188         adev->pciep_wreg = &amdgpu_invalid_wreg;
4189         adev->pcie_rreg64 = &amdgpu_invalid_rreg64;
4190         adev->pcie_wreg64 = &amdgpu_invalid_wreg64;
4191         adev->pcie_rreg64_ext = &amdgpu_invalid_rreg64_ext;
4192         adev->pcie_wreg64_ext = &amdgpu_invalid_wreg64_ext;
4193         adev->uvd_ctx_rreg = &amdgpu_invalid_rreg;
4194         adev->uvd_ctx_wreg = &amdgpu_invalid_wreg;
4195         adev->didt_rreg = &amdgpu_invalid_rreg;
4196         adev->didt_wreg = &amdgpu_invalid_wreg;
4197         adev->gc_cac_rreg = &amdgpu_invalid_rreg;
4198         adev->gc_cac_wreg = &amdgpu_invalid_wreg;
4199         adev->audio_endpt_rreg = &amdgpu_block_invalid_rreg;
4200         adev->audio_endpt_wreg = &amdgpu_block_invalid_wreg;
4201
4202         DRM_INFO("initializing kernel modesetting (%s 0x%04X:0x%04X 0x%04X:0x%04X 0x%02X).\n",
4203                  amdgpu_asic_name[adev->asic_type], pdev->vendor, pdev->device,
4204                  pdev->subsystem_vendor, pdev->subsystem_device, pdev->revision);
4205
4206         /* mutex initializations are all done here so we
4207          * can call this function again without locking issues
4208          */
4209         mutex_init(&adev->firmware.mutex);
4210         mutex_init(&adev->pm.mutex);
4211         mutex_init(&adev->gfx.gpu_clock_mutex);
4212         mutex_init(&adev->srbm_mutex);
4213         mutex_init(&adev->gfx.pipe_reserve_mutex);
4214         mutex_init(&adev->gfx.gfx_off_mutex);
4215         mutex_init(&adev->gfx.partition_mutex);
4216         mutex_init(&adev->grbm_idx_mutex);
4217         mutex_init(&adev->mn_lock);
4218         mutex_init(&adev->virt.vf_errors.lock);
4219         mutex_init(&adev->virt.rlcg_reg_lock);
4220         hash_init(adev->mn_hash);
4221         mutex_init(&adev->psp.mutex);
4222         mutex_init(&adev->notifier_lock);
4223         mutex_init(&adev->pm.stable_pstate_ctx_lock);
4224         mutex_init(&adev->benchmark_mutex);
4225         mutex_init(&adev->gfx.reset_sem_mutex);
4226         /* Initialize the mutex for cleaner shader isolation between GFX and compute processes */
4227         mutex_init(&adev->enforce_isolation_mutex);
4228         mutex_init(&adev->gfx.kfd_sch_mutex);
4229
4230         amdgpu_device_init_apu_flags(adev);
4231
4232         r = amdgpu_device_check_arguments(adev);
4233         if (r)
4234                 return r;
4235
4236         spin_lock_init(&adev->mmio_idx_lock);
4237         spin_lock_init(&adev->smc_idx_lock);
4238         spin_lock_init(&adev->pcie_idx_lock);
4239         spin_lock_init(&adev->uvd_ctx_idx_lock);
4240         spin_lock_init(&adev->didt_idx_lock);
4241         spin_lock_init(&adev->gc_cac_idx_lock);
4242         spin_lock_init(&adev->se_cac_idx_lock);
4243         spin_lock_init(&adev->audio_endpt_idx_lock);
4244         spin_lock_init(&adev->mm_stats.lock);
4245         spin_lock_init(&adev->wb.lock);
4246
4247         INIT_LIST_HEAD(&adev->reset_list);
4248
4249         INIT_LIST_HEAD(&adev->ras_list);
4250
4251         INIT_LIST_HEAD(&adev->pm.od_kobj_list);
4252
4253         INIT_DELAYED_WORK(&adev->delayed_init_work,
4254                           amdgpu_device_delayed_init_work_handler);
4255         INIT_DELAYED_WORK(&adev->gfx.gfx_off_delay_work,
4256                           amdgpu_device_delay_enable_gfx_off);
4257         /*
4258          * Initialize the enforce_isolation work structures for each XCP
4259          * partition.  This work handler is responsible for enforcing shader
4260          * isolation on AMD GPUs.  It counts the number of emitted fences for
4261          * each GFX and compute ring.  If there are any fences, it schedules
4262          * the `enforce_isolation_work` to be run after a delay.  If there are
4263          * no fences, it signals the Kernel Fusion Driver (KFD) to resume the
4264          * runqueue.
4265          */
4266         for (i = 0; i < MAX_XCP; i++) {
4267                 INIT_DELAYED_WORK(&adev->gfx.enforce_isolation[i].work,
4268                                   amdgpu_gfx_enforce_isolation_handler);
4269                 adev->gfx.enforce_isolation[i].adev = adev;
4270                 adev->gfx.enforce_isolation[i].xcp_id = i;
4271         }
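
        /*
         * Editor's illustrative sketch (not driver code): the decision shape
         * described above, reduced to a single ring.  The real handler is
         * amdgpu_gfx_enforce_isolation_handler(), which walks every GFX and
         * compute ring of the partition; example_signal_kfd_resume() is a
         * hypothetical placeholder for the KFD resume signal.
         *
         *   static void example_isolation_tick(struct amdgpu_device *adev,
         *                                      int xcp_id)
         *   {
         *           struct amdgpu_ring *ring = &adev->gfx.gfx_ring[0];
         *
         *           if (amdgpu_fence_count_emitted(ring))
         *                   schedule_delayed_work(
         *                           &adev->gfx.enforce_isolation[xcp_id].work,
         *                           msecs_to_jiffies(1));
         *           else
         *                   example_signal_kfd_resume(adev, xcp_id);
         *   }
         */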
4272
4273         INIT_WORK(&adev->xgmi_reset_work, amdgpu_device_xgmi_reset_func);
4274
4275         adev->gfx.gfx_off_req_count = 1;
4276         adev->gfx.gfx_off_residency = 0;
4277         adev->gfx.gfx_off_entrycount = 0;
4278         adev->pm.ac_power = power_supply_is_system_supplied() > 0;
4279
4280         atomic_set(&adev->throttling_logging_enabled, 1);
4281         /*
4282          * If throttling continues, logging will be performed every minute
4283          * to avoid log flooding. "-1" is subtracted since the thermal
4284          * throttling interrupt comes every second. Thus, the total logging
4285          * interval is 59 seconds (ratelimited printk interval) + 1 (waiting
4286          * for the throttling interrupt) = 60 seconds.
4287          */
4288         ratelimit_state_init(&adev->throttling_logging_rs, (60 - 1) * HZ, 1);
4289         ratelimit_state_init(&adev->virt.ras_telemetry_rs, 5 * HZ, 1);
4290
4291         ratelimit_set_flags(&adev->throttling_logging_rs, RATELIMIT_MSG_ON_RELEASE);
4292         ratelimit_set_flags(&adev->virt.ras_telemetry_rs, RATELIMIT_MSG_ON_RELEASE);
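
        /*
         * Editor's illustrative sketch (not driver code): how a ratelimit
         * state such as throttling_logging_rs is typically consumed.
         * Assuming the thermal interrupt fires about once per second,
         * __ratelimit() lets one message through per 59 s window, giving the
         * 60 s cadence described above.
         *
         *   static void example_throttling_interrupt(struct amdgpu_device *adev)
         *   {
         *           if (__ratelimit(&adev->throttling_logging_rs))
         *                   dev_warn(adev->dev, "thermal throttling logged\n");
         *   }
         */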
4293
4294         /* Registers mapping */
4295         /* TODO: block userspace mapping of io register */
4296         if (adev->asic_type >= CHIP_BONAIRE) {
4297                 adev->rmmio_base = pci_resource_start(adev->pdev, 5);
4298                 adev->rmmio_size = pci_resource_len(adev->pdev, 5);
4299         } else {
4300                 adev->rmmio_base = pci_resource_start(adev->pdev, 2);
4301                 adev->rmmio_size = pci_resource_len(adev->pdev, 2);
4302         }
4303
4304         for (i = 0; i < AMD_IP_BLOCK_TYPE_NUM; i++)
4305                 atomic_set(&adev->pm.pwr_state[i], POWER_STATE_UNKNOWN);
4306
4307         adev->rmmio = ioremap(adev->rmmio_base, adev->rmmio_size);
4308         if (!adev->rmmio)
4309                 return -ENOMEM;
4310
4311         DRM_INFO("register mmio base: 0x%08X\n", (uint32_t)adev->rmmio_base);
4312         DRM_INFO("register mmio size: %u\n", (unsigned int)adev->rmmio_size);
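
        /*
         * Editor's illustrative sketch (not driver code): with adev->rmmio
         * mapped, a plain register read reduces to offset arithmetic on the
         * mapping; the real RREG32 path (amdgpu_device_rreg()) layers range
         * checks and SR-IOV indirection on top of this.
         *
         *   static u32 example_mmio_read(struct amdgpu_device *adev, u32 reg)
         *   {
         *           return readl(adev->rmmio + (reg * 4));
         *   }
         */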
4313
4314         /*
4315          * The reset domain needs to be present early, before any XGMI hive
4316          * is discovered and initialized, so that the reset semaphore and
4317          * in_gpu_reset flag are usable early in init, before the first RREG32.
4318          */
4319         adev->reset_domain = amdgpu_reset_create_reset_domain(SINGLE_DEVICE, "amdgpu-reset-dev");
4320         if (!adev->reset_domain)
4321                 return -ENOMEM;
4322
4323         /* detect hw virtualization here */
4324         amdgpu_detect_virtualization(adev);
4325
4326         amdgpu_device_get_pcie_info(adev);
4327
4328         r = amdgpu_device_get_job_timeout_settings(adev);
4329         if (r) {
4330                 dev_err(adev->dev, "invalid lockup_timeout parameter syntax\n");
4331                 return r;
4332         }
4333
4334         amdgpu_device_set_mcbp(adev);
4335
4336         /*
4337          * By default, use the default init level, where all blocks are
4338          * expected to be initialized. At present, software init ('swinit')
4339          * of the blocks must complete before a different level is detected.
4340          */
4341         amdgpu_set_init_level(adev, AMDGPU_INIT_LEVEL_DEFAULT);
4342         /* early init functions */
4343         r = amdgpu_device_ip_early_init(adev);
4344         if (r)
4345                 return r;
4346
4347         /* Get rid of things like offb */
4348         r = aperture_remove_conflicting_pci_devices(adev->pdev, amdgpu_kms_driver.name);
4349         if (r)
4350                 return r;
4351
4352         /* Enable TMZ based on IP_VERSION */
4353         amdgpu_gmc_tmz_set(adev);
4354
4355         if (amdgpu_sriov_vf(adev) &&
4356             amdgpu_ip_version(adev, GC_HWIP, 0) >= IP_VERSION(10, 3, 0))
4357                 /* VF MMIO access (except mailbox range) from CPU
4358                  * will be blocked during sriov runtime
4359                  */
4360                 adev->virt.caps |= AMDGPU_VF_MMIO_ACCESS_PROTECT;
4361
4362         amdgpu_gmc_noretry_set(adev);
4363         /* Need to get xgmi info early to decide the reset behavior */
4364         if (adev->gmc.xgmi.supported) {
4365                 r = adev->gfxhub.funcs->get_xgmi_info(adev);
4366                 if (r)
4367                         return r;
4368         }
4369
4370         /* enable PCIE atomic ops */
4371         if (amdgpu_sriov_vf(adev)) {
4372                 if (adev->virt.fw_reserve.p_pf2vf)
4373                         adev->have_atomics_support = ((struct amd_sriov_msg_pf2vf_info *)
4374                                                       adev->virt.fw_reserve.p_pf2vf)->pcie_atomic_ops_support_flags ==
4375                                 (PCI_EXP_DEVCAP2_ATOMIC_COMP32 | PCI_EXP_DEVCAP2_ATOMIC_COMP64);
4376         /* APUs with gfx9 onwards don't rely on PCIe atomics; their internal
4377          * path natively supports atomics, so set have_atomics_support to true.
4378          */
4379         } else if ((adev->flags & AMD_IS_APU) &&
4380                    (amdgpu_ip_version(adev, GC_HWIP, 0) >
4381                     IP_VERSION(9, 0, 0))) {
4382                 adev->have_atomics_support = true;
4383         } else {
4384                 adev->have_atomics_support =
4385                         !pci_enable_atomic_ops_to_root(adev->pdev,
4386                                           PCI_EXP_DEVCAP2_ATOMIC_COMP32 |
4387                                           PCI_EXP_DEVCAP2_ATOMIC_COMP64);
4388         }
4389
4390         if (!adev->have_atomics_support)
4391                 dev_info(adev->dev, "PCIE atomic ops are not supported\n");
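
        /*
         * Editor's illustrative sketch (not driver code): the SR-IOV branch
         * above accepts the PF-reported flags only when *both* completer
         * capabilities are advertised; a partial mask counts as no support.
         *
         *   static bool example_atomic_caps_ok(u32 flags)
         *   {
         *           return flags == (PCI_EXP_DEVCAP2_ATOMIC_COMP32 |
         *                            PCI_EXP_DEVCAP2_ATOMIC_COMP64);
         *   }
         */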
4392
4393         /* doorbell bar mapping and doorbell index init */
4394         amdgpu_doorbell_init(adev);
4395
4396         if (amdgpu_emu_mode == 1) {
4397                 /* post the asic on emulation mode */
4398                 emu_soc_asic_init(adev);
4399                 goto fence_driver_init;
4400         }
4401
4402         amdgpu_reset_init(adev);
4403
4404         /* detect whether we are running with an SR-IOV vBIOS */
4405         if (adev->bios)
4406                 amdgpu_device_detect_sriov_bios(adev);
4407
4408         /* check if we need to reset the asic
4409          *  E.g., driver was not cleanly unloaded previously, etc.
4410          */
4411         if (!amdgpu_sriov_vf(adev) && amdgpu_asic_need_reset_on_init(adev)) {
4412                 if (adev->gmc.xgmi.num_physical_nodes) {
4413                         dev_info(adev->dev, "Pending hive reset.\n");
4414                         amdgpu_set_init_level(adev,
4415                                               AMDGPU_INIT_LEVEL_MINIMAL_XGMI);
4416                 } else if (amdgpu_ip_version(adev, MP1_HWIP, 0) == IP_VERSION(13, 0, 10) &&
4417                            !amdgpu_device_has_display_hardware(adev)) {
4418                         r = psp_gpu_reset(adev);
4419                 } else {
4420                         tmp = amdgpu_reset_method;
4421                         /* It should do a default reset when loading or reloading the driver,
4422                          * regardless of the module parameter reset_method.
4423                          */
4424                         amdgpu_reset_method = AMD_RESET_METHOD_NONE;
4425                         r = amdgpu_asic_reset(adev);
4426                         amdgpu_reset_method = tmp;
4427                 }
4428
4429                 if (r) {
4430                         dev_err(adev->dev, "asic reset on init failed\n");
4431                         goto failed;
4432                 }
4433         }
4434
4435         /* Post card if necessary */
4436         if (amdgpu_device_need_post(adev)) {
4437                 if (!adev->bios) {
4438                         dev_err(adev->dev, "no vBIOS found\n");
4439                         r = -EINVAL;
4440                         goto failed;
4441                 }
4442                 DRM_INFO("GPU posting now...\n");
4443                 r = amdgpu_device_asic_init(adev);
4444                 if (r) {
4445                         dev_err(adev->dev, "gpu post error!\n");
4446                         goto failed;
4447                 }
4448         }
4449
4450         if (adev->bios) {
4451                 if (adev->is_atom_fw) {
4452                         /* Initialize clocks */
4453                         r = amdgpu_atomfirmware_get_clock_info(adev);
4454                         if (r) {
4455                                 dev_err(adev->dev, "amdgpu_atomfirmware_get_clock_info failed\n");
4456                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
4457                                 goto failed;
4458                         }
4459                 } else {
4460                         /* Initialize clocks */
4461                         r = amdgpu_atombios_get_clock_info(adev);
4462                         if (r) {
4463                                 dev_err(adev->dev, "amdgpu_atombios_get_clock_info failed\n");
4464                                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_ATOMBIOS_GET_CLOCK_FAIL, 0, 0);
4465                                 goto failed;
4466                         }
4467                         /* init i2c buses */
4468                         if (!amdgpu_device_has_dc_support(adev))
4469                                 amdgpu_atombios_i2c_init(adev);
4470                 }
4471         }
4472
4473 fence_driver_init:
4474         /* Fence driver */
4475         r = amdgpu_fence_driver_sw_init(adev);
4476         if (r) {
4477                 dev_err(adev->dev, "amdgpu_fence_driver_sw_init failed\n");
4478                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_FENCE_INIT_FAIL, 0, 0);
4479                 goto failed;
4480         }
4481
4482         /* init the mode config */
4483         drm_mode_config_init(adev_to_drm(adev));
4484
4485         r = amdgpu_device_ip_init(adev);
4486         if (r) {
4487                 dev_err(adev->dev, "amdgpu_device_ip_init failed\n");
4488                 amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_INIT_FAIL, 0, 0);
4489                 goto release_ras_con;
4490         }
4491
4492         amdgpu_fence_driver_hw_init(adev);
4493
4494         dev_info(adev->dev,
4495                  "SE %d, SH per SE %d, CU per SH %d, active_cu_number %d\n",
4496                  adev->gfx.config.max_shader_engines,
4497                  adev->gfx.config.max_sh_per_se,
4498                  adev->gfx.config.max_cu_per_sh,
4499                  adev->gfx.cu_info.number);
4500
4501         adev->accel_working = true;
4502
4503         amdgpu_vm_check_compute_bug(adev);
4504
4505         /* Initialize the buffer migration limit. */
4506         if (amdgpu_moverate >= 0)
4507                 max_MBps = amdgpu_moverate;
4508         else
4509                 max_MBps = 8; /* Allow 8 MB/s. */
4510         /* Get a log2 for easy divisions. */
4511         adev->mm_stats.log2_max_MBps = ilog2(max(1u, max_MBps));
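
        /*
         * Editor's illustrative sketch (not driver code): why a log2 is
         * stored.  At 2^log2_max_MBps MB/s, 1 MB/s equals 1 byte/us, so a
         * byte budget for a slice of t microseconds becomes a shift instead
         * of a divide (this mirrors the mm_stats accounting in amdgpu_cs.c).
         *
         *   static u64 example_budget_bytes(struct amdgpu_device *adev, u64 us)
         *   {
         *           return us << adev->mm_stats.log2_max_MBps;
         *   }
         */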
4512
4513         /*
4514          * Register the gpu instance before amdgpu_device_enable_mgpu_fan_boost.
4515          * Otherwise the mgpu fan boost feature will be skipped because the
4516          * gpu instance count would be too low.
4517          */
4518         amdgpu_register_gpu_instance(adev);
4519
4520         /* enable clockgating, etc. after ib tests, etc. since some blocks require
4521          * explicit gating rather than handling it automatically.
4522          */
4523         if (adev->init_lvl->level != AMDGPU_INIT_LEVEL_MINIMAL_XGMI) {
4524                 r = amdgpu_device_ip_late_init(adev);
4525                 if (r) {
4526                         dev_err(adev->dev, "amdgpu_device_ip_late_init failed\n");
4527                         amdgpu_vf_error_put(adev, AMDGIM_ERROR_VF_AMDGPU_LATE_INIT_FAIL, 0, r);
4528                         goto release_ras_con;
4529                 }
4530                 /* must succeed. */
4531                 amdgpu_ras_resume(adev);
4532                 queue_delayed_work(system_wq, &adev->delayed_init_work,
4533                                    msecs_to_jiffies(AMDGPU_RESUME_MS));
4534         }
4535
4536         if (amdgpu_sriov_vf(adev)) {
4537                 amdgpu_virt_release_full_gpu(adev, true);
4538                 flush_delayed_work(&adev->delayed_init_work);
4539         }
4540
4541         /*
4542          * Register these sysfs interfaces after `late_init`, since some of
4543          * the operations performed in `late_init` might affect their
4544          * creation.
4545          */
4546         r = amdgpu_atombios_sysfs_init(adev);
4547         if (r)
4548                 drm_err(&adev->ddev,
4549                         "registering atombios sysfs failed (%d).\n", r);
4550
4551         r = amdgpu_pm_sysfs_init(adev);
4552         if (r)
4553                 DRM_ERROR("registering pm sysfs failed (%d).\n", r);
4554
4555         r = amdgpu_ucode_sysfs_init(adev);
4556         if (r) {
4557                 adev->ucode_sysfs_en = false;
4558                 DRM_ERROR("Creating firmware sysfs failed (%d).\n", r);
4559         } else
4560                 adev->ucode_sysfs_en = true;
4561
4562         r = sysfs_create_files(&adev->dev->kobj, amdgpu_dev_attributes);
4563         if (r)
4564                 dev_err(adev->dev, "Could not create amdgpu device attr\n");
4565
4566         r = devm_device_add_group(adev->dev, &amdgpu_board_attrs_group);
4567         if (r)
4568                 dev_err(adev->dev,
4569                         "Could not create amdgpu board attributes\n");
4570
4571         amdgpu_fru_sysfs_init(adev);
4572         amdgpu_reg_state_sysfs_init(adev);
4573         amdgpu_xcp_cfg_sysfs_init(adev);
4574
4575         if (IS_ENABLED(CONFIG_PERF_EVENTS)) {
4576                 if (amdgpu_pmu_init(adev))
4577                         dev_err(adev->dev, "amdgpu_pmu_init failed\n");
4578         }
4579
4580         /* Keep the stored PCI config space at hand for restore after a sudden PCI error */
4581         if (amdgpu_device_cache_pci_state(adev->pdev))
4582                 pci_restore_state(pdev);
4583
4584         /* if we have > 1 VGA cards, then disable the amdgpu VGA resources */
4585         /* this will fail for cards that aren't VGA class devices, just
4586          * ignore it
4587          */
4588         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4589                 vga_client_register(adev->pdev, amdgpu_device_vga_set_decode);
4590
4591         px = amdgpu_device_supports_px(ddev);
4592
4593         if (px || (!dev_is_removable(&adev->pdev->dev) &&
4594                                 apple_gmux_detect(NULL, NULL)))
4595                 vga_switcheroo_register_client(adev->pdev,
4596                                                &amdgpu_switcheroo_ops, px);
4597
4598         if (px)
4599                 vga_switcheroo_init_domain_pm_ops(adev->dev, &adev->vga_pm_domain);
4600
4601         if (adev->init_lvl->level == AMDGPU_INIT_LEVEL_MINIMAL_XGMI)
4602                 amdgpu_xgmi_reset_on_init(adev);
4603
4604         amdgpu_device_check_iommu_direct_map(adev);
4605
4606         adev->pm_nb.notifier_call = amdgpu_device_pm_notifier;
4607         r = register_pm_notifier(&adev->pm_nb);
4608         if (r)
4609                 goto failed;
4610
4611         return 0;
4612
4613 release_ras_con:
4614         if (amdgpu_sriov_vf(adev))
4615                 amdgpu_virt_release_full_gpu(adev, true);
4616
4617         /* failed in exclusive mode due to timeout */
4618         if (amdgpu_sriov_vf(adev) &&
4619                 !amdgpu_sriov_runtime(adev) &&
4620                 amdgpu_virt_mmio_blocked(adev) &&
4621                 !amdgpu_virt_wait_reset(adev)) {
4622                 dev_err(adev->dev, "VF exclusive mode timeout\n");
4623                 /* Don't send request since VF is inactive. */
4624                 adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
4625                 adev->virt.ops = NULL;
4626                 r = -EAGAIN;
4627         }
4628         amdgpu_release_ras_context(adev);
4629
4630 failed:
4631         amdgpu_vf_error_trans_all(adev);
4632
4633         return r;
4634 }
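
/*
 * Editor's illustrative sketch (not driver code): the init path above follows
 * the usual kernel goto-unwind idiom.  A compressed skeleton of the pattern,
 * with example_step_a/b() and example_undo_a() as hypothetical stand-ins:
 */
static int __maybe_unused example_step_a(struct amdgpu_device *adev) { return 0; }
static int __maybe_unused example_step_b(struct amdgpu_device *adev) { return 0; }
static void __maybe_unused example_undo_a(struct amdgpu_device *adev) { }

static int __maybe_unused example_goto_unwind(struct amdgpu_device *adev)
{
        int r;

        r = example_step_a(adev);
        if (r)
                return r;       /* nothing acquired yet, plain return */

        r = example_step_b(adev);
        if (r)
                goto undo_a;    /* unwind already-acquired state, in reverse */

        return 0;

undo_a:
        example_undo_a(adev);
        return r;
}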
4635
4636 static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
4637 {
4638
4639         /* Clear all CPU mappings pointing to this device */
4640         unmap_mapping_range(adev->ddev.anon_inode->i_mapping, 0, 0, 1);
4641
4642         /* Unmap all mapped bars - Doorbell, registers and VRAM */
4643         amdgpu_doorbell_fini(adev);
4644
4645         iounmap(adev->rmmio);
4646         adev->rmmio = NULL;
4647         if (adev->mman.aper_base_kaddr)
4648                 iounmap(adev->mman.aper_base_kaddr);
4649         adev->mman.aper_base_kaddr = NULL;
4650
4651         /* Memory manager related */
4652         if (!adev->gmc.xgmi.connected_to_cpu && !adev->gmc.is_app_apu) {
4653                 arch_phys_wc_del(adev->gmc.vram_mtrr);
4654                 arch_io_free_memtype_wc(adev->gmc.aper_base, adev->gmc.aper_size);
4655         }
4656 }
4657
4658 /**
4659  * amdgpu_device_fini_hw - tear down the driver
4660  *
4661  * @adev: amdgpu_device pointer
4662  *
4663  * Tear down the driver info (all asics).
4664  * Called at driver shutdown.
4665  */
4666 void amdgpu_device_fini_hw(struct amdgpu_device *adev)
4667 {
4668         dev_info(adev->dev, "amdgpu: finishing device.\n");
4669         flush_delayed_work(&adev->delayed_init_work);
4670
4671         if (adev->mman.initialized)
4672                 drain_workqueue(adev->mman.bdev.wq);
4673         adev->shutdown = true;
4674
4675         unregister_pm_notifier(&adev->pm_nb);
4676
4677         /* make sure IB test finished before entering exclusive mode
4678          * to avoid preemption on IB test
4679          */
4680         if (amdgpu_sriov_vf(adev)) {
4681                 amdgpu_virt_request_full_gpu(adev, false);
4682                 amdgpu_virt_fini_data_exchange(adev);
4683         }
4684
4685         /* disable all interrupts */
4686         amdgpu_irq_disable_all(adev);
4687         if (adev->mode_info.mode_config_initialized) {
4688                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(adev)))
4689                         drm_helper_force_disable_all(adev_to_drm(adev));
4690                 else
4691                         drm_atomic_helper_shutdown(adev_to_drm(adev));
4692         }
4693         amdgpu_fence_driver_hw_fini(adev);
4694
4695         if (adev->pm.sysfs_initialized)
4696                 amdgpu_pm_sysfs_fini(adev);
4697         if (adev->ucode_sysfs_en)
4698                 amdgpu_ucode_sysfs_fini(adev);
4699         sysfs_remove_files(&adev->dev->kobj, amdgpu_dev_attributes);
4700         amdgpu_fru_sysfs_fini(adev);
4701
4702         amdgpu_reg_state_sysfs_fini(adev);
4703         amdgpu_xcp_cfg_sysfs_fini(adev);
4704
4705         /* disable ras feature must before hw fini */
4706         amdgpu_ras_pre_fini(adev);
4707
4708         amdgpu_ttm_set_buffer_funcs_status(adev, false);
4709
4710         amdgpu_device_ip_fini_early(adev);
4711
4712         amdgpu_irq_fini_hw(adev);
4713
4714         if (adev->mman.initialized)
4715                 ttm_device_clear_dma_mappings(&adev->mman.bdev);
4716
4717         amdgpu_gart_dummy_page_fini(adev);
4718
4719         if (drm_dev_is_unplugged(adev_to_drm(adev)))
4720                 amdgpu_device_unmap_mmio(adev);
4721
4722 }
4723
4724 void amdgpu_device_fini_sw(struct amdgpu_device *adev)
4725 {
4726         int idx;
4727         bool px;
4728
4729         amdgpu_device_ip_fini(adev);
4730         amdgpu_fence_driver_sw_fini(adev);
4731         amdgpu_ucode_release(&adev->firmware.gpu_info_fw);
4732         adev->accel_working = false;
4733         dma_fence_put(rcu_dereference_protected(adev->gang_submit, true));
4734
4735         amdgpu_reset_fini(adev);
4736
4737         /* free i2c buses */
4738         if (!amdgpu_device_has_dc_support(adev))
4739                 amdgpu_i2c_fini(adev);
4740
4741         if (amdgpu_emu_mode != 1)
4742                 amdgpu_atombios_fini(adev);
4743
4744         kfree(adev->bios);
4745         adev->bios = NULL;
4746
4747         kfree(adev->fru_info);
4748         adev->fru_info = NULL;
4749
4750         px = amdgpu_device_supports_px(adev_to_drm(adev));
4751
4752         if (px || (!dev_is_removable(&adev->pdev->dev) &&
4753                                 apple_gmux_detect(NULL, NULL)))
4754                 vga_switcheroo_unregister_client(adev->pdev);
4755
4756         if (px)
4757                 vga_switcheroo_fini_domain_pm_ops(adev->dev);
4758
4759         if ((adev->pdev->class >> 8) == PCI_CLASS_DISPLAY_VGA)
4760                 vga_client_unregister(adev->pdev);
4761
4762         if (drm_dev_enter(adev_to_drm(adev), &idx)) {
4763
4764                 iounmap(adev->rmmio);
4765                 adev->rmmio = NULL;
4766                 amdgpu_doorbell_fini(adev);
4767                 drm_dev_exit(idx);
4768         }
4769
4770         if (IS_ENABLED(CONFIG_PERF_EVENTS))
4771                 amdgpu_pmu_fini(adev);
4772         if (adev->mman.discovery_bin)
4773                 amdgpu_discovery_fini(adev);
4774
4775         amdgpu_reset_put_reset_domain(adev->reset_domain);
4776         adev->reset_domain = NULL;
4777
4778         kfree(adev->pci_state);
4779
4780 }
4781
4782 /**
4783  * amdgpu_device_evict_resources - evict device resources
4784  * @adev: amdgpu device object
4785  *
4786  * Evicts all ttm device resources (vram BOs, gart table) from the lru list
4787  * of the vram memory type. Mainly used for evicting device resources
4788  * at suspend time.
4789  *
4790  */
4791 static int amdgpu_device_evict_resources(struct amdgpu_device *adev)
4792 {
4793         int ret;
4794
4795         /* No need to evict vram on APUs unless going to S4 */
4796         if (!adev->in_s4 && (adev->flags & AMD_IS_APU))
4797                 return 0;
4798
4799         ret = amdgpu_ttm_evict_resources(adev, TTM_PL_VRAM);
4800         if (ret)
4801                 DRM_WARN("evicting device resources failed\n");
4802         return ret;
4803 }
4804
4805 /*
4806  * Suspend & resume.
4807  */
4808 /**
4809  * amdgpu_device_pm_notifier - Notification block for Suspend/Hibernate events
4810  * @nb: notifier block
4811  * @mode: suspend mode
4812  * @data: unused callback data
4813  *
4814  * This function is called when the system is about to suspend or hibernate.
4815  * It is used to evict resources from the device before the system goes to
4816  * sleep while there is still access to swap.
4817  */
4818 static int amdgpu_device_pm_notifier(struct notifier_block *nb, unsigned long mode,
4819                                      void *data)
4820 {
4821         struct amdgpu_device *adev = container_of(nb, struct amdgpu_device, pm_nb);
4822         int r;
4823
4824         switch (mode) {
4825         case PM_HIBERNATION_PREPARE:
4826                 adev->in_s4 = true;
4827                 fallthrough;
4828         case PM_SUSPEND_PREPARE:
4829                 r = amdgpu_device_evict_resources(adev);
4830                 /*
4831                  * Considered non-fatal at this time: amdgpu_device_prepare()
4832                  * will also evict resources and treat failure there as fatal.
4833                  * See https://gitlab.freedesktop.org/drm/amd/-/issues/3781
4834                  */
4835                 if (r)
4836                         drm_warn(adev_to_drm(adev), "Failed to evict resources, freeze active processes if problems occur: %d\n", r);
4837                 break;
4838         }
4839
4840         return NOTIFY_DONE;
4841 }
4842
4843 /**
4844  * amdgpu_device_prepare - prepare for device suspend
4845  *
4846  * @dev: drm dev pointer
4847  *
4848  * Prepare to put the hw in the suspend state (all asics).
4849  * Returns 0 for success or an error on failure.
4850  * Called at driver suspend.
4851  */
4852 int amdgpu_device_prepare(struct drm_device *dev)
4853 {
4854         struct amdgpu_device *adev = drm_to_adev(dev);
4855         int i, r;
4856
4857         amdgpu_choose_low_power_state(adev);
4858
4859         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4860                 return 0;
4861
4862         /* Evict the majority of BOs before starting suspend sequence */
4863         r = amdgpu_device_evict_resources(adev);
4864         if (r)
4865                 goto unprepare;
4866
4867         flush_delayed_work(&adev->gfx.gfx_off_delay_work);
4868
4869         for (i = 0; i < adev->num_ip_blocks; i++) {
4870                 if (!adev->ip_blocks[i].status.valid)
4871                         continue;
4872                 if (!adev->ip_blocks[i].version->funcs->prepare_suspend)
4873                         continue;
4874                 r = adev->ip_blocks[i].version->funcs->prepare_suspend(&adev->ip_blocks[i]);
4875                 if (r)
4876                         goto unprepare;
4877         }
4878
4879         return 0;
4880
4881 unprepare:
4882         adev->in_s0ix = adev->in_s3 = adev->in_s4 = false;
4883
4884         return r;
4885 }
4886
4887 /**
4888  * amdgpu_device_suspend - initiate device suspend
4889  *
4890  * @dev: drm dev pointer
4891  * @notify_clients: notify in-kernel DRM clients
4892  *
4893  * Puts the hw in the suspend state (all asics).
4894  * Returns 0 for success or an error on failure.
4895  * Called at driver suspend.
4896  */
4897 int amdgpu_device_suspend(struct drm_device *dev, bool notify_clients)
4898 {
4899         struct amdgpu_device *adev = drm_to_adev(dev);
4900         int r = 0;
4901
4902         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4903                 return 0;
4904
4905         adev->in_suspend = true;
4906
4907         if (amdgpu_sriov_vf(adev)) {
4908                 amdgpu_virt_fini_data_exchange(adev);
4909                 r = amdgpu_virt_request_full_gpu(adev, false);
4910                 if (r)
4911                         return r;
4912         }
4913
4914         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D3))
4915                 DRM_WARN("smart shift update failed\n");
4916
4917         if (notify_clients)
4918                 drm_client_dev_suspend(adev_to_drm(adev), false);
4919
4920         cancel_delayed_work_sync(&adev->delayed_init_work);
4921
4922         amdgpu_ras_suspend(adev);
4923
4924         amdgpu_device_ip_suspend_phase1(adev);
4925
4926         if (!adev->in_s0ix)
4927                 amdgpu_amdkfd_suspend(adev, adev->in_runpm);
4928
4929         r = amdgpu_device_evict_resources(adev);
4930         if (r)
4931                 return r;
4932
4933         amdgpu_ttm_set_buffer_funcs_status(adev, false);
4934
4935         amdgpu_fence_driver_hw_fini(adev);
4936
4937         amdgpu_device_ip_suspend_phase2(adev);
4938
4939         if (amdgpu_sriov_vf(adev))
4940                 amdgpu_virt_release_full_gpu(adev, false);
4941
4942         r = amdgpu_dpm_notify_rlc_state(adev, false);
4943         if (r)
4944                 return r;
4945
4946         return 0;
4947 }
4948
4949 /**
4950  * amdgpu_device_resume - initiate device resume
4951  *
4952  * @dev: drm dev pointer
4953  * @notify_clients: notify in-kernel DRM clients
4954  *
4955  * Bring the hw back to operating state (all asics).
4956  * Returns 0 for success or an error on failure.
4957  * Called at driver resume.
4958  */
4959 int amdgpu_device_resume(struct drm_device *dev, bool notify_clients)
4960 {
4961         struct amdgpu_device *adev = drm_to_adev(dev);
4962         int r = 0;
4963
4964         if (amdgpu_sriov_vf(adev)) {
4965                 r = amdgpu_virt_request_full_gpu(adev, true);
4966                 if (r)
4967                         return r;
4968         }
4969
4970         if (dev->switch_power_state == DRM_SWITCH_POWER_OFF)
4971                 return 0;
4972
4973         if (adev->in_s0ix)
4974                 amdgpu_dpm_gfx_state_change(adev, sGpuChangeState_D0Entry);
4975
4976         /* post card */
4977         if (amdgpu_device_need_post(adev)) {
4978                 r = amdgpu_device_asic_init(adev);
4979                 if (r)
4980                         dev_err(adev->dev, "amdgpu asic init failed\n");
4981         }
4982
4983         r = amdgpu_device_ip_resume(adev);
4984
4985         if (r) {
4986                 dev_err(adev->dev, "amdgpu_device_ip_resume failed (%d).\n", r);
4987                 goto exit;
4988         }
4989
4990         if (!adev->in_s0ix) {
4991                 r = amdgpu_amdkfd_resume(adev, adev->in_runpm);
4992                 if (r)
4993                         goto exit;
4994         }
4995
4996         r = amdgpu_device_ip_late_init(adev);
4997         if (r)
4998                 goto exit;
4999
5000         queue_delayed_work(system_wq, &adev->delayed_init_work,
5001                            msecs_to_jiffies(AMDGPU_RESUME_MS));
5002 exit:
5003         if (amdgpu_sriov_vf(adev)) {
5004                 amdgpu_virt_init_data_exchange(adev);
5005                 amdgpu_virt_release_full_gpu(adev, true);
5006         }
5007
5008         if (r)
5009                 return r;
5010
5011         /* Make sure IB tests flushed */
5012         flush_delayed_work(&adev->delayed_init_work);
5013
5014         if (notify_clients)
5015                 drm_client_dev_resume(adev_to_drm(adev), false);
5016
5017         amdgpu_ras_resume(adev);
5018
5019         if (adev->mode_info.num_crtc) {
5020                 /*
5021                  * Most of the connector probing functions try to acquire runtime pm
5022                  * refs to ensure that the GPU is powered on when connector polling is
5023                  * performed. Since we're calling this from a runtime PM callback,
5024                  * trying to acquire rpm refs will cause us to deadlock.
5025                  *
5026                  * Since we're guaranteed to be holding the rpm lock, it's safe to
5027                  * temporarily disable the rpm helpers so this doesn't deadlock us.
5028                  */
5029 #ifdef CONFIG_PM
5030                 dev->dev->power.disable_depth++;
5031 #endif
5032                 if (!adev->dc_enabled)
5033                         drm_helper_hpd_irq_event(dev);
5034                 else
5035                         drm_kms_helper_hotplug_event(dev);
5036 #ifdef CONFIG_PM
5037                 dev->dev->power.disable_depth--;
5038 #endif
5039         }
5040         adev->in_suspend = false;
5041
5042         if (adev->enable_mes)
5043                 amdgpu_mes_self_test(adev);
5044
5045         if (amdgpu_acpi_smart_shift_update(dev, AMDGPU_SS_DEV_D0))
5046                 DRM_WARN("smart shift update failed\n");
5047
5048         return 0;
5049 }
5050
5051 /**
5052  * amdgpu_device_ip_check_soft_reset - did soft reset succeed
5053  *
5054  * @adev: amdgpu_device pointer
5055  *
5056  * The list of all the hardware IPs that make up the asic is walked and
5057  * the check_soft_reset callbacks are run.  check_soft_reset determines
5058  * if the asic is still hung or not.
5059  * Returns true if any of the IPs are still in a hung state, false if not.
5060  */
5061 static bool amdgpu_device_ip_check_soft_reset(struct amdgpu_device *adev)
5062 {
5063         int i;
5064         bool asic_hang = false;
5065
5066         if (amdgpu_sriov_vf(adev))
5067                 return true;
5068
5069         if (amdgpu_asic_need_full_reset(adev))
5070                 return true;
5071
5072         for (i = 0; i < adev->num_ip_blocks; i++) {
5073                 if (!adev->ip_blocks[i].status.valid)
5074                         continue;
5075                 if (adev->ip_blocks[i].version->funcs->check_soft_reset)
5076                         adev->ip_blocks[i].status.hang =
5077                                 adev->ip_blocks[i].version->funcs->check_soft_reset(
5078                                         &adev->ip_blocks[i]);
5079                 if (adev->ip_blocks[i].status.hang) {
5080                         dev_info(adev->dev, "IP block:%s is hung!\n", adev->ip_blocks[i].version->funcs->name);
5081                         asic_hang = true;
5082                 }
5083         }
5084         return asic_hang;
5085 }
5086
5087 /**
5088  * amdgpu_device_ip_pre_soft_reset - prepare for soft reset
5089  *
5090  * @adev: amdgpu_device pointer
5091  *
5092  * The list of all the hardware IPs that make up the asic is walked and the
5093  * pre_soft_reset callbacks are run if the block is hung.  pre_soft_reset
5094  * handles any IP specific hardware or software state changes that are
5095  * necessary for a soft reset to succeed.
5096  * Returns 0 on success, negative error code on failure.
5097  */
5098 static int amdgpu_device_ip_pre_soft_reset(struct amdgpu_device *adev)
5099 {
5100         int i, r = 0;
5101
5102         for (i = 0; i < adev->num_ip_blocks; i++) {
5103                 if (!adev->ip_blocks[i].status.valid)
5104                         continue;
5105                 if (adev->ip_blocks[i].status.hang &&
5106                     adev->ip_blocks[i].version->funcs->pre_soft_reset) {
5107                         r = adev->ip_blocks[i].version->funcs->pre_soft_reset(&adev->ip_blocks[i]);
5108                         if (r)
5109                                 return r;
5110                 }
5111         }
5112
5113         return 0;
5114 }
5115
5116 /**
5117  * amdgpu_device_ip_need_full_reset - check if a full asic reset is needed
5118  *
5119  * @adev: amdgpu_device pointer
5120  *
5121  * Some hardware IPs cannot be soft reset.  If they are hung, a full gpu
5122  * reset is necessary to recover.
5123  * Returns true if a full asic reset is required, false if not.
5124  */
5125 static bool amdgpu_device_ip_need_full_reset(struct amdgpu_device *adev)
5126 {
5127         int i;
5128
5129         if (amdgpu_asic_need_full_reset(adev))
5130                 return true;
5131
5132         for (i = 0; i < adev->num_ip_blocks; i++) {
5133                 if (!adev->ip_blocks[i].status.valid)
5134                         continue;
5135                 if ((adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_GMC) ||
5136                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_SMC) ||
5137                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_ACP) ||
5138                     (adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_DCE) ||
5139                      adev->ip_blocks[i].version->type == AMD_IP_BLOCK_TYPE_PSP) {
5140                         if (adev->ip_blocks[i].status.hang) {
5141                         if (adev->ip_blocks[i].status.hang) {
5142                                 dev_info(adev->dev, "Some blocks need full reset!\n");
5142                                 return true;
5143                         }
5144                 }
5145         }
5146         return false;
5147 }
5148
5149 /**
5150  * amdgpu_device_ip_soft_reset - do a soft reset
5151  *
5152  * @adev: amdgpu_device pointer
5153  *
5154  * The list of all the hardware IPs that make up the asic is walked and the
5155  * soft_reset callbacks are run if the block is hung.  soft_reset handles any
5156  * IP specific hardware or software state changes that are necessary to soft
5157  * reset the IP.
5158  * Returns 0 on success, negative error code on failure.
5159  */
5160 static int amdgpu_device_ip_soft_reset(struct amdgpu_device *adev)
5161 {
5162         int i, r = 0;
5163
5164         for (i = 0; i < adev->num_ip_blocks; i++) {
5165                 if (!adev->ip_blocks[i].status.valid)
5166                         continue;
5167                 if (adev->ip_blocks[i].status.hang &&
5168                     adev->ip_blocks[i].version->funcs->soft_reset) {
5169                         r = adev->ip_blocks[i].version->funcs->soft_reset(&adev->ip_blocks[i]);
5170                         if (r)
5171                                 return r;
5172                 }
5173         }
5174
5175         return 0;
5176 }
5177
5178 /**
5179  * amdgpu_device_ip_post_soft_reset - clean up from soft reset
5180  *
5181  * @adev: amdgpu_device pointer
5182  *
5183  * The list of all the hardware IPs that make up the asic is walked and the
5184  * post_soft_reset callbacks are run if the asic was hung.  post_soft_reset
5185  * handles any IP specific hardware or software state changes that are
5186  * necessary after the IP has been soft reset.
5187  * Returns 0 on success, negative error code on failure.
5188  */
5189 static int amdgpu_device_ip_post_soft_reset(struct amdgpu_device *adev)
5190 {
5191         int i, r = 0;
5192
5193         for (i = 0; i < adev->num_ip_blocks; i++) {
5194                 if (!adev->ip_blocks[i].status.valid)
5195                         continue;
5196                 if (adev->ip_blocks[i].status.hang &&
5197                     adev->ip_blocks[i].version->funcs->post_soft_reset)
5198                         r = adev->ip_blocks[i].version->funcs->post_soft_reset(&adev->ip_blocks[i]);
5199                 if (r)
5200                         return r;
5201         }
5202
5203         return 0;
5204 }
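
/*
 * Editor's illustrative sketch (not driver code): how the four walkers above
 * chain together; amdgpu_device_pre_asic_reset() below drives this same
 * sequence and falls back to a full reset when it fails.
 */
static int __maybe_unused example_soft_reset_sequence(struct amdgpu_device *adev)
{
        int r;

        if (!amdgpu_device_ip_check_soft_reset(adev))
                return 0;       /* nothing is hung */

        amdgpu_device_ip_pre_soft_reset(adev);
        r = amdgpu_device_ip_soft_reset(adev);
        amdgpu_device_ip_post_soft_reset(adev);

        /* still hung?  the caller escalates to a full reset */
        if (r || amdgpu_device_ip_check_soft_reset(adev))
                return -EAGAIN;

        return 0;
}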
5205
5206 /**
5207  * amdgpu_device_reset_sriov - reset ASIC for SR-IOV vf
5208  *
5209  * @adev: amdgpu_device pointer
5210  * @reset_context: amdgpu reset context pointer
5211  *
5212  * Do a VF FLR and reinitialize the ASIC.
5213  * Returns 0 on success, negative error code on failure.
5214  */
5215 static int amdgpu_device_reset_sriov(struct amdgpu_device *adev,
5216                                      struct amdgpu_reset_context *reset_context)
5217 {
5218         int r;
5219         struct amdgpu_hive_info *hive = NULL;
5220
5221         if (test_bit(AMDGPU_HOST_FLR, &reset_context->flags)) {
5222                 if (!amdgpu_ras_get_fed_status(adev))
5223                         amdgpu_virt_ready_to_reset(adev);
5224                 amdgpu_virt_wait_reset(adev);
5225                 clear_bit(AMDGPU_HOST_FLR, &reset_context->flags);
5226                 r = amdgpu_virt_request_full_gpu(adev, true);
5227         } else {
5228                 r = amdgpu_virt_reset_gpu(adev);
5229         }
5230         if (r)
5231                 return r;
5232
5233         amdgpu_ras_clear_err_state(adev);
5234         amdgpu_irq_gpu_reset_resume_helper(adev);
5235
5236         /* some SW cleanup the VF needs to do before recovery */
5237         amdgpu_virt_post_reset(adev);
5238
5239         /* Resume IP prior to SMC */
5240         r = amdgpu_device_ip_reinit_early_sriov(adev);
5241         if (r)
5242                 return r;
5243
5244         amdgpu_virt_init_data_exchange(adev);
5245
5246         r = amdgpu_device_fw_loading(adev);
5247         if (r)
5248                 return r;
5249
5250         /* now we are okay to resume SMC/CP/SDMA */
5251         r = amdgpu_device_ip_reinit_late_sriov(adev);
5252         if (r)
5253                 return r;
5254
5255         hive = amdgpu_get_xgmi_hive(adev);
5256         /* Update PSP FW topology after reset */
5257         if (hive && adev->gmc.xgmi.num_physical_nodes > 1)
5258                 r = amdgpu_xgmi_update_topology(hive, adev);
5259         if (hive)
5260                 amdgpu_put_xgmi_hive(hive);
5261         if (r)
5262                 return r;
5263
5264         r = amdgpu_ib_ring_tests(adev);
5265         if (r)
5266                 return r;
5267
5268         if (adev->virt.gim_feature & AMDGIM_FEATURE_GIM_FLR_VRAMLOST)
5269                 amdgpu_inc_vram_lost(adev);
5270
5271         /* needs to be called during full access, so we can't defer it the
5272          * way bare-metal does.
5273          */
5274         amdgpu_amdkfd_post_reset(adev);
5275         amdgpu_virt_release_full_gpu(adev, true);
5276
5277         /* Aldebaran and gfx_11_0_3 support ras in SRIOV, so ras needs to be resumed during reset */
5278         if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 2) ||
5279             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
5280             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4) ||
5281             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(11, 0, 3))
5282                 amdgpu_ras_resume(adev);
5283
5284         amdgpu_virt_ras_telemetry_post_reset(adev);
5285
5286         return 0;
5287 }
5288
5289 /**
5290  * amdgpu_device_has_job_running - check if there is any unfinished job
5291  *
5292  * @adev: amdgpu_device pointer
5293  *
5294  * Check if any job is running on the device when the guest driver receives
5295  * an FLR notification from the host driver. If jobs are still running, the
5296  * guest driver will not respond to the FLR reset; instead, the jobs hit the
5297  * timeout and the guest driver then issues the reset request.
5298  */
5299 bool amdgpu_device_has_job_running(struct amdgpu_device *adev)
5300 {
5301         int i;
5302
5303         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5304                 struct amdgpu_ring *ring = adev->rings[i];
5305
5306                 if (!amdgpu_ring_sched_ready(ring))
5307                         continue;
5308
5309                 if (amdgpu_fence_count_emitted(ring))
5310                         return true;
5311         }
5312         return false;
5313 }
5314
5315 /**
5316  * amdgpu_device_should_recover_gpu - check if we should try GPU recovery
5317  *
5318  * @adev: amdgpu_device pointer
5319  *
5320  * Check amdgpu_gpu_recovery and SRIOV status to see if we should try to recover
5321  * a hung GPU.
5322  */
5323 bool amdgpu_device_should_recover_gpu(struct amdgpu_device *adev)
5324 {
5325
5326         if (amdgpu_gpu_recovery == 0)
5327                 goto disabled;
5328
5329         /* Skip soft reset check in fatal error mode */
5330         if (!amdgpu_ras_is_poison_mode_supported(adev))
5331                 return true;
5332
5333         if (amdgpu_sriov_vf(adev))
5334                 return true;
5335
5336         if (amdgpu_gpu_recovery == -1) {
5337                 switch (adev->asic_type) {
5338 #ifdef CONFIG_DRM_AMDGPU_SI
5339                 case CHIP_VERDE:
5340                 case CHIP_TAHITI:
5341                 case CHIP_PITCAIRN:
5342                 case CHIP_OLAND:
5343                 case CHIP_HAINAN:
5344 #endif
5345 #ifdef CONFIG_DRM_AMDGPU_CIK
5346                 case CHIP_KAVERI:
5347                 case CHIP_KABINI:
5348                 case CHIP_MULLINS:
5349 #endif
5350                 case CHIP_CARRIZO:
5351                 case CHIP_STONEY:
5352                 case CHIP_CYAN_SKILLFISH:
5353                         goto disabled;
5354                 default:
5355                         break;
5356                 }
5357         }
5358
5359         return true;
5360
5361 disabled:
5362         dev_info(adev->dev, "GPU recovery disabled.\n");
5363         return false;
5364 }
5365
5366 int amdgpu_device_mode1_reset(struct amdgpu_device *adev)
5367 {
5368         u32 i;
5369         int ret = 0;
5370
5371         amdgpu_atombios_scratch_regs_engine_hung(adev, true);
5372
5373         dev_info(adev->dev, "GPU mode1 reset\n");
5374
5375         /* Cache the state before bus master disable. The saved config space
5376          * values are used in other cases like restore after mode-2 reset.
5377          */
5378         amdgpu_device_cache_pci_state(adev->pdev);
5379
5380         /* disable BM */
5381         pci_clear_master(adev->pdev);
5382
5383         if (amdgpu_dpm_is_mode1_reset_supported(adev)) {
5384                 dev_info(adev->dev, "GPU smu mode1 reset\n");
5385                 ret = amdgpu_dpm_mode1_reset(adev);
5386         } else {
5387                 dev_info(adev->dev, "GPU psp mode1 reset\n");
5388                 ret = psp_gpu_reset(adev);
5389         }
5390
5391         if (ret)
5392                 goto mode1_reset_failed;
5393
5394         amdgpu_device_load_pci_state(adev->pdev);
5395         ret = amdgpu_psp_wait_for_bootloader(adev);
5396         if (ret)
5397                 goto mode1_reset_failed;
5398
5399         /* wait for asic to come out of reset */
5400         for (i = 0; i < adev->usec_timeout; i++) {
5401                 u32 memsize = adev->nbio.funcs->get_memsize(adev);
5402
5403                 if (memsize != 0xffffffff)
5404                         break;
5405                 udelay(1);
5406         }
5407
5408         if (i >= adev->usec_timeout) {
5409                 ret = -ETIMEDOUT;
5410                 goto mode1_reset_failed;
5411         }
5412
5413         amdgpu_atombios_scratch_regs_engine_hung(adev, false);
5414
5415         return 0;
5416
5417 mode1_reset_failed:
5418         dev_err(adev->dev, "GPU mode1 reset failed\n");
5419         return ret;
5420 }
5421
5422 int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev,
5423                                  struct amdgpu_reset_context *reset_context)
5424 {
5425         int i, r = 0;
5426         struct amdgpu_job *job = NULL;
5427         struct amdgpu_device *tmp_adev = reset_context->reset_req_dev;
5428         bool need_full_reset =
5429                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5430
5431         if (reset_context->reset_req_dev == adev)
5432                 job = reset_context->job;
5433
5434         if (amdgpu_sriov_vf(adev))
5435                 amdgpu_virt_pre_reset(adev);
5436
5437         amdgpu_fence_driver_isr_toggle(adev, true);
5438
5439         /* block all schedulers and reset given job's ring */
5440         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5441                 struct amdgpu_ring *ring = adev->rings[i];
5442
5443                 if (!amdgpu_ring_sched_ready(ring))
5444                         continue;
5445
5446                 /* Clear job fences from the fence drv so that force_completion
5447                  * leaves only NULL and vm flush fences in the fence drv
5448                  */
5449                 amdgpu_fence_driver_clear_job_fences(ring);
5450
5451                 /* after all hw jobs are reset, hw fence is meaningless, so force_completion */
5452                 amdgpu_fence_driver_force_completion(ring);
5453         }
5454
5455         amdgpu_fence_driver_isr_toggle(adev, false);
5456
5457         if (job && job->vm)
5458                 drm_sched_increase_karma(&job->base);
5459
5460         r = amdgpu_reset_prepare_hwcontext(adev, reset_context);
5461         /* If reset handler not implemented, continue; otherwise return */
5462         if (r == -EOPNOTSUPP)
5463                 r = 0;
5464         else
5465                 return r;
5466
5467         /* Don't suspend on bare metal if we are not going to HW reset the ASIC */
5468         if (!amdgpu_sriov_vf(adev)) {
5469
5470                 if (!need_full_reset)
5471                         need_full_reset = amdgpu_device_ip_need_full_reset(adev);
5472
5473                 if (!need_full_reset && amdgpu_gpu_recovery &&
5474                     amdgpu_device_ip_check_soft_reset(adev)) {
5475                         amdgpu_device_ip_pre_soft_reset(adev);
5476                         r = amdgpu_device_ip_soft_reset(adev);
5477                         amdgpu_device_ip_post_soft_reset(adev);
5478                         if (r || amdgpu_device_ip_check_soft_reset(adev)) {
5479                                 dev_info(adev->dev, "soft reset failed, will fallback to full reset!\n");
5480                                 need_full_reset = true;
5481                         }
5482                 }
5483
5484                 if (!test_bit(AMDGPU_SKIP_COREDUMP, &reset_context->flags)) {
5485                         dev_info(tmp_adev->dev, "Dumping IP State\n");
5486                         /* Trigger ip dump before we reset the asic */
5487                         for (i = 0; i < tmp_adev->num_ip_blocks; i++)
5488                                 if (tmp_adev->ip_blocks[i].version->funcs->dump_ip_state)
5489                                         tmp_adev->ip_blocks[i].version->funcs
5490                                                 ->dump_ip_state((void *)&tmp_adev->ip_blocks[i]);
5491                         dev_info(tmp_adev->dev, "Dumping IP State Completed\n");
5492                 }
5493
5494                 if (need_full_reset) {
5495                         r = amdgpu_device_ip_suspend(adev);
5496                         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5497                 } else {
5498                         clear_bit(AMDGPU_NEED_FULL_RESET,
5499                                   &reset_context->flags);
5500                 }
5501         }
5502
5503         return r;
5504 }
5505
5506 int amdgpu_device_reinit_after_reset(struct amdgpu_reset_context *reset_context)
5507 {
5508         struct list_head *device_list_handle;
5509         bool full_reset, vram_lost = false;
5510         struct amdgpu_device *tmp_adev;
5511         int r, init_level;
5512
5513         device_list_handle = reset_context->reset_device_list;
5514
5515         if (!device_list_handle)
5516                 return -EINVAL;
5517
5518         full_reset = test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5519
5520         /*
5521          * If this is a reset on init, use the default init level; otherwise
5522          * keep the level as the recovery level.
5523          */
5524         if (reset_context->method == AMD_RESET_METHOD_ON_INIT)
5525                 init_level = AMDGPU_INIT_LEVEL_DEFAULT;
5526         else
5527                 init_level = AMDGPU_INIT_LEVEL_RESET_RECOVERY;
5528
5529         r = 0;
5530         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5531                 amdgpu_set_init_level(tmp_adev, init_level);
5532                 if (full_reset) {
5533                         /* post card */
5534                         amdgpu_ras_clear_err_state(tmp_adev);
5535                         r = amdgpu_device_asic_init(tmp_adev);
5536                         if (r) {
5537                                 dev_warn(tmp_adev->dev, "asic atom init failed!");
5538                         } else {
5539                                 dev_info(tmp_adev->dev, "GPU reset succeeded, trying to resume\n");
5540
5541                                 r = amdgpu_device_ip_resume_phase1(tmp_adev);
5542                                 if (r)
5543                                         goto out;
5544
5545                                 vram_lost = amdgpu_device_check_vram_lost(tmp_adev);
5546
5547                                 if (!test_bit(AMDGPU_SKIP_COREDUMP, &reset_context->flags))
5548                                         amdgpu_coredump(tmp_adev, false, vram_lost, reset_context->job);
5549
5550                                 if (vram_lost) {
5551                                         DRM_INFO("VRAM is lost due to GPU reset!\n");
5552                                         amdgpu_inc_vram_lost(tmp_adev);
5553                                 }
5554
5555                                 r = amdgpu_device_fw_loading(tmp_adev);
5556                                 if (r)
5557                                         return r;
5558
5559                                 r = amdgpu_xcp_restore_partition_mode(
5560                                         tmp_adev->xcp_mgr);
5561                                 if (r)
5562                                         goto out;
5563
5564                                 r = amdgpu_device_ip_resume_phase2(tmp_adev);
5565                                 if (r)
5566                                         goto out;
5567
5568                                 if (tmp_adev->mman.buffer_funcs_ring->sched.ready)
5569                                         amdgpu_ttm_set_buffer_funcs_status(tmp_adev, true);
5570
5571                                 r = amdgpu_device_ip_resume_phase3(tmp_adev);
5572                                 if (r)
5573                                         goto out;
5574
5575                                 if (vram_lost)
5576                                         amdgpu_device_fill_reset_magic(tmp_adev);
5577
5578                                 /*
5579                                  * Add this ASIC back as tracked, as the reset
5580                                  * has already completed successfully.
5581                                  */
5582                                 amdgpu_register_gpu_instance(tmp_adev);
5583
5584                                 if (!reset_context->hive &&
5585                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
5586                                         amdgpu_xgmi_add_device(tmp_adev);
5587
5588                                 r = amdgpu_device_ip_late_init(tmp_adev);
5589                                 if (r)
5590                                         goto out;
5591
5592                                 drm_client_dev_resume(adev_to_drm(tmp_adev), false);
5593
5594                                 /*
5595                                  * The GPU enters a bad state once the number of
5596                                  * faulty pages reported by ECC reaches the
5597                                  * threshold, and ras recovery is scheduled next.
5598                                  * So check here whether the bad page threshold
5599                                  * has indeed been exceeded, and if so break off
5600                                  * recovery to remind the user to retire this GPU
5601                                  * or set a bigger bad_page_threshold value when
5602                                  * probing the driver again.
5603                                  */
5604                                 if (!amdgpu_ras_is_rma(tmp_adev)) {
5605                                         /* must succeed. */
5606                                         amdgpu_ras_resume(tmp_adev);
5607                                 } else {
5608                                         r = -EINVAL;
5609                                         goto out;
5610                                 }
5611
5612                                 /* Update PSP FW topology after reset */
5613                                 if (reset_context->hive &&
5614                                     tmp_adev->gmc.xgmi.num_physical_nodes > 1)
5615                                         r = amdgpu_xgmi_update_topology(
5616                                                 reset_context->hive, tmp_adev);
5617                         }
5618                 }
5619
5620 out:
5621                 if (!r) {
5622                         /* IP init is complete now, set level as default */
5623                         amdgpu_set_init_level(tmp_adev,
5624                                               AMDGPU_INIT_LEVEL_DEFAULT);
5625                         amdgpu_irq_gpu_reset_resume_helper(tmp_adev);
5626                         r = amdgpu_ib_ring_tests(tmp_adev);
5627                         if (r) {
5628                                 dev_err(tmp_adev->dev, "ib ring test failed (%d).\n", r);
5629                                 r = -EAGAIN;
5630                                 goto end;
5631                         }
5632                 }
5633
5634                 if (r)
5635                         tmp_adev->asic_reset_res = r;
5636         }
5637
5638 end:
5639         return r;
5640 }
5641
5642 int amdgpu_do_asic_reset(struct list_head *device_list_handle,
5643                          struct amdgpu_reset_context *reset_context)
5644 {
5645         struct amdgpu_device *tmp_adev = NULL;
5646         bool need_full_reset, skip_hw_reset;
5647         int r = 0;
5648
5649         /* Try reset handler method first */
5650         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5651                                     reset_list);
5652
5653         reset_context->reset_device_list = device_list_handle;
5654         r = amdgpu_reset_perform_reset(tmp_adev, reset_context);
5655         /* If reset handler not implemented, continue; otherwise return */
5656         if (r == -EOPNOTSUPP)
5657                 r = 0;
5658         else
5659                 return r;
5660
5661         /* Reset handler not implemented, use the default method */
5662         need_full_reset =
5663                 test_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5664         skip_hw_reset = test_bit(AMDGPU_SKIP_HW_RESET, &reset_context->flags);
5665
5666         /*
5667          * ASIC reset has to be done on all XGMI hive nodes ASAP
5668          * to allow proper links negotiation in FW (within 1 sec)
5669          */
5670         if (!skip_hw_reset && need_full_reset) {
5671                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5672                         /* For XGMI run all resets in parallel to speed up the process */
5673                         if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
5674                                 if (!queue_work(system_unbound_wq,
5675                                                 &tmp_adev->xgmi_reset_work))
5676                                         r = -EALREADY;
5677                         } else
5678                                 r = amdgpu_asic_reset(tmp_adev);
5679
5680                         if (r) {
5681                                 dev_err(tmp_adev->dev,
5682                                         "ASIC reset failed with error, %d for drm dev, %s",
5683                                         r, adev_to_drm(tmp_adev)->unique);
5684                                 goto out;
5685                         }
5686                 }
5687
5688                 /* For XGMI wait for all resets to complete before proceed */
5689                 if (!r) {
5690                         list_for_each_entry(tmp_adev, device_list_handle,
5691                                             reset_list) {
5692                                 if (tmp_adev->gmc.xgmi.num_physical_nodes > 1) {
5693                                         flush_work(&tmp_adev->xgmi_reset_work);
5694                                         r = tmp_adev->asic_reset_res;
5695                                         if (r)
5696                                                 break;
5697                                 }
5698                         }
5699                 }
5700         }
5701
5702         if (!r && amdgpu_ras_intr_triggered()) {
5703                 list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5704                         amdgpu_ras_reset_error_count(tmp_adev,
5705                                                      AMDGPU_RAS_BLOCK__MMHUB);
5706                 }
5707
5708                 amdgpu_ras_intr_cleared();
5709         }
5710
5711         r = amdgpu_device_reinit_after_reset(reset_context);
5712         if (r == -EAGAIN)
5713                 set_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5714         else
5715                 clear_bit(AMDGPU_NEED_FULL_RESET, &reset_context->flags);
5716
5717 out:
5718         return r;
5719 }
5720
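/*
 * MP1 here is the SMU's management processor.  Its state is set to match the
 * pending reset method (SHUTDOWN for a full mode1 reset, RESET for the
 * lighter mode2 reset) so the firmware knows what kind of reset is coming,
 * and is cleared again in amdgpu_device_unset_mp1_state() afterwards.
 */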
5721 static void amdgpu_device_set_mp1_state(struct amdgpu_device *adev)
5722 {
5723
5724         switch (amdgpu_asic_reset_method(adev)) {
5725         case AMD_RESET_METHOD_MODE1:
5726                 adev->mp1_state = PP_MP1_STATE_SHUTDOWN;
5727                 break;
5728         case AMD_RESET_METHOD_MODE2:
5729                 adev->mp1_state = PP_MP1_STATE_RESET;
5730                 break;
5731         default:
5732                 adev->mp1_state = PP_MP1_STATE_NONE;
5733                 break;
5734         }
5735 }
5736
5737 static void amdgpu_device_unset_mp1_state(struct amdgpu_device *adev)
5738 {
5739         amdgpu_vf_error_trans_all(adev);
5740         adev->mp1_state = PP_MP1_STATE_NONE;
5741 }
5742
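/*
 * The GPU's HDMI/DP audio controller lives at PCI function 1 of the same
 * device (hence the hard-coded 1 in pci_get_domain_bus_and_slot() below);
 * these two helpers force it out of and into runtime suspend around a GPU
 * reset.
 */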
5743 static void amdgpu_device_resume_display_audio(struct amdgpu_device *adev)
5744 {
5745         struct pci_dev *p = NULL;
5746
5747         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5748                         adev->pdev->bus->number, 1);
5749         if (p) {
5750                 pm_runtime_enable(&(p->dev));
5751                 pm_runtime_resume(&(p->dev));
5752         }
5753
5754         pci_dev_put(p);
5755 }
5756
5757 static int amdgpu_device_suspend_display_audio(struct amdgpu_device *adev)
5758 {
5759         enum amd_reset_method reset_method;
5760         struct pci_dev *p = NULL;
5761         u64 expires;
5762
5763         /*
5764          * For now, only BACO and mode1 reset are confirmed
5765          * to suffer the audio issue if not properly suspended.
5766          */
5767         reset_method = amdgpu_asic_reset_method(adev);
5768         if ((reset_method != AMD_RESET_METHOD_BACO) &&
5769              (reset_method != AMD_RESET_METHOD_MODE1))
5770                 return -EINVAL;
5771
5772         p = pci_get_domain_bus_and_slot(pci_domain_nr(adev->pdev->bus),
5773                         adev->pdev->bus->number, 1);
5774         if (!p)
5775                 return -ENODEV;
5776
5777         expires = pm_runtime_autosuspend_expiration(&(p->dev));
5778         if (!expires)
5779                 /*
5780                  * If we cannot get the audio device autosuspend delay,
5781                  * a fixed 4s interval is used. Since 3s is the audio
5782                  * controller's default autosuspend delay setting, the
5783                  * 4s used here is guaranteed to cover it.
5784                  */
5785                 expires = ktime_get_mono_fast_ns() + NSEC_PER_SEC * 4ULL;
5786
5787         while (!pm_runtime_status_suspended(&(p->dev))) {
5788                 if (!pm_runtime_suspend(&(p->dev)))
5789                         break;
5790
5791                 if (expires < ktime_get_mono_fast_ns()) {
5792                         dev_warn(adev->dev, "failed to suspend display audio\n");
5793                         pci_dev_put(p);
5794                         /* TODO: abort the succeeding gpu reset? */
5795                         return -ETIMEDOUT;
5796                 }
5797         }
5798
5799         pm_runtime_disable(&(p->dev));
5800
5801         pci_dev_put(p);
5802         return 0;
5803 }
5804
5805 static inline void amdgpu_device_stop_pending_resets(struct amdgpu_device *adev)
5806 {
5807         struct amdgpu_ras *con = amdgpu_ras_get_context(adev);
5808
5809 #if defined(CONFIG_DEBUG_FS)
5810         if (!amdgpu_sriov_vf(adev))
5811                 cancel_work(&adev->reset_work);
5812 #endif
5813
5814         if (adev->kfd.dev)
5815                 cancel_work(&adev->kfd.reset_work);
5816
5817         if (amdgpu_sriov_vf(adev))
5818                 cancel_work(&adev->virt.flr_work);
5819
5820         if (con && adev->ras_enabled)
5821                 cancel_work(&con->recovery_work);
5822
5823 }
5824
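/*
 * A config-space read that returns all 1s (PCI_POSSIBLE_ERROR) indicates the
 * device no longer responds on the bus, in which case any reset attempt is
 * pointless and recovery is aborted early.
 */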
5825 static int amdgpu_device_health_check(struct list_head *device_list_handle)
5826 {
5827         struct amdgpu_device *tmp_adev;
5828         int ret = 0;
5829         u32 status;
5830
5831         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5832                 pci_read_config_dword(tmp_adev->pdev, PCI_COMMAND, &status);
5833                 if (PCI_POSSIBLE_ERROR(status)) {
5834                         dev_err(tmp_adev->dev, "device lost from bus!");
5835                         ret = -ENODEV;
5836                 }
5837         }
5838
5839         return ret;
5840 }
5841
5842 /**
5843  * amdgpu_device_gpu_recover - reset the asic and recover scheduler
5844  *
5845  * @adev: amdgpu_device pointer
5846  * @job: the job which triggered the hang, if any
5847  * @reset_context: amdgpu reset context pointer
5848  *
5849  * Attempt to reset the GPU if it has hung (all ASICs).
5850  * Attempt to do a soft reset or a full reset and reinitialize the ASIC.
5851  * Returns 0 for success or an error on failure.
5852  */
5853
5854 int amdgpu_device_gpu_recover(struct amdgpu_device *adev,
5855                               struct amdgpu_job *job,
5856                               struct amdgpu_reset_context *reset_context)
5857 {
5858         struct list_head device_list, *device_list_handle = NULL;
5859         bool job_signaled = false;
5860         struct amdgpu_hive_info *hive = NULL;
5861         struct amdgpu_device *tmp_adev = NULL;
5862         int i, r = 0;
5863         bool need_emergency_restart = false;
5864         bool audio_suspended = false;
5865         int retry_limit = AMDGPU_MAX_RETRY_LIMIT;
5866
5867         /*
5868          * If it reaches here because of hang/timeout and a RAS error is
5869          * detected at the same time, let RAS recovery take care of it.
5870          */
5871         if (amdgpu_ras_is_err_state(adev, AMDGPU_RAS_BLOCK__ANY) &&
5872             !amdgpu_sriov_vf(adev) &&
5873             reset_context->src != AMDGPU_RESET_SRC_RAS) {
5874                 dev_dbg(adev->dev,
5875                         "Gpu recovery from source: %d yielding to RAS error recovery handling",
5876                         reset_context->src);
5877                 return 0;
5878         }
5879         /*
5880          * Special case: RAS triggered and full reset isn't supported
5881          */
5882         need_emergency_restart = amdgpu_ras_need_emergency_restart(adev);
5883
5884         /*
5885          * Flush RAM to disk so that after reboot
5886          * the user can read the log and see why the system rebooted.
5887          */
5888         if (need_emergency_restart && amdgpu_ras_get_context(adev) &&
5889                 amdgpu_ras_get_context(adev)->reboot) {
5890                 DRM_WARN("Emergency reboot.");
5891
5892                 ksys_sync_helper();
5893                 emergency_restart();
5894         }
5895
5896         dev_info(adev->dev, "GPU %s begin!\n",
5897                 need_emergency_restart ? "jobs stop":"reset");
5898
5899         if (!amdgpu_sriov_vf(adev))
5900                 hive = amdgpu_get_xgmi_hive(adev);
5901         if (hive)
5902                 mutex_lock(&hive->hive_lock);
5903
5904         reset_context->job = job;
5905         reset_context->hive = hive;
5906         /*
5907          * Build list of devices to reset.
5908          * In XGMI hive mode, reorder the device list
5909          * so that adev is in the first position.
5910          */
5911         INIT_LIST_HEAD(&device_list);
5912         if (!amdgpu_sriov_vf(adev) && (adev->gmc.xgmi.num_physical_nodes > 1) && hive) {
5913                 list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head) {
5914                         list_add_tail(&tmp_adev->reset_list, &device_list);
5915                         if (adev->shutdown)
5916                                 tmp_adev->shutdown = true;
5917                 }
5918                 if (!list_is_first(&adev->reset_list, &device_list))
5919                         list_rotate_to_front(&adev->reset_list, &device_list);
5920                 device_list_handle = &device_list;
5921         } else {
5922                 list_add_tail(&adev->reset_list, &device_list);
5923                 device_list_handle = &device_list;
5924         }
5925
5926         if (!amdgpu_sriov_vf(adev)) {
5927                 r = amdgpu_device_health_check(device_list_handle);
5928                 if (r)
5929                         goto end_reset;
5930         }
5931
5932         /* We need to lock the reset domain only once, for both XGMI and single device */
5933         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
5934                                     reset_list);
5935         amdgpu_device_lock_reset_domain(tmp_adev->reset_domain);
5936
5937         /* block all schedulers and reset given job's ring */
5938         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
5939
5940                 amdgpu_device_set_mp1_state(tmp_adev);
5941
5942                 /*
5943                  * Try to put the audio codec into suspend state
5944                  * before the GPU reset starts.
5945                  *
5946                  * This is needed because the power domain of the
5947                  * graphics device is shared with the AZ power domain.
5948                  * Without it, we may change the audio hardware behind
5949                  * the audio driver's back, triggering audio codec errors.
5950                  */
5951                  */
5952                 if (!amdgpu_device_suspend_display_audio(tmp_adev))
5953                         audio_suspended = true;
5954
5955                 amdgpu_ras_set_error_query_ready(tmp_adev, false);
5956
5957                 cancel_delayed_work_sync(&tmp_adev->delayed_init_work);
5958
5959                 amdgpu_amdkfd_pre_reset(tmp_adev, reset_context);
5960
5961                 /*
5962                  * Mark these ASICs to be reset as untracked first,
5963                  * and add them back after the reset completes.
5964                  */
5965                 amdgpu_unregister_gpu_instance(tmp_adev);
5966
5967                 drm_client_dev_suspend(adev_to_drm(tmp_adev), false);
5968
5969                 /* disable ras on ALL IPs */
5970                 if (!need_emergency_restart &&
5971                       amdgpu_device_ip_need_full_reset(tmp_adev))
5972                         amdgpu_ras_suspend(tmp_adev);
5973
5974                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
5975                         struct amdgpu_ring *ring = tmp_adev->rings[i];
5976
5977                         if (!amdgpu_ring_sched_ready(ring))
5978                                 continue;
5979
5980                         drm_sched_stop(&ring->sched, job ? &job->base : NULL);
5981
5982                         if (need_emergency_restart)
5983                                 amdgpu_job_stop_all_jobs_on_sched(&ring->sched);
5984                 }
5985                 atomic_inc(&tmp_adev->gpu_reset_counter);
5986         }
5987
5988         if (need_emergency_restart)
5989                 goto skip_sched_resume;
5990
5991         /*
5992          * Must check guilty signal here since after this point all old
5993          * HW fences are force signaled.
5994          *
5995          * job->base holds a reference to parent fence
5996          */
5997         if (job && dma_fence_is_signaled(&job->hw_fence)) {
5998                 job_signaled = true;
5999                 dev_info(adev->dev, "Guilty job already signaled, skipping HW reset");
6000                 goto skip_hw_reset;
6001         }
6002
6003 retry:  /* Rest of adevs pre asic reset from XGMI hive. */
6004         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
6005                 r = amdgpu_device_pre_asic_reset(tmp_adev, reset_context);
6006                 /* TODO: should we stop? */
6007                 if (r) {
6008                         dev_err(tmp_adev->dev, "GPU pre asic reset failed with err, %d for drm dev, %s ",
6009                                   r, adev_to_drm(tmp_adev)->unique);
6010                         tmp_adev->asic_reset_res = r;
6011                 }
6012         }
6013
6014         /* Actual ASIC resets if needed. */
6015         /* Host driver will handle XGMI hive reset for SRIOV */
6016         if (amdgpu_sriov_vf(adev)) {
6017                 if (amdgpu_ras_get_fed_status(adev) || amdgpu_virt_rcvd_ras_interrupt(adev)) {
6018                         dev_dbg(adev->dev, "Detected RAS error, wait for FLR completion\n");
6019                         amdgpu_ras_set_fed(adev, true);
6020                         set_bit(AMDGPU_HOST_FLR, &reset_context->flags);
6021                 }
6022
6023                 r = amdgpu_device_reset_sriov(adev, reset_context);
6024                 if (AMDGPU_RETRY_SRIOV_RESET(r) && (retry_limit--) > 0) {
6025                         amdgpu_virt_release_full_gpu(adev, true);
6026                         goto retry;
6027                 }
6028                 if (r)
6029                         adev->asic_reset_res = r;
6030         } else {
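                /*
                 * amdgpu_do_asic_reset() returns -EAGAIN when the post-reset
                 * IB ring tests fail; in that case the whole pre-reset plus
                 * reset sequence is retried from the "retry" label above.
                 */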
6031                 r = amdgpu_do_asic_reset(device_list_handle, reset_context);
6032                 if (r == -EAGAIN)
6033                         goto retry;
6034         }
6035
6036         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
6037                 /*
6038                  * Drop any pending non scheduler resets queued before reset is done.
6039                  * Any reset scheduled after this point would be valid. Scheduler resets
6040                  * were already dropped during drm_sched_stop and no new ones can come
6041                  * in before drm_sched_start.
6042                  */
6043                 amdgpu_device_stop_pending_resets(tmp_adev);
6044         }
6045
6046 skip_hw_reset:
6047
6048         /* Post ASIC reset for all devs. */
6049         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
6050
6051                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
6052                         struct amdgpu_ring *ring = tmp_adev->rings[i];
6053
6054                         if (!amdgpu_ring_sched_ready(ring))
6055                                 continue;
6056
6057                         drm_sched_start(&ring->sched, 0);
6058                 }
6059
6060                 if (!drm_drv_uses_atomic_modeset(adev_to_drm(tmp_adev)) && !job_signaled)
6061                         drm_helper_resume_force_mode(adev_to_drm(tmp_adev));
6062
6063                 if (tmp_adev->asic_reset_res)
6064                         r = tmp_adev->asic_reset_res;
6065
6066                 tmp_adev->asic_reset_res = 0;
6067
6068                 if (r) {
6069                         /* Bad news: how do we tell userspace?
6070                          * For a RAS error, report the bad GPU status
6071                          * instead of the reset failure.
6072                          */
6073                         if (reset_context->src != AMDGPU_RESET_SRC_RAS ||
6074                             !amdgpu_ras_eeprom_check_err_threshold(tmp_adev))
6075                                 dev_info(tmp_adev->dev, "GPU reset(%d) failed\n",
6076                                         atomic_read(&tmp_adev->gpu_reset_counter));
6077                         amdgpu_vf_error_put(tmp_adev, AMDGIM_ERROR_VF_GPU_RESET_FAIL, 0, r);
6078                 } else {
6079                         dev_info(tmp_adev->dev, "GPU reset(%d) succeeded!\n", atomic_read(&tmp_adev->gpu_reset_counter));
6080                         if (amdgpu_acpi_smart_shift_update(adev_to_drm(tmp_adev), AMDGPU_SS_DEV_D0))
6081                                 DRM_WARN("smart shift update failed\n");
6082                 }
6083         }
6084
6085 skip_sched_resume:
6086         list_for_each_entry(tmp_adev, device_list_handle, reset_list) {
6087                 /* unlock kfd: SRIOV would do it separately */
6088                 if (!need_emergency_restart && !amdgpu_sriov_vf(tmp_adev))
6089                         amdgpu_amdkfd_post_reset(tmp_adev);
6090
6091                 /* kfd_post_reset will do nothing if the kfd device is not
6092                  * initialized, so bring up kfd here if it was not initialized before
6093                  */
6094                 if (!adev->kfd.init_complete)
6095                         amdgpu_amdkfd_device_init(adev);
6096
6097                 if (audio_suspended)
6098                         amdgpu_device_resume_display_audio(tmp_adev);
6099
6100                 amdgpu_device_unset_mp1_state(tmp_adev);
6101
6102                 amdgpu_ras_set_error_query_ready(tmp_adev, true);
6103         }
6104
6105         tmp_adev = list_first_entry(device_list_handle, struct amdgpu_device,
6106                                             reset_list);
6107         amdgpu_device_unlock_reset_domain(tmp_adev->reset_domain);
6108
6109 end_reset:
6110         if (hive) {
6111                 mutex_unlock(&hive->hive_lock);
6112                 amdgpu_put_xgmi_hive(hive);
6113         }
6114
6115         if (r)
6116                 dev_info(adev->dev, "GPU reset end with ret = %d\n", r);
6117
6118         atomic_set(&adev->reset_domain->reset_res, r);
6119         return r;
6120 }
6121
6122 /**
6123  * amdgpu_device_partner_bandwidth - find the bandwidth of appropriate partner
6124  *
6125  * @adev: amdgpu_device pointer
6126  * @speed: pointer to the speed of the link
6127  * @width: pointer to the width of the link
6128  *
6129  * Evaluate the hierarchy to find the speed and width capabilities of the
6130  * first physical partner to an AMD dGPU.
6131  * This will exclude any virtual switches and links.
6132  */
6133 static void amdgpu_device_partner_bandwidth(struct amdgpu_device *adev,
6134                                             enum pci_bus_speed *speed,
6135                                             enum pcie_link_width *width)
6136 {
6137         struct pci_dev *parent = adev->pdev;
6138
6139         if (!speed || !width)
6140                 return;
6141
6142         *speed = PCI_SPEED_UNKNOWN;
6143         *width = PCIE_LNK_WIDTH_UNKNOWN;
6144
6145         if (amdgpu_device_pcie_dynamic_switching_supported(adev)) {
6146                 while ((parent = pci_upstream_bridge(parent))) {
6147                         /* skip upstream/downstream switches internal to dGPU*/
6148                         if (parent->vendor == PCI_VENDOR_ID_ATI)
6149                                 continue;
6150                         *speed = pcie_get_speed_cap(parent);
6151                         *width = pcie_get_width_cap(parent);
6152                         break;
6153                 }
6154         } else {
6155                 /* use the current speeds rather than max if switching is not supported */
6156                 pcie_bandwidth_available(adev->pdev, NULL, speed, width);
6157         }
6158 }
6159
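/*
 * Note: pm.pcie_gen_mask and pm.pcie_mlw_mask computed below are CAIL-style
 * capability bitmasks with one bit per supported link gen/width; they are
 * consumed later by the power-management code when selecting PCIe link
 * speeds and widths.
 */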
6160 /**
6161  * amdgpu_device_get_pcie_info - fetch pcie info about the PCIE slot
6162  *
6163  * @adev: amdgpu_device pointer
6164  *
6165  * Fetches and stores in the driver the PCIE capabilities (gen speed
6166  * and lanes) of the slot the device is in. Handles APUs and
6167  * virtualized environments where PCIE config space may not be available.
6168  */
6169 static void amdgpu_device_get_pcie_info(struct amdgpu_device *adev)
6170 {
6171         struct pci_dev *pdev;
6172         enum pci_bus_speed speed_cap, platform_speed_cap;
6173         enum pcie_link_width platform_link_width;
6174
6175         if (amdgpu_pcie_gen_cap)
6176                 adev->pm.pcie_gen_mask = amdgpu_pcie_gen_cap;
6177
6178         if (amdgpu_pcie_lane_cap)
6179                 adev->pm.pcie_mlw_mask = amdgpu_pcie_lane_cap;
6180
6181         /* covers APUs as well */
6182         if (pci_is_root_bus(adev->pdev->bus) && !amdgpu_passthrough(adev)) {
6183                 if (adev->pm.pcie_gen_mask == 0)
6184                         adev->pm.pcie_gen_mask = AMDGPU_DEFAULT_PCIE_GEN_MASK;
6185                 if (adev->pm.pcie_mlw_mask == 0)
6186                         adev->pm.pcie_mlw_mask = AMDGPU_DEFAULT_PCIE_MLW_MASK;
6187                 return;
6188         }
6189
6190         if (adev->pm.pcie_gen_mask && adev->pm.pcie_mlw_mask)
6191                 return;
6192
6193         amdgpu_device_partner_bandwidth(adev, &platform_speed_cap,
6194                                         &platform_link_width);
6195
6196         if (adev->pm.pcie_gen_mask == 0) {
6197                 /* asic caps */
6198                 pdev = adev->pdev;
6199                 speed_cap = pcie_get_speed_cap(pdev);
6200                 if (speed_cap == PCI_SPEED_UNKNOWN) {
6201                         adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6202                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6203                                                   CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
6204                 } else {
6205                         if (speed_cap == PCIE_SPEED_32_0GT)
6206                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6207                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6208                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6209                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4 |
6210                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN5);
6211                         else if (speed_cap == PCIE_SPEED_16_0GT)
6212                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6213                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6214                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6215                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN4);
6216                         else if (speed_cap == PCIE_SPEED_8_0GT)
6217                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6218                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6219                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN3);
6220                         else if (speed_cap == PCIE_SPEED_5_0GT)
6221                                 adev->pm.pcie_gen_mask |= (CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6222                                                           CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN2);
6223                         else
6224                                 adev->pm.pcie_gen_mask |= CAIL_ASIC_PCIE_LINK_SPEED_SUPPORT_GEN1;
6225                 }
6226                 /* platform caps */
6227                 if (platform_speed_cap == PCI_SPEED_UNKNOWN) {
6228                         adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6229                                                    CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
6230                 } else {
6231                         if (platform_speed_cap == PCIE_SPEED_32_0GT)
6232                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6233                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6234                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6235                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4 |
6236                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN5);
6237                         else if (platform_speed_cap == PCIE_SPEED_16_0GT)
6238                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6239                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6240                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3 |
6241                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN4);
6242                         else if (platform_speed_cap == PCIE_SPEED_8_0GT)
6243                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6244                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 |
6245                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3);
6246                         else if (platform_speed_cap == PCIE_SPEED_5_0GT)
6247                                 adev->pm.pcie_gen_mask |= (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1 |
6248                                                            CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2);
6249                         else
6250                                 adev->pm.pcie_gen_mask |= CAIL_PCIE_LINK_SPEED_SUPPORT_GEN1;
6251
6252                 }
6253         }
6254         if (adev->pm.pcie_mlw_mask == 0) {
6255                 if (platform_link_width == PCIE_LNK_WIDTH_UNKNOWN) {
6256                         adev->pm.pcie_mlw_mask |= AMDGPU_DEFAULT_PCIE_MLW_MASK;
6257                 } else {
6258                         switch (platform_link_width) {
6259                         case PCIE_LNK_X32:
6260                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X32 |
6261                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
6262                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6263                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6264                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6265                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6266                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6267                                 break;
6268                         case PCIE_LNK_X16:
6269                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X16 |
6270                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6271                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6272                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6273                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6274                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6275                                 break;
6276                         case PCIE_LNK_X12:
6277                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X12 |
6278                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6279                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6280                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6281                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6282                                 break;
6283                         case PCIE_LNK_X8:
6284                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X8 |
6285                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6286                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6287                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6288                                 break;
6289                         case PCIE_LNK_X4:
6290                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X4 |
6291                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6292                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6293                                 break;
6294                         case PCIE_LNK_X2:
6295                                 adev->pm.pcie_mlw_mask = (CAIL_PCIE_LINK_WIDTH_SUPPORT_X2 |
6296                                                           CAIL_PCIE_LINK_WIDTH_SUPPORT_X1);
6297                                 break;
6298                         case PCIE_LNK_X1:
6299                                 adev->pm.pcie_mlw_mask = CAIL_PCIE_LINK_WIDTH_SUPPORT_X1;
6300                                 break;
6301                         default:
6302                                 break;
6303                         }
6304                 }
6305         }
6306 }
6307
6308 /**
6309  * amdgpu_device_is_peer_accessible - Check peer access through PCIe BAR
6310  *
6311  * @adev: amdgpu_device pointer
6312  * @peer_adev: amdgpu_device pointer for peer device trying to access @adev
6313  *
6314  * Return true if @peer_adev can access (DMA) @adev through the PCIe
6315  * BAR, i.e. @adev is "large BAR" and the BAR matches the DMA mask of
6316  * @peer_adev.
6317  */
6318 bool amdgpu_device_is_peer_accessible(struct amdgpu_device *adev,
6319                                       struct amdgpu_device *peer_adev)
6320 {
6321 #ifdef CONFIG_HSA_AMD_P2P
6322         bool p2p_access =
6323                 !adev->gmc.xgmi.connected_to_cpu &&
6324                 !(pci_p2pdma_distance(adev->pdev, peer_adev->dev, false) < 0);
6325         if (!p2p_access)
6326                 dev_info(adev->dev, "PCIe P2P access from peer device %s is not supported by the chipset\n",
6327                         pci_name(peer_adev->pdev));
6328
6329         bool is_large_bar = adev->gmc.visible_vram_size &&
6330                 adev->gmc.real_vram_size == adev->gmc.visible_vram_size;
6331         bool p2p_addressable = amdgpu_device_check_iommu_remap(peer_adev);
6332
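        /*
         * Without IOMMU remapping, the BAR must be directly addressable by
         * the peer: both the aperture base and its last byte have to fall
         * within the peer's DMA mask (e.g. below 4 GiB for a 32-bit mask).
         */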
6333         if (!p2p_addressable) {
6334                 uint64_t address_mask = peer_adev->dev->dma_mask ?
6335                         ~*peer_adev->dev->dma_mask : ~((1ULL << 32) - 1);
6336                 resource_size_t aper_limit =
6337                         adev->gmc.aper_base + adev->gmc.aper_size - 1;
6338
6339                 p2p_addressable = !(adev->gmc.aper_base & address_mask ||
6340                                      aper_limit & address_mask);
6341         }
6342         return pcie_p2p && is_large_bar && p2p_access && p2p_addressable;
6343 #else
6344         return false;
6345 #endif
6346 }
6347
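/*
 * BACO ("Bus Active, Chip Off") keeps the PCIe interface alive while the
 * rest of the chip is powered down.  With RAS enabled, doorbell interrupts
 * are disabled on entry and re-enabled on exit, mirroring each other across
 * the BACO window.
 */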
6348 int amdgpu_device_baco_enter(struct drm_device *dev)
6349 {
6350         struct amdgpu_device *adev = drm_to_adev(dev);
6351         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
6352
6353         if (!amdgpu_device_supports_baco(dev))
6354                 return -ENOTSUPP;
6355
6356         if (ras && adev->ras_enabled &&
6357             adev->nbio.funcs->enable_doorbell_interrupt)
6358                 adev->nbio.funcs->enable_doorbell_interrupt(adev, false);
6359
6360         return amdgpu_dpm_baco_enter(adev);
6361 }
6362
6363 int amdgpu_device_baco_exit(struct drm_device *dev)
6364 {
6365         struct amdgpu_device *adev = drm_to_adev(dev);
6366         struct amdgpu_ras *ras = amdgpu_ras_get_context(adev);
6367         int ret = 0;
6368
6369         if (!amdgpu_device_supports_baco(dev))
6370                 return -ENOTSUPP;
6371
6372         ret = amdgpu_dpm_baco_exit(adev);
6373         if (ret)
6374                 return ret;
6375
6376         if (ras && adev->ras_enabled &&
6377             adev->nbio.funcs->enable_doorbell_interrupt)
6378                 adev->nbio.funcs->enable_doorbell_interrupt(adev, true);
6379
6380         if (amdgpu_passthrough(adev) && adev->nbio.funcs &&
6381             adev->nbio.funcs->clear_doorbell_interrupt)
6382                 adev->nbio.funcs->clear_doorbell_interrupt(adev);
6383
6384         return 0;
6385 }
6386
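/*
 * PCI error recovery (AER) flow, as driven by the PCI core:
 * error_detected() -> mmio_enabled() (for pci_channel_io_normal) or
 * slot_reset() (for pci_channel_io_frozen) -> resume().  The callbacks
 * below implement that state machine for amdgpu.
 */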
6387 /**
6388  * amdgpu_pci_error_detected - Called when a PCI error is detected.
6389  * @pdev: PCI device struct
6390  * @state: PCI channel state
6391  *
6392  * Description: Called when a PCI error is detected.
6393  *
6394  * Return: PCI_ERS_RESULT_NEED_RESET or PCI_ERS_RESULT_DISCONNECT.
6395  */
6396 pci_ers_result_t amdgpu_pci_error_detected(struct pci_dev *pdev, pci_channel_state_t state)
6397 {
6398         struct drm_device *dev = pci_get_drvdata(pdev);
6399         struct amdgpu_device *adev = drm_to_adev(dev);
6400         int i;
6401
6402         DRM_INFO("PCI error: detected callback, state(%d)!!\n", state);
6403
6404         if (adev->gmc.xgmi.num_physical_nodes > 1) {
6405                 DRM_WARN("No support for XGMI hive yet...");
6406                 return PCI_ERS_RESULT_DISCONNECT;
6407         }
6408
6409         adev->pci_channel_state = state;
6410
6411         switch (state) {
6412         case pci_channel_io_normal:
6413                 return PCI_ERS_RESULT_CAN_RECOVER;
6414         /* Fatal error, prepare for slot reset */
6415         case pci_channel_io_frozen:
6416                 /*
6417                  * Locking adev->reset_domain->sem will prevent any external access
6418                  * to GPU during PCI error recovery
6419                  */
6420                 amdgpu_device_lock_reset_domain(adev->reset_domain);
6421                 amdgpu_device_set_mp1_state(adev);
6422
6423                 /*
6424                  * Block any work scheduling as we do for regular GPU reset
6425                  * for the duration of the recovery
6426                  */
6427                 for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
6428                         struct amdgpu_ring *ring = adev->rings[i];
6429
6430                         if (!amdgpu_ring_sched_ready(ring))
6431                                 continue;
6432
6433                         drm_sched_stop(&ring->sched, NULL);
6434                 }
6435                 atomic_inc(&adev->gpu_reset_counter);
6436                 return PCI_ERS_RESULT_NEED_RESET;
6437         case pci_channel_io_perm_failure:
6438                 /* Permanent error, prepare for device removal */
6439                 return PCI_ERS_RESULT_DISCONNECT;
6440         }
6441
6442         return PCI_ERS_RESULT_NEED_RESET;
6443 }
6444
6445 /**
6446  * amdgpu_pci_mmio_enabled - Enable MMIO and dump debug registers
6447  * @pdev: pointer to PCI device
6448  */
6449 pci_ers_result_t amdgpu_pci_mmio_enabled(struct pci_dev *pdev)
6450 {
6451
6452         DRM_INFO("PCI error: mmio enabled callback!!\n");
6453
6454         /* TODO - dump whatever for debugging purposes */
6455
6456         /* This is called only if amdgpu_pci_error_detected returns
6457          * PCI_ERS_RESULT_CAN_RECOVER. Read/write to the device still
6458          * works, so there is no need to reset the slot.
6459          */
6460
6461         return PCI_ERS_RESULT_RECOVERED;
6462 }
6463
6464 /**
6465  * amdgpu_pci_slot_reset - Called when PCI slot has been reset.
6466  * @pdev: PCI device struct
6467  *
6468  * Description: This routine is called by the pci error recovery
6469  * code after the PCI slot has been reset, just before we
6470  * should resume normal operations.
6471  */
6472 pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
6473 {
6474         struct drm_device *dev = pci_get_drvdata(pdev);
6475         struct amdgpu_device *adev = drm_to_adev(dev);
6476         int r, i;
6477         struct amdgpu_reset_context reset_context;
6478         u32 memsize;
6479         struct list_head device_list;
6480
6481         /* PCI error slot reset should be skipped during RAS recovery */
6482         if ((amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 3) ||
6483             amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(9, 4, 4)) &&
6484             amdgpu_ras_in_recovery(adev))
6485                 return PCI_ERS_RESULT_RECOVERED;
6486
6487         DRM_INFO("PCI error: slot reset callback!!\n");
6488
6489         memset(&reset_context, 0, sizeof(reset_context));
6490
6491         INIT_LIST_HEAD(&device_list);
6492         list_add_tail(&adev->reset_list, &device_list);
6493
6494         /* wait for asic to come out of reset */
6495         msleep(500);
6496
6497         /* Restore PCI confspace */
6498         amdgpu_device_load_pci_state(pdev);
6499
6500         /* confirm ASIC came out of reset */
6501         for (i = 0; i < adev->usec_timeout; i++) {
6502                 memsize = amdgpu_asic_get_config_memsize(adev);
6503
6504                 if (memsize != 0xffffffff)
6505                         break;
6506                 udelay(1);
6507         }
6508         if (memsize == 0xffffffff) {
6509                 r = -ETIME;
6510                 goto out;
6511         }
6512
6513         reset_context.method = AMD_RESET_METHOD_NONE;
6514         reset_context.reset_req_dev = adev;
6515         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
6516         set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
6517
6518         adev->no_hw_access = true;
6519         r = amdgpu_device_pre_asic_reset(adev, &reset_context);
6520         adev->no_hw_access = false;
6521         if (r)
6522                 goto out;
6523
6524         r = amdgpu_do_asic_reset(&device_list, &reset_context);
6525
6526 out:
6527         if (!r) {
6528                 if (amdgpu_device_cache_pci_state(adev->pdev))
6529                         pci_restore_state(adev->pdev);
6530
6531                 DRM_INFO("PCIe error recovery succeeded\n");
6532         } else {
6533                 DRM_ERROR("PCIe error recovery failed, err:%d", r);
6534                 amdgpu_device_unset_mp1_state(adev);
6535                 amdgpu_device_unlock_reset_domain(adev->reset_domain);
6536         }
6537
6538         return r ? PCI_ERS_RESULT_DISCONNECT : PCI_ERS_RESULT_RECOVERED;
6539 }
6540
6541 /**
6542  * amdgpu_pci_resume() - resume normal ops after PCI reset
6543  * @pdev: pointer to PCI device
6544  *
6545  * Called when the error recovery driver tells us that it is
6546  * OK to resume normal operation.
6547  */
6548 void amdgpu_pci_resume(struct pci_dev *pdev)
6549 {
6550         struct drm_device *dev = pci_get_drvdata(pdev);
6551         struct amdgpu_device *adev = drm_to_adev(dev);
6552         int i;
6553
6555         DRM_INFO("PCI error: resume callback!!\n");
6556
6557         /* Only continue execution for the case of pci_channel_io_frozen */
6558         if (adev->pci_channel_state != pci_channel_io_frozen)
6559                 return;
6560
6561         for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
6562                 struct amdgpu_ring *ring = adev->rings[i];
6563
6564                 if (!amdgpu_ring_sched_ready(ring))
6565                         continue;
6566
6567                 drm_sched_start(&ring->sched, 0);
6568         }
6569
6570         amdgpu_device_unset_mp1_state(adev);
6571         amdgpu_device_unlock_reset_domain(adev->reset_domain);
6572 }
6573
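/*
 * The saved PCI config space cached below is what
 * amdgpu_device_load_pci_state() restores after a slot reset (see
 * amdgpu_pci_slot_reset() above), so the device comes back with its
 * pre-reset BARs and command register.
 */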
6574 bool amdgpu_device_cache_pci_state(struct pci_dev *pdev)
6575 {
6576         struct drm_device *dev = pci_get_drvdata(pdev);
6577         struct amdgpu_device *adev = drm_to_adev(dev);
6578         int r;
6579
6580         if (amdgpu_sriov_vf(adev))
6581                 return false;
6582
6583         r = pci_save_state(pdev);
6584         if (!r) {
6585                 kfree(adev->pci_state);
6586
6587                 adev->pci_state = pci_store_saved_state(pdev);
6588
6589                 if (!adev->pci_state) {
6590                         DRM_ERROR("Failed to store PCI saved state");
6591                         return false;
6592                 }
6593         } else {
6594                 DRM_WARN("Failed to save PCI state, err:%d\n", r);
6595                 return false;
6596         }
6597
6598         return true;
6599 }
6600
6601 bool amdgpu_device_load_pci_state(struct pci_dev *pdev)
6602 {
6603         struct drm_device *dev = pci_get_drvdata(pdev);
6604         struct amdgpu_device *adev = drm_to_adev(dev);
6605         int r;
6606
6607         if (!adev->pci_state)
6608                 return false;
6609
6610         r = pci_load_saved_state(pdev, adev->pci_state);
6611
6612         if (!r) {
6613                 pci_restore_state(pdev);
6614         } else {
6615                 DRM_WARN("Failed to load PCI state, err:%d\n", r);
6616                 return false;
6617         }
6618
6619         return true;
6620 }
6621
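/*
 * HDP (Host Data Path) is the block through which host accesses to VRAM over
 * the PCIe BAR flow.  Flush/invalidate is skipped where it is not needed: on
 * APUs (unless running in passthrough) and when the GPU is cache-coherent
 * with the CPU via XGMI.
 */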
6622 void amdgpu_device_flush_hdp(struct amdgpu_device *adev,
6623                 struct amdgpu_ring *ring)
6624 {
6625 #ifdef CONFIG_X86_64
6626         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
6627                 return;
6628 #endif
6629         if (adev->gmc.xgmi.connected_to_cpu)
6630                 return;
6631
6632         if (ring && ring->funcs->emit_hdp_flush)
6633                 amdgpu_ring_emit_hdp_flush(ring);
6634         else
6635                 amdgpu_asic_flush_hdp(adev, ring);
6636 }
6637
6638 void amdgpu_device_invalidate_hdp(struct amdgpu_device *adev,
6639                 struct amdgpu_ring *ring)
6640 {
6641 #ifdef CONFIG_X86_64
6642         if ((adev->flags & AMD_IS_APU) && !amdgpu_passthrough(adev))
6643                 return;
6644 #endif
6645         if (adev->gmc.xgmi.connected_to_cpu)
6646                 return;
6647
6648         amdgpu_asic_invalidate_hdp(adev, ring);
6649 }
6650
6651 int amdgpu_in_reset(struct amdgpu_device *adev)
6652 {
6653         return atomic_read(&adev->reset_domain->in_gpu_reset);
6654 }
6655
6656 /**
6657  * amdgpu_device_halt() - bring hardware to some kind of halt state
6658  *
6659  * @adev: amdgpu_device pointer
6660  *
6661  * Bring hardware to some kind of halt state so that no one can touch it
6662  * any more. This helps to maintain the error context when an error occurs.
6663  * Compared to a simple hang, the system stays stable at least for SSH
6664  * access, so it should be trivial to inspect the hardware state and
6665  * see what's going on. Implemented as follows:
6666  *
6667  * 1. drm_dev_unplug() makes device inaccessible to user space(IOCTLs, etc),
6668  *    clears all CPU mappings to device, disallows remappings through page faults
6669  * 2. amdgpu_irq_disable_all() disables all interrupts
6670  * 3. amdgpu_fence_driver_hw_fini() signals all HW fences
6671  * 4. set adev->no_hw_access to avoid potential crashes after step 5
6672  * 5. amdgpu_device_unmap_mmio() clears all MMIO mappings
6673  * 6. pci_disable_device() and pci_wait_for_pending_transaction()
6674  *    flush any in flight DMA operations
6675  */
6676 void amdgpu_device_halt(struct amdgpu_device *adev)
6677 {
6678         struct pci_dev *pdev = adev->pdev;
6679         struct drm_device *ddev = adev_to_drm(adev);
6680
6681         amdgpu_xcp_dev_unplug(adev);
6682         drm_dev_unplug(ddev);
6683
6684         amdgpu_irq_disable_all(adev);
6685
6686         amdgpu_fence_driver_hw_fini(adev);
6687
6688         adev->no_hw_access = true;
6689
6690         amdgpu_device_unmap_mmio(adev);
6691
6692         pci_disable_device(pdev);
6693         pci_wait_for_pending_transaction(pdev);
6694 }
6695
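/*
 * The PCIe port registers are accessed through an index/data register pair:
 * write the register offset to the index register, then read or write the
 * data register.  The dummy read-back of the index register ensures the
 * posted write has landed before the data access, and the spinlock keeps
 * the two-step sequence atomic.
 */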
6696 u32 amdgpu_device_pcie_port_rreg(struct amdgpu_device *adev,
6697                                 u32 reg)
6698 {
6699         unsigned long flags, address, data;
6700         u32 r;
6701
6702         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
6703         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
6704
6705         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
6706         WREG32(address, reg * 4);
6707         (void)RREG32(address);
6708         r = RREG32(data);
6709         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
6710         return r;
6711 }
6712
6713 void amdgpu_device_pcie_port_wreg(struct amdgpu_device *adev,
6714                                 u32 reg, u32 v)
6715 {
6716         unsigned long flags, address, data;
6717
6718         address = adev->nbio.funcs->get_pcie_port_index_offset(adev);
6719         data = adev->nbio.funcs->get_pcie_port_data_offset(adev);
6720
6721         spin_lock_irqsave(&adev->pcie_idx_lock, flags);
6722         WREG32(address, reg * 4);
6723         (void)RREG32(address);
6724         WREG32(data, v);
6725         (void)RREG32(data);
6726         spin_unlock_irqrestore(&adev->pcie_idx_lock, flags);
6727 }
6728
6729 /**
6730  * amdgpu_device_get_gang - return a reference to the current gang
6731  * @adev: amdgpu_device pointer
6732  *
6733  * Returns: A new reference to the current gang leader.
6734  */
6735 struct dma_fence *amdgpu_device_get_gang(struct amdgpu_device *adev)
6736 {
6737         struct dma_fence *fence;
6738
6739         rcu_read_lock();
6740         fence = dma_fence_get_rcu_safe(&adev->gang_submit);
6741         rcu_read_unlock();
6742         return fence;
6743 }
6744
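/*
 * Gang submission context: amdgpu_device_switch_gang() below is lock-free.
 * The cmpxchg loop only installs the new gang leader fence once the current
 * one has signaled; otherwise the still-running leader is returned and the
 * caller must wait for it first.
 */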
6745 /**
6746  * amdgpu_device_switch_gang - switch to a new gang
6747  * @adev: amdgpu_device pointer
6748  * @gang: the gang to switch to
6749  *
6750  * Try to switch to a new gang.
6751  * Returns: NULL if we switched to the new gang or a reference to the current
6752  * gang leader.
6753  */
6754 struct dma_fence *amdgpu_device_switch_gang(struct amdgpu_device *adev,
6755                                             struct dma_fence *gang)
6756 {
6757         struct dma_fence *old = NULL;
6758
6759         do {
6760                 dma_fence_put(old);
6761                 old = amdgpu_device_get_gang(adev);
6762                 if (old == gang)
6763                         break;
6764
6765                 if (!dma_fence_is_signaled(old))
6766                         return old;
6767
6768         } while (cmpxchg((struct dma_fence __force **)&adev->gang_submit,
6769                          old, gang) != old);
6770
6771         dma_fence_put(old);
6772         return NULL;
6773 }
6774
6775 bool amdgpu_device_has_display_hardware(struct amdgpu_device *adev)
6776 {
6777         switch (adev->asic_type) {
6778 #ifdef CONFIG_DRM_AMDGPU_SI
6779         case CHIP_HAINAN:
6780 #endif
6781         case CHIP_TOPAZ:
6782                 /* chips with no display hardware */
6783                 return false;
6784 #ifdef CONFIG_DRM_AMDGPU_SI
6785         case CHIP_TAHITI:
6786         case CHIP_PITCAIRN:
6787         case CHIP_VERDE:
6788         case CHIP_OLAND:
6789 #endif
6790 #ifdef CONFIG_DRM_AMDGPU_CIK
6791         case CHIP_BONAIRE:
6792         case CHIP_HAWAII:
6793         case CHIP_KAVERI:
6794         case CHIP_KABINI:
6795         case CHIP_MULLINS:
6796 #endif
6797         case CHIP_TONGA:
6798         case CHIP_FIJI:
6799         case CHIP_POLARIS10:
6800         case CHIP_POLARIS11:
6801         case CHIP_POLARIS12:
6802         case CHIP_VEGAM:
6803         case CHIP_CARRIZO:
6804         case CHIP_STONEY:
6805                 /* chips with display hardware */
6806                 return true;
6807         default:
6808                 /* IP discovery */
6809                 if (!amdgpu_ip_version(adev, DCE_HWIP, 0) ||
6810                     (adev->harvest_ip_mask & AMD_HARVEST_IP_DMU_MASK))
6811                         return false;
6812                 return true;
6813         }
6814 }
6815
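/*
 * Polling helper: the timeout counter restarts whenever the register value
 * changes, so a register that is still making progress is not flagged; only
 * a value that stays unchanged for adev->usec_timeout iterations times out.
 */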
6816 uint32_t amdgpu_device_wait_on_rreg(struct amdgpu_device *adev,
6817                 uint32_t inst, uint32_t reg_addr, char reg_name[],
6818                 uint32_t expected_value, uint32_t mask)
6819 {
6820         uint32_t ret = 0;
6821         uint32_t old_ = 0;
6822         uint32_t tmp_ = RREG32(reg_addr);
6823         uint32_t loop = adev->usec_timeout;
6824
6825         while ((tmp_ & (mask)) != (expected_value)) {
6826                 if (old_ != tmp_) {
6827                         loop = adev->usec_timeout;
6828                         old_ = tmp_;
6829                 } else
6830                         udelay(1);
6831                 tmp_ = RREG32(reg_addr);
6832                 loop--;
6833                 if (!loop) {
6834                         DRM_WARN("Register(%d) [%s] failed to reach value 0x%08x != 0x%08x\n",
6835                                   inst, reg_name, (uint32_t)expected_value,
6836                                   (uint32_t)(tmp_ & (mask)));
6837                         ret = -ETIMEDOUT;
6838                         break;
6839                 }
6840         }
6841         return ret;
6842 }
6843
6844 ssize_t amdgpu_get_soft_full_reset_mask(struct amdgpu_ring *ring)
6845 {
6846         ssize_t size = 0;
6847
6848         if (!ring || !ring->adev)
6849                 return size;
6850
6851         if (amdgpu_device_should_recover_gpu(ring->adev))
6852                 size |= AMDGPU_RESET_TYPE_FULL;
6853
6854         if (unlikely(!ring->adev->debug_disable_soft_recovery) &&
6855             !amdgpu_sriov_vf(ring->adev) && ring->funcs->soft_recovery)
6856                 size |= AMDGPU_RESET_TYPE_SOFT_RESET;
6857
6858         return size;
6859 }
6860
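/*
 * Formats the supported-reset bitmask for sysfs.  For example, a mask with
 * AMDGPU_RESET_TYPE_SOFT_RESET and AMDGPU_RESET_TYPE_FULL set emits
 * "soft full \n", while an empty mask emits "unsupported\n".
 */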
6861 ssize_t amdgpu_show_reset_mask(char *buf, uint32_t supported_reset)
6862 {
6863         ssize_t size = 0;
6864
6865         if (supported_reset == 0) {
6866                 size += sysfs_emit_at(buf, size, "unsupported");
6867                 size += sysfs_emit_at(buf, size, "\n");
6868                 return size;
6869         }
6871
6872         if (supported_reset & AMDGPU_RESET_TYPE_SOFT_RESET)
6873                 size += sysfs_emit_at(buf, size, "soft ");
6874
6875         if (supported_reset & AMDGPU_RESET_TYPE_PER_QUEUE)
6876                 size += sysfs_emit_at(buf, size, "queue ");
6877
6878         if (supported_reset & AMDGPU_RESET_TYPE_PER_PIPE)
6879                 size += sysfs_emit_at(buf, size, "pipe ");
6880
6881         if (supported_reset & AMDGPU_RESET_TYPE_FULL)
6882                 size += sysfs_emit_at(buf, size, "full ");
6883
6884         size += sysfs_emit_at(buf, size, "\n");
6885         return size;
6886 }