PCI/DPC: Ignore Surprise Down error on hot removal

author Smita Koralahalli <[email protected]>

Wed, 7 Feb 2024 18:18:54 +0000 (18:18 +0000)

committer Bjorn Helgaas <[email protected]>

Wed, 28 Feb 2024 16:24:36 +0000 (10:24 -0600)
author Smita Koralahalli <[email protected]>
Wed, 7 Feb 2024 18:18:54 +0000 (18:18 +0000)
committer Bjorn Helgaas <[email protected]>
Wed, 28 Feb 2024 16:24:36 +0000 (10:24 -0600)
diff --git a/drivers/pci/pcie/dpc.c b/drivers/pci/pcie/dpc.c

index e5d7c12854fa027c548781d53a01904cb3dea7fd..98b42e425bb916f8cf229d6518c6172f5fce60d6 100644 (file)
--- a/drivers/pci/pcie/dpc.c
+++ b/drivers/pci/pcie/dpc.c
@@ -303,10 +303,70 @@ void dpc_process_error(struct pci_dev *pdev)
         }
  }
  
+static void pci_clear_surpdn_errors(struct pci_dev *pdev)
+{
+       if (pdev->dpc_rp_extensions)
+               pci_write_config_dword(pdev, pdev->dpc_cap +
+                                      PCI_EXP_DPC_RP_PIO_STATUS, ~0);
+
+       /*
+        * In practice, Surprise Down errors have been observed to also set
+        * error bits in the Status Register as well as the Fatal Error
+        * Detected bit in the Device Status Register.
+        */
+       pci_write_config_word(pdev, PCI_STATUS, 0xffff);
+
+       pcie_capability_write_word(pdev, PCI_EXP_DEVSTA, PCI_EXP_DEVSTA_FED);
+}
+
+static void dpc_handle_surprise_removal(struct pci_dev *pdev)
+{
+       if (!pcie_wait_for_link(pdev, false)) {
+               pci_info(pdev, "Data Link Layer Link Active not cleared in 1000 msec\n");
+               goto out;
+       }
+
+       if (pdev->dpc_rp_extensions && dpc_wait_rp_inactive(pdev))
+               goto out;
+
+       pci_aer_raw_clear_status(pdev);
+       pci_clear_surpdn_errors(pdev);
+
+       pci_write_config_word(pdev, pdev->dpc_cap + PCI_EXP_DPC_STATUS,
+                             PCI_EXP_DPC_STATUS_TRIGGER);
+
+out:
+       clear_bit(PCI_DPC_RECOVERED, &pdev->priv_flags);
+       wake_up_all(&dpc_completed_waitqueue);
+}
+
+static bool dpc_is_surprise_removal(struct pci_dev *pdev)
+{
+       u16 status;
+
+       if (!pdev->is_hotplug_bridge)
+               return false;
+
+       if (pci_read_config_word(pdev, pdev->aer_cap + PCI_ERR_UNCOR_STATUS,
+                                &status))
+               return false;
+
+       return status & PCI_ERR_UNC_SURPDN;
+}
+
  static irqreturn_t dpc_handler(int irq, void *context)
  {
         struct pci_dev *pdev = context;
  
+       /*
+        * According to PCIe r6.0 sec 6.7.6, errors are an expected side effect
+        * of async removal and should be ignored by software.
+        */
+       if (dpc_is_surprise_removal(pdev)) {
+               dpc_handle_surprise_removal(pdev);
+               return IRQ_HANDLED;
+       }
+
         dpc_process_error(pdev);
  
         /* We configure DPC so it only triggers on ERR_FATAL */
author	Smita Koralahalli <[email protected]>
	Wed, 7 Feb 2024 18:18:54 +0000 (18:18 +0000)
committer	Bjorn Helgaas <[email protected]>
	Wed, 28 Feb 2024 16:24:36 +0000 (10:24 -0600)