cxl/pci: Skip handling RAS errors if the CXL.mem device is detached

author Li Ming <ming4.li@intel.com>

Mon, 29 Jan 2024 13:18:56 +0000 (13:18 +0000)

committer Dan Williams <dan.j.williams@intel.com>

Mon, 29 Jan 2024 20:59:07 +0000 (12:59 -0800)
author Li Ming <ming4.li@intel.com>
Mon, 29 Jan 2024 13:18:56 +0000 (13:18 +0000)
committer Dan Williams <dan.j.williams@intel.com>
Mon, 29 Jan 2024 20:59:07 +0000 (12:59 -0800)
diff --git a/drivers/cxl/core/pci.c b/drivers/cxl/core/pci.c

index 6c9c8d9..480489f 100644 (file)
--- a/drivers/cxl/core/pci.c
+++ b/drivers/cxl/core/pci.c
@@ -932,11 +932,21 @@ static void cxl_handle_rdport_errors(struct cxl_dev_state *cxlds) { }
  void cxl_cor_error_detected(struct pci_dev *pdev)
  {
         struct cxl_dev_state *cxlds = pci_get_drvdata(pdev);
+       struct device *dev = &cxlds->cxlmd->dev;
+
+       scoped_guard(device, dev) {
+               if (!dev->driver) {
+                       dev_warn(&pdev->dev,
+                                "%s: memdev disabled, abort error handling\n",
+                                dev_name(dev));
+                       return;
+               }
  
-       if (cxlds->rcd)
-               cxl_handle_rdport_errors(cxlds);
+               if (cxlds->rcd)
+                       cxl_handle_rdport_errors(cxlds);
  
-       cxl_handle_endpoint_cor_ras(cxlds);
+               cxl_handle_endpoint_cor_ras(cxlds);
+       }
  }
  EXPORT_SYMBOL_NS_GPL(cxl_cor_error_detected, CXL);
  
@@ -948,16 +958,25 @@ pci_ers_result_t cxl_error_detected(struct pci_dev *pdev,
         struct device *dev = &cxlmd->dev;
         bool ue;
  
-       if (cxlds->rcd)
-               cxl_handle_rdport_errors(cxlds);
+       scoped_guard(device, dev) {
+               if (!dev->driver) {
+                       dev_warn(&pdev->dev,
+                                "%s: memdev disabled, abort error handling\n",
+                                dev_name(dev));
+                       return PCI_ERS_RESULT_DISCONNECT;
+               }
+
+               if (cxlds->rcd)
+                       cxl_handle_rdport_errors(cxlds);
+               /*
+                * A frozen channel indicates an impending reset which is fatal to
+                * CXL.mem operation, and will likely crash the system. On the off
+                * chance the situation is recoverable dump the status of the RAS
+                * capability registers and bounce the active state of the memdev.
+                */
+               ue = cxl_handle_endpoint_ras(cxlds);
+       }
  
-       /*
-        * A frozen channel indicates an impending reset which is fatal to
-        * CXL.mem operation, and will likely crash the system. On the off
-        * chance the situation is recoverable dump the status of the RAS
-        * capability registers and bounce the active state of the memdev.
-        */
-       ue = cxl_handle_endpoint_ras(cxlds);
  
         switch (state) {
         case pci_channel_io_normal:
author	Li Ming <ming4.li@intel.com>
	Mon, 29 Jan 2024 13:18:56 +0000 (13:18 +0000)
committer	Dan Williams <dan.j.williams@intel.com>
	Mon, 29 Jan 2024 20:59:07 +0000 (12:59 -0800)