|
@@ -1,8 +1,8 @@
|
|
|
/*
|
|
|
- * eeh.c
|
|
|
* Copyright IBM Corporation 2001, 2005, 2006
|
|
|
* Copyright Dave Engebretsen & Todd Inglett 2001
|
|
|
* Copyright Linas Vepstas 2005, 2006
|
|
|
+ * Copyright 2001-2012 IBM Corporation.
|
|
|
*
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
@@ -22,7 +22,7 @@
|
|
|
*/
|
|
|
|
|
|
#include <linux/delay.h>
|
|
|
-#include <linux/sched.h> /* for init_mm */
|
|
|
+#include <linux/sched.h>
|
|
|
#include <linux/init.h>
|
|
|
#include <linux/list.h>
|
|
|
#include <linux/pci.h>
|
|
@@ -129,9 +129,16 @@ static unsigned long slot_resets;
|
|
|
|
|
|
#define IS_BRIDGE(class_code) (((class_code)<<16) == PCI_BASE_CLASS_BRIDGE)
|
|
|
|
|
|
-/* --------------------------------------------------------------- */
|
|
|
-/* Below lies the EEH event infrastructure */
|
|
|
-
|
|
|
+/**
|
|
|
+ * rtas_slot_error_detail - Retrieve error log through RTAS call
|
|
|
+ * @pdn: device node
|
|
|
+ * @severity: temporary or permanent error log
|
|
|
+ * @driver_log: driver log to be combined with the retrieved error log
|
|
|
+ * @loglen: length of driver log
|
|
|
+ *
|
|
|
+ * This routine should be called to retrieve error log through the dedicated
|
|
|
+ * RTAS call.
|
|
|
+ */
|
|
|
static void rtas_slot_error_detail(struct pci_dn *pdn, int severity,
|
|
|
char *driver_log, size_t loglen)
|
|
|
{
|
|
@@ -163,7 +170,7 @@ static void rtas_slot_error_detail(struct pci_dn *pdn, int severity,
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * gather_pci_data - copy assorted PCI config space registers to buff
|
|
|
+ * gather_pci_data - Copy assorted PCI config space registers to buff
|
|
|
* @pdn: device to report data for
|
|
|
* @buf: point to buffer in which to log
|
|
|
* @len: amount of room in buffer
|
|
@@ -258,6 +265,16 @@ static size_t gather_pci_data(struct pci_dn *pdn, char * buf, size_t len)
|
|
|
return n;
|
|
|
}
|
|
|
|
|
|
+/**
|
|
|
+ * eeh_slot_error_detail - Generate combined log including driver log and error log
|
|
|
+ * @pdn: device node
|
|
|
+ * @severity: temporary or permanent error log
|
|
|
+ *
|
|
|
+ * This routine should be called to generate the combined log, which
|
|
|
+ * is comprised of driver log and error log. The driver log is figured
|
|
|
+ * out from the config space of the corresponding PCI device, while
|
|
|
+ * the error log is fetched through platform dependent function call.
|
|
|
+ */
|
|
|
void eeh_slot_error_detail(struct pci_dn *pdn, int severity)
|
|
|
{
|
|
|
size_t loglen = 0;
|
|
@@ -275,6 +292,9 @@ void eeh_slot_error_detail(struct pci_dn *pdn, int severity)
|
|
|
* read_slot_reset_state - Read the reset state of a device node's slot
|
|
|
* @dn: device node to read
|
|
|
* @rets: array to return results in
|
|
|
+ *
|
|
|
+ * Read the reset state of a device node's slot through platform dependent
|
|
|
+ * function call.
|
|
|
*/
|
|
|
static int read_slot_reset_state(struct pci_dn *pdn, int rets[])
|
|
|
{
|
|
@@ -300,9 +320,9 @@ static int read_slot_reset_state(struct pci_dn *pdn, int rets[])
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * eeh_wait_for_slot_status - returns error status of slot
|
|
|
- * @pdn pci device node
|
|
|
- * @max_wait_msecs maximum number to millisecs to wait
|
|
|
+ * eeh_wait_for_slot_status - Returns error status of slot
|
|
|
+ * @pdn: pci device node
|
|
|
+ * @max_wait_msecs: maximum number to millisecs to wait
|
|
|
*
|
|
|
* Return negative value if a permanent error, else return
|
|
|
* Partition Endpoint (PE) status value.
|
|
@@ -332,16 +352,16 @@ eeh_wait_for_slot_status(struct pci_dn *pdn, int max_wait_msecs)
|
|
|
|
|
|
mwait = rets[2];
|
|
|
if (mwait <= 0) {
|
|
|
- printk (KERN_WARNING
|
|
|
- "EEH: Firmware returned bad wait value=%d\n", mwait);
|
|
|
+ printk(KERN_WARNING "EEH: Firmware returned bad wait value=%d\n",
|
|
|
+ mwait);
|
|
|
mwait = 1000;
|
|
|
} else if (mwait > 300*1000) {
|
|
|
- printk (KERN_WARNING
|
|
|
- "EEH: Firmware is taking too long, time=%d\n", mwait);
|
|
|
+ printk(KERN_WARNING "EEH: Firmware is taking too long, time=%d\n",
|
|
|
+ mwait);
|
|
|
mwait = 300*1000;
|
|
|
}
|
|
|
max_wait_msecs -= mwait;
|
|
|
- msleep (mwait);
|
|
|
+ msleep(mwait);
|
|
|
}
|
|
|
|
|
|
printk(KERN_WARNING "EEH: Timed out waiting for slot status\n");
|
|
@@ -349,8 +369,11 @@ eeh_wait_for_slot_status(struct pci_dn *pdn, int max_wait_msecs)
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * eeh_token_to_phys - convert EEH address token to phys address
|
|
|
- * @token i/o token, should be address in the form 0xA....
|
|
|
+ * eeh_token_to_phys - Convert EEH address token to phys address
|
|
|
+ * @token: I/O token, should be address in the form 0xA....
|
|
|
+ *
|
|
|
+ * This routine should be called to convert virtual I/O address
|
|
|
+ * to physical one.
|
|
|
*/
|
|
|
static inline unsigned long eeh_token_to_phys(unsigned long token)
|
|
|
{
|
|
@@ -365,8 +388,11 @@ static inline unsigned long eeh_token_to_phys(unsigned long token)
|
|
|
return pa | (token & (PAGE_SIZE-1));
|
|
|
}
|
|
|
|
|
|
-/**
|
|
|
- * Return the "partitionable endpoint" (pe) under which this device lies
|
|
|
+/**
|
|
|
+ * find_device_pe - Retrieve the PE for the given device
|
|
|
+ * @dn: device node
|
|
|
+ *
|
|
|
+ * Return the PE under which this device lies
|
|
|
*/
|
|
|
struct device_node * find_device_pe(struct device_node *dn)
|
|
|
{
|
|
@@ -377,14 +403,18 @@ struct device_node * find_device_pe(struct device_node *dn)
|
|
|
return dn;
|
|
|
}
|
|
|
|
|
|
-/** Mark all devices that are children of this device as failed.
|
|
|
- * Mark the device driver too, so that it can see the failure
|
|
|
- * immediately; this is critical, since some drivers poll
|
|
|
- * status registers in interrupts ... If a driver is polling,
|
|
|
- * and the slot is frozen, then the driver can deadlock in
|
|
|
- * an interrupt context, which is bad.
|
|
|
+/**
|
|
|
+ * __eeh_mark_slot - Mark all child devices as failed
|
|
|
+ * @parent: parent device
|
|
|
+ * @mode_flag: failure flag
|
|
|
+ *
|
|
|
+ * Mark all devices that are children of this device as failed.
|
|
|
+ * Mark the device driver too, so that it can see the failure
|
|
|
+ * immediately; this is critical, since some drivers poll
|
|
|
+ * status registers in interrupts ... If a driver is polling,
|
|
|
+ * and the slot is frozen, then the driver can deadlock in
|
|
|
+ * an interrupt context, which is bad.
|
|
|
*/
|
|
|
-
|
|
|
static void __eeh_mark_slot(struct device_node *parent, int mode_flag)
|
|
|
{
|
|
|
struct device_node *dn;
|
|
@@ -404,10 +434,18 @@ static void __eeh_mark_slot(struct device_node *parent, int mode_flag)
|
|
|
}
|
|
|
}
|
|
|
|
|
|
-void eeh_mark_slot (struct device_node *dn, int mode_flag)
|
|
|
+/**
|
|
|
+ * eeh_mark_slot - Mark the indicated device and its children as failed
|
|
|
+ * @dn: parent device
|
|
|
+ * @mode_flag: failure flag
|
|
|
+ *
|
|
|
+ * Mark the indicated device and its child devices as failed.
|
|
|
+ * The device drivers are marked as failed as well.
|
|
|
+ */
|
|
|
+void eeh_mark_slot(struct device_node *dn, int mode_flag)
|
|
|
{
|
|
|
struct pci_dev *dev;
|
|
|
- dn = find_device_pe (dn);
|
|
|
+ dn = find_device_pe(dn);
|
|
|
|
|
|
/* Back up one, since config addrs might be shared */
|
|
|
if (!pcibios_find_pci_bus(dn) && PCI_DN(dn->parent))
|
|
@@ -423,6 +461,13 @@ void eeh_mark_slot (struct device_node *dn, int mode_flag)
|
|
|
__eeh_mark_slot(dn, mode_flag);
|
|
|
}
|
|
|
|
|
|
+/**
|
|
|
+ * __eeh_clear_slot - Clear failure flag for the child devices
|
|
|
+ * @parent: parent device
|
|
|
+ * @mode_flag: flag to be cleared
|
|
|
+ *
|
|
|
+ * Clear failure flag for the child devices.
|
|
|
+ */
|
|
|
static void __eeh_clear_slot(struct device_node *parent, int mode_flag)
|
|
|
{
|
|
|
struct device_node *dn;
|
|
@@ -436,12 +481,19 @@ static void __eeh_clear_slot(struct device_node *parent, int mode_flag)
|
|
|
}
|
|
|
}
|
|
|
|
|
|
-void eeh_clear_slot (struct device_node *dn, int mode_flag)
|
|
|
+/**
|
|
|
+ * eeh_clear_slot - Clear failure flag for the indicated device and its children
|
|
|
+ * @dn: parent device
|
|
|
+ * @mode_flag: flag to be cleared
|
|
|
+ *
|
|
|
+ * Clear failure flag for the indicated device and its children.
|
|
|
+ */
|
|
|
+void eeh_clear_slot(struct device_node *dn, int mode_flag)
|
|
|
{
|
|
|
unsigned long flags;
|
|
|
raw_spin_lock_irqsave(&confirm_error_lock, flags);
|
|
|
|
|
|
- dn = find_device_pe (dn);
|
|
|
+ dn = find_device_pe(dn);
|
|
|
|
|
|
/* Back up one, since config addrs might be shared */
|
|
|
if (!pcibios_find_pci_bus(dn) && PCI_DN(dn->parent))
|
|
@@ -453,43 +505,10 @@ void eeh_clear_slot (struct device_node *dn, int mode_flag)
|
|
|
raw_spin_unlock_irqrestore(&confirm_error_lock, flags);
|
|
|
}
|
|
|
|
|
|
-void __eeh_set_pe_freset(struct device_node *parent, unsigned int *freset)
|
|
|
-{
|
|
|
- struct device_node *dn;
|
|
|
-
|
|
|
- for_each_child_of_node(parent, dn) {
|
|
|
- if (PCI_DN(dn)) {
|
|
|
-
|
|
|
- struct pci_dev *dev = PCI_DN(dn)->pcidev;
|
|
|
-
|
|
|
- if (dev && dev->driver)
|
|
|
- *freset |= dev->needs_freset;
|
|
|
-
|
|
|
- __eeh_set_pe_freset(dn, freset);
|
|
|
- }
|
|
|
- }
|
|
|
-}
|
|
|
-
|
|
|
-void eeh_set_pe_freset(struct device_node *dn, unsigned int *freset)
|
|
|
-{
|
|
|
- struct pci_dev *dev;
|
|
|
- dn = find_device_pe(dn);
|
|
|
-
|
|
|
- /* Back up one, since config addrs might be shared */
|
|
|
- if (!pcibios_find_pci_bus(dn) && PCI_DN(dn->parent))
|
|
|
- dn = dn->parent;
|
|
|
-
|
|
|
- dev = PCI_DN(dn)->pcidev;
|
|
|
- if (dev)
|
|
|
- *freset |= dev->needs_freset;
|
|
|
-
|
|
|
- __eeh_set_pe_freset(dn, freset);
|
|
|
-}
|
|
|
-
|
|
|
/**
|
|
|
- * eeh_dn_check_failure - check if all 1's data is due to EEH slot freeze
|
|
|
- * @dn device node
|
|
|
- * @dev pci device, if known
|
|
|
+ * eeh_dn_check_failure - Check if all 1's data is due to EEH slot freeze
|
|
|
+ * @dn: device node
|
|
|
+ * @dev: pci device, if known
|
|
|
*
|
|
|
* Check for an EEH failure for the given device node. Call this
|
|
|
* routine if the result of a read was all 0xff's and you want to
|
|
@@ -548,11 +567,11 @@ int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev)
|
|
|
pdn->eeh_check_count ++;
|
|
|
if (pdn->eeh_check_count % EEH_MAX_FAILS == 0) {
|
|
|
location = of_get_property(dn, "ibm,loc-code", NULL);
|
|
|
- printk (KERN_ERR "EEH: %d reads ignored for recovering device at "
|
|
|
+ printk(KERN_ERR "EEH: %d reads ignored for recovering device at "
|
|
|
"location=%s driver=%s pci addr=%s\n",
|
|
|
pdn->eeh_check_count, location,
|
|
|
eeh_driver_name(dev), eeh_pci_name(dev));
|
|
|
- printk (KERN_ERR "EEH: Might be infinite loop in %s driver\n",
|
|
|
+ printk(KERN_ERR "EEH: Might be infinite loop in %s driver\n",
|
|
|
eeh_driver_name(dev));
|
|
|
dump_stack();
|
|
|
}
|
|
@@ -579,7 +598,8 @@ int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev)
|
|
|
}
|
|
|
|
|
|
/* Note that config-io to empty slots may fail;
|
|
|
- * they are empty when they don't have children. */
|
|
|
+ * they are empty when they don't have children.
|
|
|
+ */
|
|
|
if ((rets[0] == 5) && (rets[2] == 0) && (dn->child == NULL)) {
|
|
|
false_positives++;
|
|
|
pdn->eeh_false_positives ++;
|
|
@@ -609,15 +629,17 @@ int eeh_dn_check_failure(struct device_node *dn, struct pci_dev *dev)
|
|
|
|
|
|
/* Avoid repeated reports of this failure, including problems
|
|
|
* with other functions on this device, and functions under
|
|
|
- * bridges. */
|
|
|
- eeh_mark_slot (dn, EEH_MODE_ISOLATED);
|
|
|
+ * bridges.
|
|
|
+ */
|
|
|
+ eeh_mark_slot(dn, EEH_MODE_ISOLATED);
|
|
|
raw_spin_unlock_irqrestore(&confirm_error_lock, flags);
|
|
|
|
|
|
- eeh_send_failure_event (dn, dev);
|
|
|
+ eeh_send_failure_event(dn, dev);
|
|
|
|
|
|
/* Most EEH events are due to device driver bugs. Having
|
|
|
* a stack trace will help the device-driver authors figure
|
|
|
- * out what happened. So print that out. */
|
|
|
+ * out what happened. So print that out.
|
|
|
+ */
|
|
|
dump_stack();
|
|
|
return 1;
|
|
|
|
|
@@ -629,9 +651,9 @@ dn_unlock:
|
|
|
EXPORT_SYMBOL_GPL(eeh_dn_check_failure);
|
|
|
|
|
|
/**
|
|
|
- * eeh_check_failure - check if all 1's data is due to EEH slot freeze
|
|
|
- * @token i/o token, should be address in the form 0xA....
|
|
|
- * @val value, should be all 1's (XXX why do we need this arg??)
|
|
|
+ * eeh_check_failure - Check if all 1's data is due to EEH slot freeze
|
|
|
+ * @token: I/O token, should be address in the form 0xA....
|
|
|
+ * @val: value, should be all 1's (XXX why do we need this arg??)
|
|
|
*
|
|
|
* Check for an EEH failure at the given token address. Call this
|
|
|
* routine if the result of a read was all 0xff's and you want to
|
|
@@ -655,7 +677,7 @@ unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned lon
|
|
|
}
|
|
|
|
|
|
dn = pci_device_to_OF_node(dev);
|
|
|
- eeh_dn_check_failure (dn, dev);
|
|
|
+ eeh_dn_check_failure(dn, dev);
|
|
|
|
|
|
pci_dev_put(dev);
|
|
|
return val;
|
|
@@ -663,14 +685,15 @@ unsigned long eeh_check_failure(const volatile void __iomem *token, unsigned lon
|
|
|
|
|
|
EXPORT_SYMBOL(eeh_check_failure);
|
|
|
|
|
|
-/* ------------------------------------------------------------- */
|
|
|
-/* The code below deals with error recovery */
|
|
|
|
|
|
/**
|
|
|
- * rtas_pci_enable - enable MMIO or DMA transfers for this slot
|
|
|
+ * rtas_pci_enable - Enable MMIO or DMA transfers for this slot
|
|
|
* @pdn pci device node
|
|
|
+ *
|
|
|
+ * This routine should be called to reenable frozen MMIO or DMA
|
|
|
+ * so that it would work correctly again. It's useful while doing
|
|
|
+ * recovery or log collection on the indicated device.
|
|
|
*/
|
|
|
-
|
|
|
int
|
|
|
rtas_pci_enable(struct pci_dn *pdn, int function)
|
|
|
{
|
|
@@ -692,7 +715,7 @@ rtas_pci_enable(struct pci_dn *pdn, int function)
|
|
|
printk(KERN_WARNING "EEH: Unexpected state change %d, err=%d dn=%s\n",
|
|
|
function, rc, pdn->node->full_name);
|
|
|
|
|
|
- rc = eeh_wait_for_slot_status (pdn, PCI_BUS_RESET_WAIT_MSEC);
|
|
|
+ rc = eeh_wait_for_slot_status(pdn, PCI_BUS_RESET_WAIT_MSEC);
|
|
|
if ((rc == 4) && (function == EEH_THAW_MMIO))
|
|
|
return 0;
|
|
|
|
|
@@ -700,27 +723,25 @@ rtas_pci_enable(struct pci_dn *pdn, int function)
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * rtas_pci_slot_reset - raises/lowers the pci #RST line
|
|
|
- * @pdn pci device node
|
|
|
+ * rtas_pci_slot_reset - Raises/Lowers the pci #RST line
|
|
|
+ * @pdn: pci device node
|
|
|
* @state: 1/0 to raise/lower the #RST
|
|
|
*
|
|
|
* Clear the EEH-frozen condition on a slot. This routine
|
|
|
* asserts the PCI #RST line if the 'state' argument is '1',
|
|
|
* and drops the #RST line if 'state is '0'. This routine is
|
|
|
* safe to call in an interrupt context.
|
|
|
- *
|
|
|
*/
|
|
|
-
|
|
|
static void
|
|
|
rtas_pci_slot_reset(struct pci_dn *pdn, int state)
|
|
|
{
|
|
|
int config_addr;
|
|
|
int rc;
|
|
|
|
|
|
- BUG_ON (pdn==NULL);
|
|
|
+ BUG_ON(pdn==NULL);
|
|
|
|
|
|
if (!pdn->phb) {
|
|
|
- printk (KERN_WARNING "EEH: in slot reset, device node %s has no phb\n",
|
|
|
+ printk(KERN_WARNING "EEH: in slot reset, device node %s has no phb\n",
|
|
|
pdn->node->full_name);
|
|
|
return;
|
|
|
}
|
|
@@ -752,12 +773,12 @@ rtas_pci_slot_reset(struct pci_dn *pdn, int state)
|
|
|
|
|
|
/**
|
|
|
* pcibios_set_pcie_slot_reset - Set PCI-E reset state
|
|
|
- * @dev: pci device struct
|
|
|
- * @state: reset state to enter
|
|
|
+ * @dev: pci device struct
|
|
|
+ * @state: reset state to enter
|
|
|
*
|
|
|
* Return value:
|
|
|
* 0 if success
|
|
|
- **/
|
|
|
+ */
|
|
|
int pcibios_set_pcie_reset_state(struct pci_dev *dev, enum pcie_reset_state state)
|
|
|
{
|
|
|
struct device_node *dn = pci_device_to_OF_node(dev);
|
|
@@ -781,10 +802,62 @@ int pcibios_set_pcie_reset_state(struct pci_dev *dev, enum pcie_reset_state stat
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * rtas_set_slot_reset -- assert the pci #RST line for 1/4 second
|
|
|
- * @pdn: pci device node to be reset.
|
|
|
+ * __eeh_set_pe_freset - Check the required reset for child devices
|
|
|
+ * @parent: parent device
|
|
|
+ * @freset: return value
|
|
|
+ *
|
|
|
+ * Each device might have its preferred reset type: fundamental or
|
|
|
+ * hot reset. The routine is used to collect the information from
|
|
|
+ * the child devices so that they could be reset accordingly.
|
|
|
*/
|
|
|
+void __eeh_set_pe_freset(struct device_node *parent, unsigned int *freset)
|
|
|
+{
|
|
|
+ struct device_node *dn;
|
|
|
+
|
|
|
+ for_each_child_of_node(parent, dn) {
|
|
|
+ if (PCI_DN(dn)) {
|
|
|
+ struct pci_dev *dev = PCI_DN(dn)->pcidev;
|
|
|
+
|
|
|
+ if (dev && dev->driver)
|
|
|
+ *freset |= dev->needs_freset;
|
|
|
+
|
|
|
+ __eeh_set_pe_freset(dn, freset);
|
|
|
+ }
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+/**
|
|
|
+ * eeh_set_pe_freset - Check the required reset for the indicated device and its children
|
|
|
+ * @dn: parent device
|
|
|
+ * @freset: return value
|
|
|
+ *
|
|
|
+ * Each device might have its preferred reset type: fundamental or
|
|
|
+ * hot reset. The routine is used to collected the information for
|
|
|
+ * the indicated device and its children so that the bunch of the
|
|
|
+ * devices could be reset properly.
|
|
|
+ */
|
|
|
+void eeh_set_pe_freset(struct device_node *dn, unsigned int *freset)
|
|
|
+{
|
|
|
+ struct pci_dev *dev;
|
|
|
+ dn = find_device_pe(dn);
|
|
|
+
|
|
|
+ /* Back up one, since config addrs might be shared */
|
|
|
+ if (!pcibios_find_pci_bus(dn) && PCI_DN(dn->parent))
|
|
|
+ dn = dn->parent;
|
|
|
|
|
|
+ dev = PCI_DN(dn)->pcidev;
|
|
|
+ if (dev)
|
|
|
+ *freset |= dev->needs_freset;
|
|
|
+
|
|
|
+ __eeh_set_pe_freset(dn, freset);
|
|
|
+}
|
|
|
+
|
|
|
+/**
|
|
|
+ * __rtas_set_slot_reset - Assert the pci #RST line for 1/4 second
|
|
|
+ * @pdn: pci device node to be reset.
|
|
|
+ *
|
|
|
+ * Assert the PCI #RST line for 1/4 second.
|
|
|
+ */
|
|
|
static void __rtas_set_slot_reset(struct pci_dn *pdn)
|
|
|
{
|
|
|
unsigned int freset = 0;
|
|
@@ -803,25 +876,35 @@ static void __rtas_set_slot_reset(struct pci_dn *pdn)
|
|
|
rtas_pci_slot_reset(pdn, 1);
|
|
|
|
|
|
/* The PCI bus requires that the reset be held high for at least
|
|
|
- * a 100 milliseconds. We wait a bit longer 'just in case'. */
|
|
|
-
|
|
|
+ * a 100 milliseconds. We wait a bit longer 'just in case'.
|
|
|
+ */
|
|
|
#define PCI_BUS_RST_HOLD_TIME_MSEC 250
|
|
|
- msleep (PCI_BUS_RST_HOLD_TIME_MSEC);
|
|
|
+ msleep(PCI_BUS_RST_HOLD_TIME_MSEC);
|
|
|
|
|
|
/* We might get hit with another EEH freeze as soon as the
|
|
|
* pci slot reset line is dropped. Make sure we don't miss
|
|
|
- * these, and clear the flag now. */
|
|
|
- eeh_clear_slot (pdn->node, EEH_MODE_ISOLATED);
|
|
|
+ * these, and clear the flag now.
|
|
|
+ */
|
|
|
+ eeh_clear_slot(pdn->node, EEH_MODE_ISOLATED);
|
|
|
|
|
|
- rtas_pci_slot_reset (pdn, 0);
|
|
|
+ rtas_pci_slot_reset(pdn, 0);
|
|
|
|
|
|
/* After a PCI slot has been reset, the PCI Express spec requires
|
|
|
* a 1.5 second idle time for the bus to stabilize, before starting
|
|
|
- * up traffic. */
|
|
|
+ * up traffic.
|
|
|
+ */
|
|
|
#define PCI_BUS_SETTLE_TIME_MSEC 1800
|
|
|
- msleep (PCI_BUS_SETTLE_TIME_MSEC);
|
|
|
+ msleep(PCI_BUS_SETTLE_TIME_MSEC);
|
|
|
}
|
|
|
|
|
|
+/**
|
|
|
+ * rtas_set_slot_reset - Reset the indicated PE
|
|
|
+ * @pdn: PCI device node
|
|
|
+ *
|
|
|
+ * This routine should be called to reset indicated device, including
|
|
|
+ * PE. A PE might include multiple PCI devices and sometimes PCI bridges
|
|
|
+ * might be involved as well.
|
|
|
+ */
|
|
|
int rtas_set_slot_reset(struct pci_dn *pdn)
|
|
|
{
|
|
|
int i, rc;
|
|
@@ -846,7 +929,6 @@ int rtas_set_slot_reset(struct pci_dn *pdn)
|
|
|
return -1;
|
|
|
}
|
|
|
|
|
|
-/* ------------------------------------------------------- */
|
|
|
/** Save and restore of PCI BARs
|
|
|
*
|
|
|
* Although firmware will set up BARs during boot, it doesn't
|
|
@@ -863,7 +945,7 @@ int rtas_set_slot_reset(struct pci_dn *pdn)
|
|
|
* the expansion ROM base address, the latency timer, and etc.
|
|
|
* from the saved values in the device node.
|
|
|
*/
|
|
|
-static inline void __restore_bars (struct pci_dn *pdn)
|
|
|
+static inline void __restore_bars(struct pci_dn *pdn)
|
|
|
{
|
|
|
int i;
|
|
|
u32 cmd;
|
|
@@ -879,17 +961,18 @@ static inline void __restore_bars (struct pci_dn *pdn)
|
|
|
#define BYTE_SWAP(OFF) (8*((OFF)/4)+3-(OFF))
|
|
|
#define SAVED_BYTE(OFF) (((u8 *)(pdn->config_space))[BYTE_SWAP(OFF)])
|
|
|
|
|
|
- rtas_write_config (pdn, PCI_CACHE_LINE_SIZE, 1,
|
|
|
+ rtas_write_config(pdn, PCI_CACHE_LINE_SIZE, 1,
|
|
|
SAVED_BYTE(PCI_CACHE_LINE_SIZE));
|
|
|
|
|
|
- rtas_write_config (pdn, PCI_LATENCY_TIMER, 1,
|
|
|
+ rtas_write_config(pdn, PCI_LATENCY_TIMER, 1,
|
|
|
SAVED_BYTE(PCI_LATENCY_TIMER));
|
|
|
|
|
|
/* max latency, min grant, interrupt pin and line */
|
|
|
rtas_write_config(pdn, 15*4, 4, pdn->config_space[15]);
|
|
|
|
|
|
/* Restore PERR & SERR bits, some devices require it,
|
|
|
- don't touch the other command bits */
|
|
|
+ * don't touch the other command bits
|
|
|
+ */
|
|
|
rtas_read_config(pdn, PCI_COMMAND, 4, &cmd);
|
|
|
if (pdn->config_space[1] & PCI_COMMAND_PARITY)
|
|
|
cmd |= PCI_COMMAND_PARITY;
|
|
@@ -903,7 +986,8 @@ static inline void __restore_bars (struct pci_dn *pdn)
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * eeh_restore_bars - restore the PCI config space info
|
|
|
+ * eeh_restore_bars - Restore the PCI config space info
|
|
|
+ * @pdn: PCI device node
|
|
|
*
|
|
|
* This routine performs a recursive walk to the children
|
|
|
* of this device as well.
|
|
@@ -915,14 +999,15 @@ void eeh_restore_bars(struct pci_dn *pdn)
|
|
|
return;
|
|
|
|
|
|
if ((pdn->eeh_mode & EEH_MODE_SUPPORTED) && !IS_BRIDGE(pdn->class_code))
|
|
|
- __restore_bars (pdn);
|
|
|
+ __restore_bars(pdn);
|
|
|
|
|
|
for_each_child_of_node(pdn->node, dn)
|
|
|
- eeh_restore_bars (PCI_DN(dn));
|
|
|
+ eeh_restore_bars(PCI_DN(dn));
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * eeh_save_bars - save device bars
|
|
|
+ * eeh_save_bars - Save device bars
|
|
|
+ * @pdn: PCI device node
|
|
|
*
|
|
|
* Save the values of the device bars. Unlike the restore
|
|
|
* routine, this routine is *not* recursive. This is because
|
|
@@ -940,6 +1025,14 @@ static void eeh_save_bars(struct pci_dn *pdn)
|
|
|
rtas_read_config(pdn, i * 4, 4, &pdn->config_space[i]);
|
|
|
}
|
|
|
|
|
|
+/**
|
|
|
+ * rtas_configure_bridge - Configure PCI bridges for the indicated PE
|
|
|
+ * @pdn: PCI device node
|
|
|
+ *
|
|
|
+ * PCI bridges might be included in PE. In order to make the PE work
|
|
|
+ * again. The included PCI bridges should be recovered after the PE
|
|
|
+ * encounters frozen state.
|
|
|
+ */
|
|
|
void
|
|
|
rtas_configure_bridge(struct pci_dn *pdn)
|
|
|
{
|
|
@@ -963,17 +1056,11 @@ rtas_configure_bridge(struct pci_dn *pdn)
|
|
|
BUID_HI(pdn->phb->buid),
|
|
|
BUID_LO(pdn->phb->buid));
|
|
|
if (rc) {
|
|
|
- printk (KERN_WARNING "EEH: Unable to configure device bridge (%d) for %s\n",
|
|
|
+ printk(KERN_WARNING "EEH: Unable to configure device bridge (%d) for %s\n",
|
|
|
rc, pdn->node->full_name);
|
|
|
}
|
|
|
}
|
|
|
|
|
|
-/* ------------------------------------------------------------- */
|
|
|
-/* The code below deals with enabling EEH for devices during the
|
|
|
- * early boot sequence. EEH must be enabled before any PCI probing
|
|
|
- * can be done.
|
|
|
- */
|
|
|
-
|
|
|
#define EEH_ENABLE 1
|
|
|
|
|
|
struct eeh_early_enable_info {
|
|
@@ -981,7 +1068,18 @@ struct eeh_early_enable_info {
|
|
|
unsigned int buid_lo;
|
|
|
};
|
|
|
|
|
|
-static int get_pe_addr (int config_addr,
|
|
|
+/**
|
|
|
+ * get_pe_addr - Retrieve PE address with given BDF address
|
|
|
+ * @config_addr: BDF address
|
|
|
+ * @info: BUID of the associated PHB
|
|
|
+ *
|
|
|
+ * There're 2 kinds of addresses existing in EEH core components:
|
|
|
+ * BDF address and PE address. Besides, there has dedicated platform
|
|
|
+ * dependent function call to retrieve the PE address according to
|
|
|
+ * the given BDF address. Further more, we prefer PE address on BDF
|
|
|
+ * address in EEH core components.
|
|
|
+ */
|
|
|
+static int get_pe_addr(int config_addr,
|
|
|
struct eeh_early_enable_info *info)
|
|
|
{
|
|
|
unsigned int rets[3];
|
|
@@ -990,12 +1088,12 @@ static int get_pe_addr (int config_addr,
|
|
|
/* Use latest config-addr token on power6 */
|
|
|
if (ibm_get_config_addr_info2 != RTAS_UNKNOWN_SERVICE) {
|
|
|
/* Make sure we have a PE in hand */
|
|
|
- ret = rtas_call (ibm_get_config_addr_info2, 4, 2, rets,
|
|
|
+ ret = rtas_call(ibm_get_config_addr_info2, 4, 2, rets,
|
|
|
config_addr, info->buid_hi, info->buid_lo, 1);
|
|
|
if (ret || (rets[0]==0))
|
|
|
return 0;
|
|
|
|
|
|
- ret = rtas_call (ibm_get_config_addr_info2, 4, 2, rets,
|
|
|
+ ret = rtas_call(ibm_get_config_addr_info2, 4, 2, rets,
|
|
|
config_addr, info->buid_hi, info->buid_lo, 0);
|
|
|
if (ret)
|
|
|
return 0;
|
|
@@ -1004,7 +1102,7 @@ static int get_pe_addr (int config_addr,
|
|
|
|
|
|
/* Use older config-addr token on power5 */
|
|
|
if (ibm_get_config_addr_info != RTAS_UNKNOWN_SERVICE) {
|
|
|
- ret = rtas_call (ibm_get_config_addr_info, 4, 2, rets,
|
|
|
+ ret = rtas_call(ibm_get_config_addr_info, 4, 2, rets,
|
|
|
config_addr, info->buid_hi, info->buid_lo, 0);
|
|
|
if (ret)
|
|
|
return 0;
|
|
@@ -1013,7 +1111,15 @@ static int get_pe_addr (int config_addr,
|
|
|
return 0;
|
|
|
}
|
|
|
|
|
|
-/* Enable eeh for the given device node. */
|
|
|
+/**
|
|
|
+ * early_enable_eeh - Early enable EEH on the indicated device
|
|
|
+ * @dn: device node
|
|
|
+ * @data: BUID
|
|
|
+ *
|
|
|
+ * Enable EEH functionality on the specified PCI device. The function
|
|
|
+ * is expected to be called before real PCI probing is done. However,
|
|
|
+ * the PHBs have been initialized at this point.
|
|
|
+ */
|
|
|
static void *early_enable_eeh(struct device_node *dn, void *data)
|
|
|
{
|
|
|
unsigned int rets[3];
|
|
@@ -1047,7 +1153,8 @@ static void *early_enable_eeh(struct device_node *dn, void *data)
|
|
|
pdn->class_code = *class_code;
|
|
|
|
|
|
/* Ok... see if this device supports EEH. Some do, some don't,
|
|
|
- * and the only way to find out is to check each and every one. */
|
|
|
+ * and the only way to find out is to check each and every one.
|
|
|
+ */
|
|
|
regs = of_get_property(dn, "reg", NULL);
|
|
|
if (regs) {
|
|
|
/* First register entry is addr (00BBSS00) */
|
|
@@ -1061,13 +1168,15 @@ static void *early_enable_eeh(struct device_node *dn, void *data)
|
|
|
pdn->eeh_config_addr = regs[0];
|
|
|
|
|
|
/* If the newer, better, ibm,get-config-addr-info is supported,
|
|
|
- * then use that instead. */
|
|
|
+ * then use that instead.
|
|
|
+ */
|
|
|
pdn->eeh_pe_config_addr = get_pe_addr(pdn->eeh_config_addr, info);
|
|
|
|
|
|
/* Some older systems (Power4) allow the
|
|
|
* ibm,set-eeh-option call to succeed even on nodes
|
|
|
* where EEH is not supported. Verify support
|
|
|
- * explicitly. */
|
|
|
+ * explicitly.
|
|
|
+ */
|
|
|
ret = read_slot_reset_state(pdn, rets);
|
|
|
if ((ret == 0) && (rets[1] == 1))
|
|
|
enable = 1;
|
|
@@ -1083,7 +1192,8 @@ static void *early_enable_eeh(struct device_node *dn, void *data)
|
|
|
} else {
|
|
|
|
|
|
/* This device doesn't support EEH, but it may have an
|
|
|
- * EEH parent, in which case we mark it as supported. */
|
|
|
+ * EEH parent, in which case we mark it as supported.
|
|
|
+ */
|
|
|
if (dn->parent && PCI_DN(dn->parent)
|
|
|
&& (PCI_DN(dn->parent)->eeh_mode & EEH_MODE_SUPPORTED)) {
|
|
|
/* Parent supports EEH. */
|
|
@@ -1101,7 +1211,9 @@ static void *early_enable_eeh(struct device_node *dn, void *data)
|
|
|
return NULL;
|
|
|
}
|
|
|
|
|
|
-/*
|
|
|
+/**
|
|
|
+ * eeh_init - EEH initialization
|
|
|
+ *
|
|
|
* Initialize EEH by trying to enable it for all of the adapters in the system.
|
|
|
* As a side effect we can determine here if eeh is supported at all.
|
|
|
* Note that we leave EEH on so failed config cycles won't cause a machine
|
|
@@ -1133,7 +1245,7 @@ void __init eeh_init(void)
|
|
|
ibm_slot_error_detail = rtas_token("ibm,slot-error-detail");
|
|
|
ibm_get_config_addr_info = rtas_token("ibm,get-config-addr-info");
|
|
|
ibm_get_config_addr_info2 = rtas_token("ibm,get-config-addr-info2");
|
|
|
- ibm_configure_bridge = rtas_token ("ibm,configure-bridge");
|
|
|
+ ibm_configure_bridge = rtas_token("ibm,configure-bridge");
|
|
|
ibm_configure_pe = rtas_token("ibm,configure-pe");
|
|
|
|
|
|
if (ibm_set_eeh_option == RTAS_UNKNOWN_SERVICE)
|
|
@@ -1170,7 +1282,7 @@ void __init eeh_init(void)
|
|
|
}
|
|
|
|
|
|
/**
|
|
|
- * eeh_add_device_early - enable EEH for the indicated device_node
|
|
|
+ * eeh_add_device_early - Enable EEH for the indicated device_node
|
|
|
* @dn: device node for which to set up EEH
|
|
|
*
|
|
|
* This routine must be used to perform EEH initialization for PCI
|
|
@@ -1199,6 +1311,14 @@ static void eeh_add_device_early(struct device_node *dn)
|
|
|
early_enable_eeh(dn, &info);
|
|
|
}
|
|
|
|
|
|
+/**
|
|
|
+ * eeh_add_device_tree_early - Enable EEH for the indicated device
|
|
|
+ * @dn: device node
|
|
|
+ *
|
|
|
+ * This routine must be used to perform EEH initialization for the
|
|
|
+ * indicated PCI device that was added after system boot (e.g.
|
|
|
+ * hotplug, dlpar).
|
|
|
+ */
|
|
|
void eeh_add_device_tree_early(struct device_node *dn)
|
|
|
{
|
|
|
struct device_node *sib;
|
|
@@ -1210,7 +1330,7 @@ void eeh_add_device_tree_early(struct device_node *dn)
|
|
|
EXPORT_SYMBOL_GPL(eeh_add_device_tree_early);
|
|
|
|
|
|
/**
|
|
|
- * eeh_add_device_late - perform EEH initialization for the indicated pci device
|
|
|
+ * eeh_add_device_late - Perform EEH initialization for the indicated pci device
|
|
|
* @dev: pci device for which to set up EEH
|
|
|
*
|
|
|
* This routine must be used to complete EEH initialization for PCI
|
|
@@ -1234,13 +1354,21 @@ static void eeh_add_device_late(struct pci_dev *dev)
|
|
|
}
|
|
|
WARN_ON(pdn->pcidev);
|
|
|
|
|
|
- pci_dev_get (dev);
|
|
|
+ pci_dev_get(dev);
|
|
|
pdn->pcidev = dev;
|
|
|
|
|
|
pci_addr_cache_insert_device(dev);
|
|
|
eeh_sysfs_add_device(dev);
|
|
|
}
|
|
|
|
|
|
+/**
|
|
|
+ * eeh_add_device_tree_late - Perform EEH initialization for the indicated PCI bus
|
|
|
+ * @bus: PCI bus
|
|
|
+ *
|
|
|
+ * This routine must be used to perform EEH initialization for PCI
|
|
|
+ * devices which are attached to the indicated PCI bus. The PCI bus
|
|
|
+ * is added after system boot through hotplug or dlpar.
|
|
|
+ */
|
|
|
void eeh_add_device_tree_late(struct pci_bus *bus)
|
|
|
{
|
|
|
struct pci_dev *dev;
|
|
@@ -1257,7 +1385,7 @@ void eeh_add_device_tree_late(struct pci_bus *bus)
|
|
|
EXPORT_SYMBOL_GPL(eeh_add_device_tree_late);
|
|
|
|
|
|
/**
|
|
|
- * eeh_remove_device - undo EEH setup for the indicated pci device
|
|
|
+ * eeh_remove_device - Undo EEH setup for the indicated pci device
|
|
|
* @dev: pci device to be removed
|
|
|
*
|
|
|
* This routine should be called when a device is removed from
|
|
@@ -1281,12 +1409,20 @@ static void eeh_remove_device(struct pci_dev *dev)
|
|
|
return;
|
|
|
}
|
|
|
PCI_DN(dn)->pcidev = NULL;
|
|
|
- pci_dev_put (dev);
|
|
|
+ pci_dev_put(dev);
|
|
|
|
|
|
pci_addr_cache_remove_device(dev);
|
|
|
eeh_sysfs_remove_device(dev);
|
|
|
}
|
|
|
|
|
|
+/**
|
|
|
+ * eeh_remove_bus_device - Undo EEH setup for the indicated PCI device
|
|
|
+ * @dev: PCI device
|
|
|
+ *
|
|
|
+ * This routine must be called when a device is removed from the
|
|
|
+ * running system through hotplug or dlpar. The corresponding
|
|
|
+ * PCI address cache will be removed.
|
|
|
+ */
|
|
|
void eeh_remove_bus_device(struct pci_dev *dev)
|
|
|
{
|
|
|
struct pci_bus *bus = dev->subordinate;
|