Commit 807a827d authored by Gavin Shan, committed by Benjamin Herrenschmidt

powerpc/eeh: Keep PE during hotplug

When we do normal hotplug, the PE (shadow EEH structure) shouldn't be
kept around.

However, we need to keep it if the hotplug is an artificial one caused by
EEH error recovery.

Since we remove the EEH device through the PCI hook pcibios_release_device(),
the flag "purge_pe" passed to various functions is meaningless. So the patch
removes the meaningless flag and introduces a new flag, "EEH_PE_KEEP",
to save the PE while doing hotplug during EEH error recovery.
Signed-off-by: Gavin Shan <shangw@linux.vnet.ibm.com>
Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
parent c7b51bce
...@@ -55,6 +55,8 @@ struct device_node; ...@@ -55,6 +55,8 @@ struct device_node;
#define EEH_PE_RECOVERING (1 << 1) /* Recovering PE */ #define EEH_PE_RECOVERING (1 << 1) /* Recovering PE */
#define EEH_PE_PHB_DEAD (1 << 2) /* Dead PHB */ #define EEH_PE_PHB_DEAD (1 << 2) /* Dead PHB */
#define EEH_PE_KEEP (1 << 8) /* Keep PE on hotplug */
struct eeh_pe { struct eeh_pe {
int type; /* PE type: PHB/Bus/Device */ int type; /* PE type: PHB/Bus/Device */
int state; /* PE EEH dependent mode */ int state; /* PE EEH dependent mode */
...@@ -193,7 +195,7 @@ int eeh_phb_pe_create(struct pci_controller *phb); ...@@ -193,7 +195,7 @@ int eeh_phb_pe_create(struct pci_controller *phb);
struct eeh_pe *eeh_phb_pe_get(struct pci_controller *phb); struct eeh_pe *eeh_phb_pe_get(struct pci_controller *phb);
struct eeh_pe *eeh_pe_get(struct eeh_dev *edev); struct eeh_pe *eeh_pe_get(struct eeh_dev *edev);
int eeh_add_to_parent_pe(struct eeh_dev *edev); int eeh_add_to_parent_pe(struct eeh_dev *edev);
int eeh_rmv_from_parent_pe(struct eeh_dev *edev, int purge_pe); int eeh_rmv_from_parent_pe(struct eeh_dev *edev);
void eeh_pe_update_time_stamp(struct eeh_pe *pe); void eeh_pe_update_time_stamp(struct eeh_pe *pe);
void *eeh_pe_dev_traverse(struct eeh_pe *root, void *eeh_pe_dev_traverse(struct eeh_pe *root,
eeh_traverse_func fn, void *flag); eeh_traverse_func fn, void *flag);
...@@ -214,8 +216,7 @@ void eeh_add_device_tree_early(struct device_node *); ...@@ -214,8 +216,7 @@ void eeh_add_device_tree_early(struct device_node *);
void eeh_add_device_late(struct pci_dev *); void eeh_add_device_late(struct pci_dev *);
void eeh_add_device_tree_late(struct pci_bus *); void eeh_add_device_tree_late(struct pci_bus *);
void eeh_add_sysfs_files(struct pci_bus *); void eeh_add_sysfs_files(struct pci_bus *);
void eeh_remove_device(struct pci_dev *, int); void eeh_remove_device(struct pci_dev *);
void eeh_remove_bus_device(struct pci_dev *, int);
/** /**
* EEH_POSSIBLE_ERROR() -- test for possible MMIO failure. * EEH_POSSIBLE_ERROR() -- test for possible MMIO failure.
...@@ -265,9 +266,7 @@ static inline void eeh_add_device_tree_late(struct pci_bus *bus) { } ...@@ -265,9 +266,7 @@ static inline void eeh_add_device_tree_late(struct pci_bus *bus) { }
static inline void eeh_add_sysfs_files(struct pci_bus *bus) { } static inline void eeh_add_sysfs_files(struct pci_bus *bus) { }
static inline void eeh_remove_device(struct pci_dev *dev, int purge_pe) { } static inline void eeh_remove_device(struct pci_dev *dev) { }
static inline void eeh_remove_bus_device(struct pci_dev *dev, int purge_pe) { }
#define EEH_POSSIBLE_ERROR(val, type) (0) #define EEH_POSSIBLE_ERROR(val, type) (0)
#define EEH_IO_ERROR_VALUE(size) (-1UL) #define EEH_IO_ERROR_VALUE(size) (-1UL)
......
...@@ -209,7 +209,6 @@ static inline struct eeh_dev *of_node_to_eeh_dev(struct device_node *dn) ...@@ -209,7 +209,6 @@ static inline struct eeh_dev *of_node_to_eeh_dev(struct device_node *dn)
extern struct pci_bus *pcibios_find_pci_bus(struct device_node *dn); extern struct pci_bus *pcibios_find_pci_bus(struct device_node *dn);
/** Remove all of the PCI devices under this bus */ /** Remove all of the PCI devices under this bus */
extern void __pcibios_remove_pci_devices(struct pci_bus *bus, int purge_pe);
extern void pcibios_remove_pci_devices(struct pci_bus *bus); extern void pcibios_remove_pci_devices(struct pci_bus *bus);
/** Discover new pci devices under this bus, and add them */ /** Discover new pci devices under this bus, and add them */
......
...@@ -964,7 +964,6 @@ EXPORT_SYMBOL_GPL(eeh_add_sysfs_files); ...@@ -964,7 +964,6 @@ EXPORT_SYMBOL_GPL(eeh_add_sysfs_files);
/** /**
* eeh_remove_device - Undo EEH setup for the indicated pci device * eeh_remove_device - Undo EEH setup for the indicated pci device
* @dev: pci device to be removed * @dev: pci device to be removed
* @purge_pe: remove the PE or not
* *
* This routine should be called when a device is removed from * This routine should be called when a device is removed from
* a running system (e.g. by hotplug or dlpar). It unregisters * a running system (e.g. by hotplug or dlpar). It unregisters
...@@ -972,7 +971,7 @@ EXPORT_SYMBOL_GPL(eeh_add_sysfs_files); ...@@ -972,7 +971,7 @@ EXPORT_SYMBOL_GPL(eeh_add_sysfs_files);
* this device will no longer be detected after this call; thus, * this device will no longer be detected after this call; thus,
* i/o errors affecting this slot may leave this device unusable. * i/o errors affecting this slot may leave this device unusable.
*/ */
void eeh_remove_device(struct pci_dev *dev, int purge_pe) void eeh_remove_device(struct pci_dev *dev)
{ {
struct eeh_dev *edev; struct eeh_dev *edev;
...@@ -990,34 +989,11 @@ void eeh_remove_device(struct pci_dev *dev, int purge_pe) ...@@ -990,34 +989,11 @@ void eeh_remove_device(struct pci_dev *dev, int purge_pe)
edev->pdev = NULL; edev->pdev = NULL;
dev->dev.archdata.edev = NULL; dev->dev.archdata.edev = NULL;
eeh_rmv_from_parent_pe(edev, purge_pe); eeh_rmv_from_parent_pe(edev);
eeh_addr_cache_rmv_dev(dev); eeh_addr_cache_rmv_dev(dev);
eeh_sysfs_remove_device(dev); eeh_sysfs_remove_device(dev);
} }
/**
* eeh_remove_bus_device - Undo EEH setup for the indicated PCI device
* @dev: PCI device
* @purge_pe: remove the corresponding PE or not
*
* This routine must be called when a device is removed from the
* running system through hotplug or dlpar. The corresponding
* PCI address cache will be removed.
*/
void eeh_remove_bus_device(struct pci_dev *dev, int purge_pe)
{
struct pci_bus *bus = dev->subordinate;
struct pci_dev *child, *tmp;
eeh_remove_device(dev, purge_pe);
if (bus && dev->hdr_type == PCI_HEADER_TYPE_BRIDGE) {
list_for_each_entry_safe(child, tmp, &bus->devices, bus_list)
eeh_remove_bus_device(child, purge_pe);
}
}
EXPORT_SYMBOL_GPL(eeh_remove_bus_device);
static int proc_eeh_show(struct seq_file *m, void *v) static int proc_eeh_show(struct seq_file *m, void *v)
{ {
if (0 == eeh_subsystem_enabled) { if (0 == eeh_subsystem_enabled) {
......
...@@ -362,8 +362,10 @@ static int eeh_reset_device(struct eeh_pe *pe, struct pci_bus *bus) ...@@ -362,8 +362,10 @@ static int eeh_reset_device(struct eeh_pe *pe, struct pci_bus *bus)
* devices are expected to be attached soon when calling * devices are expected to be attached soon when calling
* into pcibios_add_pci_devices(). * into pcibios_add_pci_devices().
*/ */
if (bus) if (bus) {
__pcibios_remove_pci_devices(bus, 0); eeh_pe_state_mark(pe, EEH_PE_KEEP);
pcibios_remove_pci_devices(bus);
}
/* Reset the pci controller. (Asserts RST#; resets config space). /* Reset the pci controller. (Asserts RST#; resets config space).
* Reconfigure bridges and devices. Don't try to bring the system * Reconfigure bridges and devices. Don't try to bring the system
...@@ -386,6 +388,7 @@ static int eeh_reset_device(struct eeh_pe *pe, struct pci_bus *bus) ...@@ -386,6 +388,7 @@ static int eeh_reset_device(struct eeh_pe *pe, struct pci_bus *bus)
if (bus) { if (bus) {
ssleep(5); ssleep(5);
pcibios_add_pci_devices(bus); pcibios_add_pci_devices(bus);
eeh_pe_state_clear(pe, EEH_PE_KEEP);
} }
pe->tstamp = tstamp; pe->tstamp = tstamp;
......
...@@ -333,7 +333,7 @@ int eeh_add_to_parent_pe(struct eeh_dev *edev) ...@@ -333,7 +333,7 @@ int eeh_add_to_parent_pe(struct eeh_dev *edev)
while (parent) { while (parent) {
if (!(parent->type & EEH_PE_INVALID)) if (!(parent->type & EEH_PE_INVALID))
break; break;
parent->type &= ~EEH_PE_INVALID; parent->type &= ~(EEH_PE_INVALID | EEH_PE_KEEP);
parent = parent->parent; parent = parent->parent;
} }
pr_debug("EEH: Add %s to Device PE#%x, Parent PE#%x\n", pr_debug("EEH: Add %s to Device PE#%x, Parent PE#%x\n",
...@@ -397,14 +397,13 @@ int eeh_add_to_parent_pe(struct eeh_dev *edev) ...@@ -397,14 +397,13 @@ int eeh_add_to_parent_pe(struct eeh_dev *edev)
/** /**
* eeh_rmv_from_parent_pe - Remove one EEH device from the associated PE * eeh_rmv_from_parent_pe - Remove one EEH device from the associated PE
* @edev: EEH device * @edev: EEH device
* @purge_pe: remove PE or not
* *
* The PE hierarchy tree might be changed when doing PCI hotplug. * The PE hierarchy tree might be changed when doing PCI hotplug.
* Also, the PCI devices or buses could be removed from the system * Also, the PCI devices or buses could be removed from the system
* during EEH recovery. So we have to call the function remove the * during EEH recovery. So we have to call the function remove the
* corresponding PE accordingly if necessary. * corresponding PE accordingly if necessary.
*/ */
int eeh_rmv_from_parent_pe(struct eeh_dev *edev, int purge_pe) int eeh_rmv_from_parent_pe(struct eeh_dev *edev)
{ {
struct eeh_pe *pe, *parent, *child; struct eeh_pe *pe, *parent, *child;
int cnt; int cnt;
...@@ -431,7 +430,7 @@ int eeh_rmv_from_parent_pe(struct eeh_dev *edev, int purge_pe) ...@@ -431,7 +430,7 @@ int eeh_rmv_from_parent_pe(struct eeh_dev *edev, int purge_pe)
if (pe->type & EEH_PE_PHB) if (pe->type & EEH_PE_PHB)
break; break;
if (purge_pe) { if (!(pe->state & EEH_PE_KEEP)) {
if (list_empty(&pe->edevs) && if (list_empty(&pe->edevs) &&
list_empty(&pe->child_list)) { list_empty(&pe->child_list)) {
list_del(&pe->child); list_del(&pe->child);
......
...@@ -29,49 +29,33 @@ ...@@ -29,49 +29,33 @@
*/ */
void pcibios_release_device(struct pci_dev *dev) void pcibios_release_device(struct pci_dev *dev)
{ {
eeh_remove_device(dev, 1); eeh_remove_device(dev);
} }
/** /**
* __pcibios_remove_pci_devices - remove all devices under this bus * pcibios_remove_pci_devices - remove all devices under this bus
* @bus: the indicated PCI bus * @bus: the indicated PCI bus
* @purge_pe: destroy the PE on removal of PCI devices
* *
* Remove all of the PCI devices under this bus both from the * Remove all of the PCI devices under this bus both from the
* linux pci device tree, and from the powerpc EEH address cache. * linux pci device tree, and from the powerpc EEH address cache.
* By default, the corresponding PE will be destroied during the
* normal PCI hotplug path. For PCI hotplug during EEH recovery,
* the corresponding PE won't be destroied and deallocated.
*/ */
void __pcibios_remove_pci_devices(struct pci_bus *bus, int purge_pe) void pcibios_remove_pci_devices(struct pci_bus *bus)
{ {
struct pci_dev *dev, *tmp; struct pci_dev *dev, *tmp;
struct pci_bus *child_bus; struct pci_bus *child_bus;
/* First go down child busses */ /* First go down child busses */
list_for_each_entry(child_bus, &bus->children, node) list_for_each_entry(child_bus, &bus->children, node)
__pcibios_remove_pci_devices(child_bus, purge_pe); pcibios_remove_pci_devices(child_bus);
pr_debug("PCI: Removing devices on bus %04x:%02x\n", pr_debug("PCI: Removing devices on bus %04x:%02x\n",
pci_domain_nr(bus), bus->number); pci_domain_nr(bus), bus->number);
list_for_each_entry_safe(dev, tmp, &bus->devices, bus_list) { list_for_each_entry_safe(dev, tmp, &bus->devices, bus_list) {
pr_debug(" * Removing %s...\n", pci_name(dev)); pr_debug(" Removing %s...\n", pci_name(dev));
eeh_remove_bus_device(dev, purge_pe);
pci_stop_and_remove_bus_device(dev); pci_stop_and_remove_bus_device(dev);
} }
} }
/**
* pcibios_remove_pci_devices - remove all devices under this bus
* @bus: the indicated PCI bus
*
* Remove all of the PCI devices under this bus both from the
* linux pci device tree, and from the powerpc EEH address cache.
*/
void pcibios_remove_pci_devices(struct pci_bus *bus)
{
__pcibios_remove_pci_devices(bus, 1);
}
EXPORT_SYMBOL_GPL(pcibios_remove_pci_devices); EXPORT_SYMBOL_GPL(pcibios_remove_pci_devices);
/** /**
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment