cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

pnv_php.c (25496B)


      1// SPDX-License-Identifier: GPL-2.0+
      2/*
      3 * PCI Hotplug Driver for PowerPC PowerNV platform.
      4 *
      5 * Copyright Gavin Shan, IBM Corporation 2016.
      6 */
      7
      8#include <linux/libfdt.h>
      9#include <linux/module.h>
     10#include <linux/pci.h>
     11#include <linux/pci_hotplug.h>
     12#include <linux/of_fdt.h>
     13
     14#include <asm/opal.h>
     15#include <asm/pnv-pci.h>
     16#include <asm/ppc-pci.h>
     17
     18#define DRIVER_VERSION	"0.1"
     19#define DRIVER_AUTHOR	"Gavin Shan, IBM Corporation"
     20#define DRIVER_DESC	"PowerPC PowerNV PCI Hotplug Driver"
     21
     22#define SLOT_WARN(sl, x...) \
     23	((sl)->pdev ? pci_warn((sl)->pdev, x) : dev_warn(&(sl)->bus->dev, x))
     24
     25struct pnv_php_event {
     26	bool			added;
     27	struct pnv_php_slot	*php_slot;
     28	struct work_struct	work;
     29};
     30
     31static LIST_HEAD(pnv_php_slot_list);
     32static DEFINE_SPINLOCK(pnv_php_lock);
     33
     34static void pnv_php_register(struct device_node *dn);
     35static void pnv_php_unregister_one(struct device_node *dn);
     36static void pnv_php_unregister(struct device_node *dn);
     37
     38static void pnv_php_disable_irq(struct pnv_php_slot *php_slot,
     39				bool disable_device)
     40{
     41	struct pci_dev *pdev = php_slot->pdev;
     42	int irq = php_slot->irq;
     43	u16 ctrl;
     44
     45	if (php_slot->irq > 0) {
     46		pcie_capability_read_word(pdev, PCI_EXP_SLTCTL, &ctrl);
     47		ctrl &= ~(PCI_EXP_SLTCTL_HPIE |
     48			  PCI_EXP_SLTCTL_PDCE |
     49			  PCI_EXP_SLTCTL_DLLSCE);
     50		pcie_capability_write_word(pdev, PCI_EXP_SLTCTL, ctrl);
     51
     52		free_irq(php_slot->irq, php_slot);
     53		php_slot->irq = 0;
     54	}
     55
     56	if (php_slot->wq) {
     57		destroy_workqueue(php_slot->wq);
     58		php_slot->wq = NULL;
     59	}
     60
     61	if (disable_device || irq > 0) {
     62		if (pdev->msix_enabled)
     63			pci_disable_msix(pdev);
     64		else if (pdev->msi_enabled)
     65			pci_disable_msi(pdev);
     66
     67		pci_disable_device(pdev);
     68	}
     69}
     70
     71static void pnv_php_free_slot(struct kref *kref)
     72{
     73	struct pnv_php_slot *php_slot = container_of(kref,
     74					struct pnv_php_slot, kref);
     75
     76	WARN_ON(!list_empty(&php_slot->children));
     77	pnv_php_disable_irq(php_slot, false);
     78	kfree(php_slot->name);
     79	kfree(php_slot);
     80}
     81
     82static inline void pnv_php_put_slot(struct pnv_php_slot *php_slot)
     83{
     84
     85	if (!php_slot)
     86		return;
     87
     88	kref_put(&php_slot->kref, pnv_php_free_slot);
     89}
     90
     91static struct pnv_php_slot *pnv_php_match(struct device_node *dn,
     92					  struct pnv_php_slot *php_slot)
     93{
     94	struct pnv_php_slot *target, *tmp;
     95
     96	if (php_slot->dn == dn) {
     97		kref_get(&php_slot->kref);
     98		return php_slot;
     99	}
    100
    101	list_for_each_entry(tmp, &php_slot->children, link) {
    102		target = pnv_php_match(dn, tmp);
    103		if (target)
    104			return target;
    105	}
    106
    107	return NULL;
    108}
    109
    110struct pnv_php_slot *pnv_php_find_slot(struct device_node *dn)
    111{
    112	struct pnv_php_slot *php_slot, *tmp;
    113	unsigned long flags;
    114
    115	spin_lock_irqsave(&pnv_php_lock, flags);
    116	list_for_each_entry(tmp, &pnv_php_slot_list, link) {
    117		php_slot = pnv_php_match(dn, tmp);
    118		if (php_slot) {
    119			spin_unlock_irqrestore(&pnv_php_lock, flags);
    120			return php_slot;
    121		}
    122	}
    123	spin_unlock_irqrestore(&pnv_php_lock, flags);
    124
    125	return NULL;
    126}
    127EXPORT_SYMBOL_GPL(pnv_php_find_slot);
    128
    129/*
    130 * Remove pdn for all children of the indicated device node.
    131 * The function should remove pdn in a depth-first manner.
    132 */
    133static void pnv_php_rmv_pdns(struct device_node *dn)
    134{
    135	struct device_node *child;
    136
    137	for_each_child_of_node(dn, child) {
    138		pnv_php_rmv_pdns(child);
    139
    140		pci_remove_device_node_info(child);
    141	}
    142}
    143
    144/*
    145 * Detach all child nodes of the indicated device nodes. The
    146 * function should handle device nodes in depth-first manner.
    147 *
    148 * We should not invoke of_node_release() as the memory for
    149 * individual device node is part of large memory block. The
    150 * large block is allocated from memblock (system bootup) or
    151 * kmalloc() when unflattening the device tree by OF changeset.
    152 * We can not free the large block allocated from memblock. For
    153 * later case, it should be released at once.
    154 */
    155static void pnv_php_detach_device_nodes(struct device_node *parent)
    156{
    157	struct device_node *dn;
    158
    159	for_each_child_of_node(parent, dn) {
    160		pnv_php_detach_device_nodes(dn);
    161
    162		of_node_put(dn);
    163		of_detach_node(dn);
    164	}
    165}
    166
    167static void pnv_php_rmv_devtree(struct pnv_php_slot *php_slot)
    168{
    169	pnv_php_rmv_pdns(php_slot->dn);
    170
    171	/*
    172	 * Decrease the refcount if the device nodes were created
    173	 * through OF changeset before detaching them.
    174	 */
    175	if (php_slot->fdt)
    176		of_changeset_destroy(&php_slot->ocs);
    177	pnv_php_detach_device_nodes(php_slot->dn);
    178
    179	if (php_slot->fdt) {
    180		kfree(php_slot->dt);
    181		kfree(php_slot->fdt);
    182		php_slot->dt        = NULL;
    183		php_slot->dn->child = NULL;
    184		php_slot->fdt       = NULL;
    185	}
    186}
    187
    188/*
    189 * As the nodes in OF changeset are applied in reverse order, we
    190 * need revert the nodes in advance so that we have correct node
    191 * order after the changeset is applied.
    192 */
    193static void pnv_php_reverse_nodes(struct device_node *parent)
    194{
    195	struct device_node *child, *next;
    196
    197	/* In-depth first */
    198	for_each_child_of_node(parent, child)
    199		pnv_php_reverse_nodes(child);
    200
    201	/* Reverse the nodes in the child list */
    202	child = parent->child;
    203	parent->child = NULL;
    204	while (child) {
    205		next = child->sibling;
    206
    207		child->sibling = parent->child;
    208		parent->child = child;
    209		child = next;
    210	}
    211}
    212
    213static int pnv_php_populate_changeset(struct of_changeset *ocs,
    214				      struct device_node *dn)
    215{
    216	struct device_node *child;
    217	int ret = 0;
    218
    219	for_each_child_of_node(dn, child) {
    220		ret = of_changeset_attach_node(ocs, child);
    221		if (ret) {
    222			of_node_put(child);
    223			break;
    224		}
    225
    226		ret = pnv_php_populate_changeset(ocs, child);
    227		if (ret) {
    228			of_node_put(child);
    229			break;
    230		}
    231	}
    232
    233	return ret;
    234}
    235
    236static void *pnv_php_add_one_pdn(struct device_node *dn, void *data)
    237{
    238	struct pci_controller *hose = (struct pci_controller *)data;
    239	struct pci_dn *pdn;
    240
    241	pdn = pci_add_device_node_info(hose, dn);
    242	if (!pdn)
    243		return ERR_PTR(-ENOMEM);
    244
    245	return NULL;
    246}
    247
    248static void pnv_php_add_pdns(struct pnv_php_slot *slot)
    249{
    250	struct pci_controller *hose = pci_bus_to_host(slot->bus);
    251
    252	pci_traverse_device_nodes(slot->dn, pnv_php_add_one_pdn, hose);
    253}
    254
    255static int pnv_php_add_devtree(struct pnv_php_slot *php_slot)
    256{
    257	void *fdt, *fdt1, *dt;
    258	int ret;
    259
    260	/* We don't know the FDT blob size. We try to get it through
    261	 * maximal memory chunk and then copy it to another chunk that
    262	 * fits the real size.
    263	 */
    264	fdt1 = kzalloc(0x10000, GFP_KERNEL);
    265	if (!fdt1) {
    266		ret = -ENOMEM;
    267		goto out;
    268	}
    269
    270	ret = pnv_pci_get_device_tree(php_slot->dn->phandle, fdt1, 0x10000);
    271	if (ret) {
    272		SLOT_WARN(php_slot, "Error %d getting FDT blob\n", ret);
    273		goto free_fdt1;
    274	}
    275
    276	fdt = kmemdup(fdt1, fdt_totalsize(fdt1), GFP_KERNEL);
    277	if (!fdt) {
    278		ret = -ENOMEM;
    279		goto free_fdt1;
    280	}
    281
    282	/* Unflatten device tree blob */
    283	dt = of_fdt_unflatten_tree(fdt, php_slot->dn, NULL);
    284	if (!dt) {
    285		ret = -EINVAL;
    286		SLOT_WARN(php_slot, "Cannot unflatten FDT\n");
    287		goto free_fdt;
    288	}
    289
    290	/* Initialize and apply the changeset */
    291	of_changeset_init(&php_slot->ocs);
    292	pnv_php_reverse_nodes(php_slot->dn);
    293	ret = pnv_php_populate_changeset(&php_slot->ocs, php_slot->dn);
    294	if (ret) {
    295		pnv_php_reverse_nodes(php_slot->dn);
    296		SLOT_WARN(php_slot, "Error %d populating changeset\n",
    297			  ret);
    298		goto free_dt;
    299	}
    300
    301	php_slot->dn->child = NULL;
    302	ret = of_changeset_apply(&php_slot->ocs);
    303	if (ret) {
    304		SLOT_WARN(php_slot, "Error %d applying changeset\n", ret);
    305		goto destroy_changeset;
    306	}
    307
    308	/* Add device node firmware data */
    309	pnv_php_add_pdns(php_slot);
    310	php_slot->fdt = fdt;
    311	php_slot->dt  = dt;
    312	kfree(fdt1);
    313	goto out;
    314
    315destroy_changeset:
    316	of_changeset_destroy(&php_slot->ocs);
    317free_dt:
    318	kfree(dt);
    319	php_slot->dn->child = NULL;
    320free_fdt:
    321	kfree(fdt);
    322free_fdt1:
    323	kfree(fdt1);
    324out:
    325	return ret;
    326}
    327
    328static inline struct pnv_php_slot *to_pnv_php_slot(struct hotplug_slot *slot)
    329{
    330	return container_of(slot, struct pnv_php_slot, slot);
    331}
    332
    333int pnv_php_set_slot_power_state(struct hotplug_slot *slot,
    334				 uint8_t state)
    335{
    336	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    337	struct opal_msg msg;
    338	int ret;
    339
    340	ret = pnv_pci_set_power_state(php_slot->id, state, &msg);
    341	if (ret > 0) {
    342		if (be64_to_cpu(msg.params[1]) != php_slot->dn->phandle	||
    343		    be64_to_cpu(msg.params[2]) != state) {
    344			SLOT_WARN(php_slot, "Wrong msg (%lld, %lld, %lld)\n",
    345				  be64_to_cpu(msg.params[1]),
    346				  be64_to_cpu(msg.params[2]),
    347				  be64_to_cpu(msg.params[3]));
    348			return -ENOMSG;
    349		}
    350		if (be64_to_cpu(msg.params[3]) != OPAL_SUCCESS) {
    351			ret = -ENODEV;
    352			goto error;
    353		}
    354	} else if (ret < 0) {
    355		goto error;
    356	}
    357
    358	if (state == OPAL_PCI_SLOT_POWER_OFF || state == OPAL_PCI_SLOT_OFFLINE)
    359		pnv_php_rmv_devtree(php_slot);
    360	else
    361		ret = pnv_php_add_devtree(php_slot);
    362
    363	return ret;
    364
    365error:
    366	SLOT_WARN(php_slot, "Error %d powering %s\n",
    367		  ret, (state == OPAL_PCI_SLOT_POWER_ON) ? "on" : "off");
    368	return ret;
    369}
    370EXPORT_SYMBOL_GPL(pnv_php_set_slot_power_state);
    371
    372static int pnv_php_get_power_state(struct hotplug_slot *slot, u8 *state)
    373{
    374	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    375	uint8_t power_state = OPAL_PCI_SLOT_POWER_ON;
    376	int ret;
    377
    378	/*
    379	 * Retrieve power status from firmware. If we fail
    380	 * getting that, the power status fails back to
    381	 * be on.
    382	 */
    383	ret = pnv_pci_get_power_state(php_slot->id, &power_state);
    384	if (ret) {
    385		SLOT_WARN(php_slot, "Error %d getting power status\n",
    386			  ret);
    387	} else {
    388		*state = power_state;
    389	}
    390
    391	return 0;
    392}
    393
    394static int pnv_php_get_adapter_state(struct hotplug_slot *slot, u8 *state)
    395{
    396	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    397	uint8_t presence = OPAL_PCI_SLOT_EMPTY;
    398	int ret;
    399
    400	/*
    401	 * Retrieve presence status from firmware. If we can't
    402	 * get that, it will fail back to be empty.
    403	 */
    404	ret = pnv_pci_get_presence_state(php_slot->id, &presence);
    405	if (ret >= 0) {
    406		*state = presence;
    407		ret = 0;
    408	} else {
    409		SLOT_WARN(php_slot, "Error %d getting presence\n", ret);
    410	}
    411
    412	return ret;
    413}
    414
    415static int pnv_php_get_attention_state(struct hotplug_slot *slot, u8 *state)
    416{
    417	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    418
    419	*state = php_slot->attention_state;
    420	return 0;
    421}
    422
    423static int pnv_php_set_attention_state(struct hotplug_slot *slot, u8 state)
    424{
    425	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    426	struct pci_dev *bridge = php_slot->pdev;
    427	u16 new, mask;
    428
    429	php_slot->attention_state = state;
    430	if (!bridge)
    431		return 0;
    432
    433	mask = PCI_EXP_SLTCTL_AIC;
    434
    435	if (state)
    436		new = PCI_EXP_SLTCTL_ATTN_IND_ON;
    437	else
    438		new = PCI_EXP_SLTCTL_ATTN_IND_OFF;
    439
    440	pcie_capability_clear_and_set_word(bridge, PCI_EXP_SLTCTL, mask, new);
    441
    442	return 0;
    443}
    444
    445static int pnv_php_enable(struct pnv_php_slot *php_slot, bool rescan)
    446{
    447	struct hotplug_slot *slot = &php_slot->slot;
    448	uint8_t presence = OPAL_PCI_SLOT_EMPTY;
    449	uint8_t power_status = OPAL_PCI_SLOT_POWER_ON;
    450	int ret;
    451
    452	/* Check if the slot has been configured */
    453	if (php_slot->state != PNV_PHP_STATE_REGISTERED)
    454		return 0;
    455
    456	/* Retrieve slot presence status */
    457	ret = pnv_php_get_adapter_state(slot, &presence);
    458	if (ret)
    459		return ret;
    460
    461	/*
    462	 * Proceed if there have nothing behind the slot. However,
    463	 * we should leave the slot in registered state at the
    464	 * beginning. Otherwise, the PCI devices inserted afterwards
    465	 * won't be probed and populated.
    466	 */
    467	if (presence == OPAL_PCI_SLOT_EMPTY) {
    468		if (!php_slot->power_state_check) {
    469			php_slot->power_state_check = true;
    470
    471			return 0;
    472		}
    473
    474		goto scan;
    475	}
    476
    477	/*
    478	 * If the power supply to the slot is off, we can't detect
    479	 * adapter presence state. That means we have to turn the
    480	 * slot on before going to probe slot's presence state.
    481	 *
    482	 * On the first time, we don't change the power status to
    483	 * boost system boot with assumption that the firmware
    484	 * supplies consistent slot power status: empty slot always
    485	 * has its power off and non-empty slot has its power on.
    486	 */
    487	if (!php_slot->power_state_check) {
    488		php_slot->power_state_check = true;
    489
    490		ret = pnv_php_get_power_state(slot, &power_status);
    491		if (ret)
    492			return ret;
    493
    494		if (power_status != OPAL_PCI_SLOT_POWER_ON)
    495			return 0;
    496	}
    497
    498	/* Check the power status. Scan the slot if it is already on */
    499	ret = pnv_php_get_power_state(slot, &power_status);
    500	if (ret)
    501		return ret;
    502
    503	if (power_status == OPAL_PCI_SLOT_POWER_ON)
    504		goto scan;
    505
    506	/* Power is off, turn it on and then scan the slot */
    507	ret = pnv_php_set_slot_power_state(slot, OPAL_PCI_SLOT_POWER_ON);
    508	if (ret)
    509		return ret;
    510
    511scan:
    512	if (presence == OPAL_PCI_SLOT_PRESENT) {
    513		if (rescan) {
    514			pci_lock_rescan_remove();
    515			pci_hp_add_devices(php_slot->bus);
    516			pci_unlock_rescan_remove();
    517		}
    518
    519		/* Rescan for child hotpluggable slots */
    520		php_slot->state = PNV_PHP_STATE_POPULATED;
    521		if (rescan)
    522			pnv_php_register(php_slot->dn);
    523	} else {
    524		php_slot->state = PNV_PHP_STATE_POPULATED;
    525	}
    526
    527	return 0;
    528}
    529
    530static int pnv_php_reset_slot(struct hotplug_slot *slot, bool probe)
    531{
    532	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    533	struct pci_dev *bridge = php_slot->pdev;
    534	uint16_t sts;
    535
    536	/*
    537	 * The CAPI folks want pnv_php to drive OpenCAPI slots
    538	 * which don't have a bridge. Only claim to support
    539	 * reset_slot() if we have a bridge device (for now...)
    540	 */
    541	if (probe)
    542		return !bridge;
    543
    544	/* mask our interrupt while resetting the bridge */
    545	if (php_slot->irq > 0)
    546		disable_irq(php_slot->irq);
    547
    548	pci_bridge_secondary_bus_reset(bridge);
    549
    550	/* clear any state changes that happened due to the reset */
    551	pcie_capability_read_word(php_slot->pdev, PCI_EXP_SLTSTA, &sts);
    552	sts &= (PCI_EXP_SLTSTA_PDC | PCI_EXP_SLTSTA_DLLSC);
    553	pcie_capability_write_word(php_slot->pdev, PCI_EXP_SLTSTA, sts);
    554
    555	if (php_slot->irq > 0)
    556		enable_irq(php_slot->irq);
    557
    558	return 0;
    559}
    560
    561static int pnv_php_enable_slot(struct hotplug_slot *slot)
    562{
    563	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    564
    565	return pnv_php_enable(php_slot, true);
    566}
    567
    568static int pnv_php_disable_slot(struct hotplug_slot *slot)
    569{
    570	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
    571	int ret;
    572
    573	/*
    574	 * Allow to disable a slot already in the registered state to
    575	 * cover cases where the slot couldn't be enabled and never
    576	 * reached the populated state
    577	 */
    578	if (php_slot->state != PNV_PHP_STATE_POPULATED &&
    579	    php_slot->state != PNV_PHP_STATE_REGISTERED)
    580		return 0;
    581
    582	/* Remove all devices behind the slot */
    583	pci_lock_rescan_remove();
    584	pci_hp_remove_devices(php_slot->bus);
    585	pci_unlock_rescan_remove();
    586
    587	/* Detach the child hotpluggable slots */
    588	pnv_php_unregister(php_slot->dn);
    589
    590	/* Notify firmware and remove device nodes */
    591	ret = pnv_php_set_slot_power_state(slot, OPAL_PCI_SLOT_POWER_OFF);
    592
    593	php_slot->state = PNV_PHP_STATE_REGISTERED;
    594	return ret;
    595}
    596
    597static const struct hotplug_slot_ops php_slot_ops = {
    598	.get_power_status	= pnv_php_get_power_state,
    599	.get_adapter_status	= pnv_php_get_adapter_state,
    600	.get_attention_status	= pnv_php_get_attention_state,
    601	.set_attention_status	= pnv_php_set_attention_state,
    602	.enable_slot		= pnv_php_enable_slot,
    603	.disable_slot		= pnv_php_disable_slot,
    604	.reset_slot		= pnv_php_reset_slot,
    605};
    606
    607static void pnv_php_release(struct pnv_php_slot *php_slot)
    608{
    609	unsigned long flags;
    610
    611	/* Remove from global or child list */
    612	spin_lock_irqsave(&pnv_php_lock, flags);
    613	list_del(&php_slot->link);
    614	spin_unlock_irqrestore(&pnv_php_lock, flags);
    615
    616	/* Detach from parent */
    617	pnv_php_put_slot(php_slot);
    618	pnv_php_put_slot(php_slot->parent);
    619}
    620
    621static struct pnv_php_slot *pnv_php_alloc_slot(struct device_node *dn)
    622{
    623	struct pnv_php_slot *php_slot;
    624	struct pci_bus *bus;
    625	const char *label;
    626	uint64_t id;
    627	int ret;
    628
    629	ret = of_property_read_string(dn, "ibm,slot-label", &label);
    630	if (ret)
    631		return NULL;
    632
    633	if (pnv_pci_get_slot_id(dn, &id))
    634		return NULL;
    635
    636	bus = pci_find_bus_by_node(dn);
    637	if (!bus)
    638		return NULL;
    639
    640	php_slot = kzalloc(sizeof(*php_slot), GFP_KERNEL);
    641	if (!php_slot)
    642		return NULL;
    643
    644	php_slot->name = kstrdup(label, GFP_KERNEL);
    645	if (!php_slot->name) {
    646		kfree(php_slot);
    647		return NULL;
    648	}
    649
    650	if (dn->child && PCI_DN(dn->child))
    651		php_slot->slot_no = PCI_SLOT(PCI_DN(dn->child)->devfn);
    652	else
    653		php_slot->slot_no = -1;   /* Placeholder slot */
    654
    655	kref_init(&php_slot->kref);
    656	php_slot->state	                = PNV_PHP_STATE_INITIALIZED;
    657	php_slot->dn	                = dn;
    658	php_slot->pdev	                = bus->self;
    659	php_slot->bus	                = bus;
    660	php_slot->id	                = id;
    661	php_slot->power_state_check     = false;
    662	php_slot->slot.ops              = &php_slot_ops;
    663
    664	INIT_LIST_HEAD(&php_slot->children);
    665	INIT_LIST_HEAD(&php_slot->link);
    666
    667	return php_slot;
    668}
    669
    670static int pnv_php_register_slot(struct pnv_php_slot *php_slot)
    671{
    672	struct pnv_php_slot *parent;
    673	struct device_node *dn = php_slot->dn;
    674	unsigned long flags;
    675	int ret;
    676
    677	/* Check if the slot is registered or not */
    678	parent = pnv_php_find_slot(php_slot->dn);
    679	if (parent) {
    680		pnv_php_put_slot(parent);
    681		return -EEXIST;
    682	}
    683
    684	/* Register PCI slot */
    685	ret = pci_hp_register(&php_slot->slot, php_slot->bus,
    686			      php_slot->slot_no, php_slot->name);
    687	if (ret) {
    688		SLOT_WARN(php_slot, "Error %d registering slot\n", ret);
    689		return ret;
    690	}
    691
    692	/* Attach to the parent's child list or global list */
    693	while ((dn = of_get_parent(dn))) {
    694		if (!PCI_DN(dn)) {
    695			of_node_put(dn);
    696			break;
    697		}
    698
    699		parent = pnv_php_find_slot(dn);
    700		if (parent) {
    701			of_node_put(dn);
    702			break;
    703		}
    704
    705		of_node_put(dn);
    706	}
    707
    708	spin_lock_irqsave(&pnv_php_lock, flags);
    709	php_slot->parent = parent;
    710	if (parent)
    711		list_add_tail(&php_slot->link, &parent->children);
    712	else
    713		list_add_tail(&php_slot->link, &pnv_php_slot_list);
    714	spin_unlock_irqrestore(&pnv_php_lock, flags);
    715
    716	php_slot->state = PNV_PHP_STATE_REGISTERED;
    717	return 0;
    718}
    719
    720static int pnv_php_enable_msix(struct pnv_php_slot *php_slot)
    721{
    722	struct pci_dev *pdev = php_slot->pdev;
    723	struct msix_entry entry;
    724	int nr_entries, ret;
    725	u16 pcie_flag;
    726
    727	/* Get total number of MSIx entries */
    728	nr_entries = pci_msix_vec_count(pdev);
    729	if (nr_entries < 0)
    730		return nr_entries;
    731
    732	/* Check hotplug MSIx entry is in range */
    733	pcie_capability_read_word(pdev, PCI_EXP_FLAGS, &pcie_flag);
    734	entry.entry = (pcie_flag & PCI_EXP_FLAGS_IRQ) >> 9;
    735	if (entry.entry >= nr_entries)
    736		return -ERANGE;
    737
    738	/* Enable MSIx */
    739	ret = pci_enable_msix_exact(pdev, &entry, 1);
    740	if (ret) {
    741		SLOT_WARN(php_slot, "Error %d enabling MSIx\n", ret);
    742		return ret;
    743	}
    744
    745	return entry.vector;
    746}
    747
    748static void pnv_php_event_handler(struct work_struct *work)
    749{
    750	struct pnv_php_event *event =
    751		container_of(work, struct pnv_php_event, work);
    752	struct pnv_php_slot *php_slot = event->php_slot;
    753
    754	if (event->added)
    755		pnv_php_enable_slot(&php_slot->slot);
    756	else
    757		pnv_php_disable_slot(&php_slot->slot);
    758
    759	kfree(event);
    760}
    761
    762static irqreturn_t pnv_php_interrupt(int irq, void *data)
    763{
    764	struct pnv_php_slot *php_slot = data;
    765	struct pci_dev *pchild, *pdev = php_slot->pdev;
    766	struct eeh_dev *edev;
    767	struct eeh_pe *pe;
    768	struct pnv_php_event *event;
    769	u16 sts, lsts;
    770	u8 presence;
    771	bool added;
    772	unsigned long flags;
    773	int ret;
    774
    775	pcie_capability_read_word(pdev, PCI_EXP_SLTSTA, &sts);
    776	sts &= (PCI_EXP_SLTSTA_PDC | PCI_EXP_SLTSTA_DLLSC);
    777	pcie_capability_write_word(pdev, PCI_EXP_SLTSTA, sts);
    778
    779	pci_dbg(pdev, "PCI slot [%s]: HP int! DLAct: %d, PresDet: %d\n",
    780			php_slot->name,
    781			!!(sts & PCI_EXP_SLTSTA_DLLSC),
    782			!!(sts & PCI_EXP_SLTSTA_PDC));
    783
    784	if (sts & PCI_EXP_SLTSTA_DLLSC) {
    785		pcie_capability_read_word(pdev, PCI_EXP_LNKSTA, &lsts);
    786		added = !!(lsts & PCI_EXP_LNKSTA_DLLLA);
    787	} else if (!(php_slot->flags & PNV_PHP_FLAG_BROKEN_PDC) &&
    788		   (sts & PCI_EXP_SLTSTA_PDC)) {
    789		ret = pnv_pci_get_presence_state(php_slot->id, &presence);
    790		if (ret) {
    791			SLOT_WARN(php_slot,
    792				  "PCI slot [%s] error %d getting presence (0x%04x), to retry the operation.\n",
    793				  php_slot->name, ret, sts);
    794			return IRQ_HANDLED;
    795		}
    796
    797		added = !!(presence == OPAL_PCI_SLOT_PRESENT);
    798	} else {
    799		pci_dbg(pdev, "PCI slot [%s]: Spurious IRQ?\n", php_slot->name);
    800		return IRQ_NONE;
    801	}
    802
    803	/* Freeze the removed PE to avoid unexpected error reporting */
    804	if (!added) {
    805		pchild = list_first_entry_or_null(&php_slot->bus->devices,
    806						  struct pci_dev, bus_list);
    807		edev = pchild ? pci_dev_to_eeh_dev(pchild) : NULL;
    808		pe = edev ? edev->pe : NULL;
    809		if (pe) {
    810			eeh_serialize_lock(&flags);
    811			eeh_pe_mark_isolated(pe);
    812			eeh_serialize_unlock(flags);
    813			eeh_pe_set_option(pe, EEH_OPT_FREEZE_PE);
    814		}
    815	}
    816
    817	/*
    818	 * The PE is left in frozen state if the event is missed. It's
    819	 * fine as the PCI devices (PE) aren't functional any more.
    820	 */
    821	event = kzalloc(sizeof(*event), GFP_ATOMIC);
    822	if (!event) {
    823		SLOT_WARN(php_slot,
    824			  "PCI slot [%s] missed hotplug event 0x%04x\n",
    825			  php_slot->name, sts);
    826		return IRQ_HANDLED;
    827	}
    828
    829	pci_info(pdev, "PCI slot [%s] %s (IRQ: %d)\n",
    830		 php_slot->name, added ? "added" : "removed", irq);
    831	INIT_WORK(&event->work, pnv_php_event_handler);
    832	event->added = added;
    833	event->php_slot = php_slot;
    834	queue_work(php_slot->wq, &event->work);
    835
    836	return IRQ_HANDLED;
    837}
    838
    839static void pnv_php_init_irq(struct pnv_php_slot *php_slot, int irq)
    840{
    841	struct pci_dev *pdev = php_slot->pdev;
    842	u32 broken_pdc = 0;
    843	u16 sts, ctrl;
    844	int ret;
    845
    846	/* Allocate workqueue */
    847	php_slot->wq = alloc_workqueue("pciehp-%s", 0, 0, php_slot->name);
    848	if (!php_slot->wq) {
    849		SLOT_WARN(php_slot, "Cannot alloc workqueue\n");
    850		pnv_php_disable_irq(php_slot, true);
    851		return;
    852	}
    853
    854	/* Check PDC (Presence Detection Change) is broken or not */
    855	ret = of_property_read_u32(php_slot->dn, "ibm,slot-broken-pdc",
    856				   &broken_pdc);
    857	if (!ret && broken_pdc)
    858		php_slot->flags |= PNV_PHP_FLAG_BROKEN_PDC;
    859
    860	/* Clear pending interrupts */
    861	pcie_capability_read_word(pdev, PCI_EXP_SLTSTA, &sts);
    862	if (php_slot->flags & PNV_PHP_FLAG_BROKEN_PDC)
    863		sts |= PCI_EXP_SLTSTA_DLLSC;
    864	else
    865		sts |= (PCI_EXP_SLTSTA_PDC | PCI_EXP_SLTSTA_DLLSC);
    866	pcie_capability_write_word(pdev, PCI_EXP_SLTSTA, sts);
    867
    868	/* Request the interrupt */
    869	ret = request_irq(irq, pnv_php_interrupt, IRQF_SHARED,
    870			  php_slot->name, php_slot);
    871	if (ret) {
    872		pnv_php_disable_irq(php_slot, true);
    873		SLOT_WARN(php_slot, "Error %d enabling IRQ %d\n", ret, irq);
    874		return;
    875	}
    876
    877	/* Enable the interrupts */
    878	pcie_capability_read_word(pdev, PCI_EXP_SLTCTL, &ctrl);
    879	if (php_slot->flags & PNV_PHP_FLAG_BROKEN_PDC) {
    880		ctrl &= ~PCI_EXP_SLTCTL_PDCE;
    881		ctrl |= (PCI_EXP_SLTCTL_HPIE |
    882			 PCI_EXP_SLTCTL_DLLSCE);
    883	} else {
    884		ctrl |= (PCI_EXP_SLTCTL_HPIE |
    885			 PCI_EXP_SLTCTL_PDCE |
    886			 PCI_EXP_SLTCTL_DLLSCE);
    887	}
    888	pcie_capability_write_word(pdev, PCI_EXP_SLTCTL, ctrl);
    889
    890	/* The interrupt is initialized successfully when @irq is valid */
    891	php_slot->irq = irq;
    892}
    893
    894static void pnv_php_enable_irq(struct pnv_php_slot *php_slot)
    895{
    896	struct pci_dev *pdev = php_slot->pdev;
    897	int irq, ret;
    898
    899	/*
    900	 * The MSI/MSIx interrupt might have been occupied by other
    901	 * drivers. Don't populate the surprise hotplug capability
    902	 * in that case.
    903	 */
    904	if (pci_dev_msi_enabled(pdev))
    905		return;
    906
    907	ret = pci_enable_device(pdev);
    908	if (ret) {
    909		SLOT_WARN(php_slot, "Error %d enabling device\n", ret);
    910		return;
    911	}
    912
    913	pci_set_master(pdev);
    914
    915	/* Enable MSIx interrupt */
    916	irq = pnv_php_enable_msix(php_slot);
    917	if (irq > 0) {
    918		pnv_php_init_irq(php_slot, irq);
    919		return;
    920	}
    921
    922	/*
    923	 * Use MSI if MSIx doesn't work. Fail back to legacy INTx
    924	 * if MSI doesn't work either
    925	 */
    926	ret = pci_enable_msi(pdev);
    927	if (!ret || pdev->irq) {
    928		irq = pdev->irq;
    929		pnv_php_init_irq(php_slot, irq);
    930	}
    931}
    932
    933static int pnv_php_register_one(struct device_node *dn)
    934{
    935	struct pnv_php_slot *php_slot;
    936	u32 prop32;
    937	int ret;
    938
    939	/* Check if it's hotpluggable slot */
    940	ret = of_property_read_u32(dn, "ibm,slot-pluggable", &prop32);
    941	if (ret || !prop32)
    942		return -ENXIO;
    943
    944	ret = of_property_read_u32(dn, "ibm,reset-by-firmware", &prop32);
    945	if (ret || !prop32)
    946		return -ENXIO;
    947
    948	php_slot = pnv_php_alloc_slot(dn);
    949	if (!php_slot)
    950		return -ENODEV;
    951
    952	ret = pnv_php_register_slot(php_slot);
    953	if (ret)
    954		goto free_slot;
    955
    956	ret = pnv_php_enable(php_slot, false);
    957	if (ret)
    958		goto unregister_slot;
    959
    960	/* Enable interrupt if the slot supports surprise hotplug */
    961	ret = of_property_read_u32(dn, "ibm,slot-surprise-pluggable", &prop32);
    962	if (!ret && prop32)
    963		pnv_php_enable_irq(php_slot);
    964
    965	return 0;
    966
    967unregister_slot:
    968	pnv_php_unregister_one(php_slot->dn);
    969free_slot:
    970	pnv_php_put_slot(php_slot);
    971	return ret;
    972}
    973
    974static void pnv_php_register(struct device_node *dn)
    975{
    976	struct device_node *child;
    977
    978	/*
    979	 * The parent slots should be registered before their
    980	 * child slots.
    981	 */
    982	for_each_child_of_node(dn, child) {
    983		pnv_php_register_one(child);
    984		pnv_php_register(child);
    985	}
    986}
    987
    988static void pnv_php_unregister_one(struct device_node *dn)
    989{
    990	struct pnv_php_slot *php_slot;
    991
    992	php_slot = pnv_php_find_slot(dn);
    993	if (!php_slot)
    994		return;
    995
    996	php_slot->state = PNV_PHP_STATE_OFFLINE;
    997	pci_hp_deregister(&php_slot->slot);
    998	pnv_php_release(php_slot);
    999	pnv_php_put_slot(php_slot);
   1000}
   1001
   1002static void pnv_php_unregister(struct device_node *dn)
   1003{
   1004	struct device_node *child;
   1005
   1006	/* The child slots should go before their parent slots */
   1007	for_each_child_of_node(dn, child) {
   1008		pnv_php_unregister(child);
   1009		pnv_php_unregister_one(child);
   1010	}
   1011}
   1012
   1013static int __init pnv_php_init(void)
   1014{
   1015	struct device_node *dn;
   1016
   1017	pr_info(DRIVER_DESC " version: " DRIVER_VERSION "\n");
   1018	for_each_compatible_node(dn, NULL, "ibm,ioda2-phb")
   1019		pnv_php_register(dn);
   1020
   1021	for_each_compatible_node(dn, NULL, "ibm,ioda3-phb")
   1022		pnv_php_register(dn);
   1023
   1024	for_each_compatible_node(dn, NULL, "ibm,ioda2-npu2-opencapi-phb")
   1025		pnv_php_register_one(dn); /* slot directly under the PHB */
   1026	return 0;
   1027}
   1028
   1029static void __exit pnv_php_exit(void)
   1030{
   1031	struct device_node *dn;
   1032
   1033	for_each_compatible_node(dn, NULL, "ibm,ioda2-phb")
   1034		pnv_php_unregister(dn);
   1035
   1036	for_each_compatible_node(dn, NULL, "ibm,ioda3-phb")
   1037		pnv_php_unregister(dn);
   1038
   1039	for_each_compatible_node(dn, NULL, "ibm,ioda2-npu2-opencapi-phb")
   1040		pnv_php_unregister_one(dn); /* slot directly under the PHB */
   1041}
   1042
   1043module_init(pnv_php_init);
   1044module_exit(pnv_php_exit);
   1045
   1046MODULE_VERSION(DRIVER_VERSION);
   1047MODULE_LICENSE("GPL v2");
   1048MODULE_AUTHOR(DRIVER_AUTHOR);
   1049MODULE_DESCRIPTION(DRIVER_DESC);