Linux Audio

Check our new training course

Loading...
Note: File does not exist in v3.1.
   1// SPDX-License-Identifier: GPL-2.0+
   2/*
   3 * PCI Hotplug Driver for PowerPC PowerNV platform.
   4 *
   5 * Copyright Gavin Shan, IBM Corporation 2016.
   6 */
   7
   8#include <linux/libfdt.h>
   9#include <linux/module.h>
  10#include <linux/pci.h>
  11#include <linux/pci_hotplug.h>
  12#include <linux/of_fdt.h>
  13
  14#include <asm/opal.h>
  15#include <asm/pnv-pci.h>
  16#include <asm/ppc-pci.h>
  17
/* Module identification strings, consumed by the MODULE_*() macros below. */
#define DRIVER_VERSION	"0.1"
#define DRIVER_AUTHOR	"Gavin Shan, IBM Corporation"
#define DRIVER_DESC	"PowerPC PowerNV PCI Hotplug Driver"

/*
 * Emit a warning on behalf of slot @sl. The message goes through
 * pci_warn() on the slot's PCI device when the slot has one, and through
 * dev_warn() on the slot's bus device otherwise.
 */
#define SLOT_WARN(sl, x...) \
	((sl)->pdev ? pci_warn((sl)->pdev, x) : dev_warn(&(sl)->bus->dev, x))
  24
/*
 * A single hotplug event, allocated by the interrupt handler and consumed
 * (then freed) by pnv_php_event_handler() on the slot's workqueue.
 */
struct pnv_php_event {
	bool			added;		/* true: enable the slot, false: disable it */
	struct pnv_php_slot	*php_slot;	/* slot the event applies to */
	struct work_struct	work;		/* work item queued on php_slot->wq */
};
  30
/*
 * Slots that have no parent slot are linked on pnv_php_slot_list; slots
 * with a parent are linked on the parent's ->children list instead.
 * pnv_php_lock is held around the list updates and lookups in this file.
 */
static LIST_HEAD(pnv_php_slot_list);
static DEFINE_SPINLOCK(pnv_php_lock);

/* Forward declarations for functions used before their definition. */
static void pnv_php_register(struct device_node *dn);
static void pnv_php_unregister_one(struct device_node *dn);
static void pnv_php_unregister(struct device_node *dn);
  37
  38static void pnv_php_disable_irq(struct pnv_php_slot *php_slot,
  39				bool disable_device)
  40{
  41	struct pci_dev *pdev = php_slot->pdev;
  42	int irq = php_slot->irq;
  43	u16 ctrl;
  44
  45	if (php_slot->irq > 0) {
  46		pcie_capability_read_word(pdev, PCI_EXP_SLTCTL, &ctrl);
  47		ctrl &= ~(PCI_EXP_SLTCTL_HPIE |
  48			  PCI_EXP_SLTCTL_PDCE |
  49			  PCI_EXP_SLTCTL_DLLSCE);
  50		pcie_capability_write_word(pdev, PCI_EXP_SLTCTL, ctrl);
  51
  52		free_irq(php_slot->irq, php_slot);
  53		php_slot->irq = 0;
  54	}
  55
  56	if (php_slot->wq) {
  57		destroy_workqueue(php_slot->wq);
  58		php_slot->wq = NULL;
  59	}
  60
  61	if (disable_device || irq > 0) {
  62		if (pdev->msix_enabled)
  63			pci_disable_msix(pdev);
  64		else if (pdev->msi_enabled)
  65			pci_disable_msi(pdev);
  66
  67		pci_disable_device(pdev);
  68	}
  69}
  70
  71static void pnv_php_free_slot(struct kref *kref)
  72{
  73	struct pnv_php_slot *php_slot = container_of(kref,
  74					struct pnv_php_slot, kref);
  75
  76	WARN_ON(!list_empty(&php_slot->children));
  77	pnv_php_disable_irq(php_slot, false);
  78	kfree(php_slot->name);
  79	kfree(php_slot);
  80}
  81
  82static inline void pnv_php_put_slot(struct pnv_php_slot *php_slot)
  83{
  84
  85	if (!php_slot)
  86		return;
  87
  88	kref_put(&php_slot->kref, pnv_php_free_slot);
  89}
  90
  91static struct pnv_php_slot *pnv_php_match(struct device_node *dn,
  92					  struct pnv_php_slot *php_slot)
  93{
  94	struct pnv_php_slot *target, *tmp;
  95
  96	if (php_slot->dn == dn) {
  97		kref_get(&php_slot->kref);
  98		return php_slot;
  99	}
 100
 101	list_for_each_entry(tmp, &php_slot->children, link) {
 102		target = pnv_php_match(dn, tmp);
 103		if (target)
 104			return target;
 105	}
 106
 107	return NULL;
 108}
 109
 110struct pnv_php_slot *pnv_php_find_slot(struct device_node *dn)
 111{
 112	struct pnv_php_slot *php_slot, *tmp;
 113	unsigned long flags;
 114
 115	spin_lock_irqsave(&pnv_php_lock, flags);
 116	list_for_each_entry(tmp, &pnv_php_slot_list, link) {
 117		php_slot = pnv_php_match(dn, tmp);
 118		if (php_slot) {
 119			spin_unlock_irqrestore(&pnv_php_lock, flags);
 120			return php_slot;
 121		}
 122	}
 123	spin_unlock_irqrestore(&pnv_php_lock, flags);
 124
 125	return NULL;
 126}
 127EXPORT_SYMBOL_GPL(pnv_php_find_slot);
 128
 129/*
 130 * Remove pdn for all children of the indicated device node.
 131 * The function should remove pdn in a depth-first manner.
 132 */
 133static void pnv_php_rmv_pdns(struct device_node *dn)
 134{
 135	struct device_node *child;
 136
 137	for_each_child_of_node(dn, child) {
 138		pnv_php_rmv_pdns(child);
 139
 140		pci_remove_device_node_info(child);
 141	}
 142}
 143
 144/*
 145 * Detach all child nodes of the indicated device nodes. The
 146 * function should handle device nodes in depth-first manner.
 147 *
 148 * We should not invoke of_node_release() as the memory for
 149 * individual device node is part of large memory block. The
 150 * large block is allocated from memblock (system bootup) or
 151 * kmalloc() when unflattening the device tree by OF changeset.
 152 * We can not free the large block allocated from memblock. For
 153 * later case, it should be released at once.
 154 */
 155static void pnv_php_detach_device_nodes(struct device_node *parent)
 156{
 157	struct device_node *dn;
 158
 159	for_each_child_of_node(parent, dn) {
 160		pnv_php_detach_device_nodes(dn);
 161
 162		of_node_put(dn);
 163		of_detach_node(dn);
 164	}
 165}
 166
 167static void pnv_php_rmv_devtree(struct pnv_php_slot *php_slot)
 168{
 169	pnv_php_rmv_pdns(php_slot->dn);
 170
 171	/*
 172	 * Decrease the refcount if the device nodes were created
 173	 * through OF changeset before detaching them.
 174	 */
 175	if (php_slot->fdt)
 176		of_changeset_destroy(&php_slot->ocs);
 177	pnv_php_detach_device_nodes(php_slot->dn);
 178
 179	if (php_slot->fdt) {
 180		kfree(php_slot->dt);
 181		kfree(php_slot->fdt);
 182		php_slot->dt        = NULL;
 183		php_slot->dn->child = NULL;
 184		php_slot->fdt       = NULL;
 185	}
 186}
 187
 188/*
 189 * As the nodes in OF changeset are applied in reverse order, we
 190 * need revert the nodes in advance so that we have correct node
 191 * order after the changeset is applied.
 192 */
 193static void pnv_php_reverse_nodes(struct device_node *parent)
 194{
 195	struct device_node *child, *next;
 196
 197	/* In-depth first */
 198	for_each_child_of_node(parent, child)
 199		pnv_php_reverse_nodes(child);
 200
 201	/* Reverse the nodes in the child list */
 202	child = parent->child;
 203	parent->child = NULL;
 204	while (child) {
 205		next = child->sibling;
 206
 207		child->sibling = parent->child;
 208		parent->child = child;
 209		child = next;
 210	}
 211}
 212
 213static int pnv_php_populate_changeset(struct of_changeset *ocs,
 214				      struct device_node *dn)
 215{
 216	struct device_node *child;
 217	int ret = 0;
 218
 219	for_each_child_of_node(dn, child) {
 220		ret = of_changeset_attach_node(ocs, child);
 221		if (ret) {
 222			of_node_put(child);
 223			break;
 224		}
 225
 226		ret = pnv_php_populate_changeset(ocs, child);
 227		if (ret) {
 228			of_node_put(child);
 229			break;
 230		}
 231	}
 232
 233	return ret;
 234}
 235
 236static void *pnv_php_add_one_pdn(struct device_node *dn, void *data)
 237{
 238	struct pci_controller *hose = (struct pci_controller *)data;
 239	struct pci_dn *pdn;
 240
 241	pdn = pci_add_device_node_info(hose, dn);
 242	if (!pdn)
 243		return ERR_PTR(-ENOMEM);
 244
 245	return NULL;
 246}
 247
 248static void pnv_php_add_pdns(struct pnv_php_slot *slot)
 249{
 250	struct pci_controller *hose = pci_bus_to_host(slot->bus);
 251
 252	pci_traverse_device_nodes(slot->dn, pnv_php_add_one_pdn, hose);
 253}
 254
 255static int pnv_php_add_devtree(struct pnv_php_slot *php_slot)
 256{
 257	void *fdt, *fdt1, *dt;
 258	int ret;
 259
 260	/* We don't know the FDT blob size. We try to get it through
 261	 * maximal memory chunk and then copy it to another chunk that
 262	 * fits the real size.
 263	 */
 264	fdt1 = kzalloc(0x10000, GFP_KERNEL);
 265	if (!fdt1) {
 266		ret = -ENOMEM;
 267		goto out;
 268	}
 269
 270	ret = pnv_pci_get_device_tree(php_slot->dn->phandle, fdt1, 0x10000);
 271	if (ret) {
 272		SLOT_WARN(php_slot, "Error %d getting FDT blob\n", ret);
 273		goto free_fdt1;
 274	}
 275
 276	fdt = kmemdup(fdt1, fdt_totalsize(fdt1), GFP_KERNEL);
 277	if (!fdt) {
 278		ret = -ENOMEM;
 279		goto free_fdt1;
 280	}
 281
 282	/* Unflatten device tree blob */
 283	dt = of_fdt_unflatten_tree(fdt, php_slot->dn, NULL);
 284	if (!dt) {
 285		ret = -EINVAL;
 286		SLOT_WARN(php_slot, "Cannot unflatten FDT\n");
 287		goto free_fdt;
 288	}
 289
 290	/* Initialize and apply the changeset */
 291	of_changeset_init(&php_slot->ocs);
 292	pnv_php_reverse_nodes(php_slot->dn);
 293	ret = pnv_php_populate_changeset(&php_slot->ocs, php_slot->dn);
 294	if (ret) {
 295		pnv_php_reverse_nodes(php_slot->dn);
 296		SLOT_WARN(php_slot, "Error %d populating changeset\n",
 297			  ret);
 298		goto free_dt;
 299	}
 300
 301	php_slot->dn->child = NULL;
 302	ret = of_changeset_apply(&php_slot->ocs);
 303	if (ret) {
 304		SLOT_WARN(php_slot, "Error %d applying changeset\n", ret);
 305		goto destroy_changeset;
 306	}
 307
 308	/* Add device node firmware data */
 309	pnv_php_add_pdns(php_slot);
 310	php_slot->fdt = fdt;
 311	php_slot->dt  = dt;
 312	kfree(fdt1);
 313	goto out;
 314
 315destroy_changeset:
 316	of_changeset_destroy(&php_slot->ocs);
 317free_dt:
 318	kfree(dt);
 319	php_slot->dn->child = NULL;
 320free_fdt:
 321	kfree(fdt);
 322free_fdt1:
 323	kfree(fdt1);
 324out:
 325	return ret;
 326}
 327
 328static inline struct pnv_php_slot *to_pnv_php_slot(struct hotplug_slot *slot)
 329{
 330	return container_of(slot, struct pnv_php_slot, slot);
 331}
 332
 333int pnv_php_set_slot_power_state(struct hotplug_slot *slot,
 334				 uint8_t state)
 335{
 336	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 337	struct opal_msg msg;
 338	int ret;
 339
 340	ret = pnv_pci_set_power_state(php_slot->id, state, &msg);
 341	if (ret > 0) {
 342		if (be64_to_cpu(msg.params[1]) != php_slot->dn->phandle	||
 343		    be64_to_cpu(msg.params[2]) != state) {
 344			SLOT_WARN(php_slot, "Wrong msg (%lld, %lld, %lld)\n",
 345				  be64_to_cpu(msg.params[1]),
 346				  be64_to_cpu(msg.params[2]),
 347				  be64_to_cpu(msg.params[3]));
 348			return -ENOMSG;
 349		}
 350		if (be64_to_cpu(msg.params[3]) != OPAL_SUCCESS) {
 351			ret = -ENODEV;
 352			goto error;
 353		}
 354	} else if (ret < 0) {
 355		goto error;
 356	}
 357
 358	if (state == OPAL_PCI_SLOT_POWER_OFF || state == OPAL_PCI_SLOT_OFFLINE)
 359		pnv_php_rmv_devtree(php_slot);
 360	else
 361		ret = pnv_php_add_devtree(php_slot);
 362
 363	return ret;
 364
 365error:
 366	SLOT_WARN(php_slot, "Error %d powering %s\n",
 367		  ret, (state == OPAL_PCI_SLOT_POWER_ON) ? "on" : "off");
 368	return ret;
 369}
 370EXPORT_SYMBOL_GPL(pnv_php_set_slot_power_state);
 371
 372static int pnv_php_get_power_state(struct hotplug_slot *slot, u8 *state)
 373{
 374	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 375	uint8_t power_state = OPAL_PCI_SLOT_POWER_ON;
 376	int ret;
 377
 378	/*
 379	 * Retrieve power status from firmware. If we fail
 380	 * getting that, the power status fails back to
 381	 * be on.
 382	 */
 383	ret = pnv_pci_get_power_state(php_slot->id, &power_state);
 384	if (ret) {
 385		SLOT_WARN(php_slot, "Error %d getting power status\n",
 386			  ret);
 387	} else {
 388		*state = power_state;
 389	}
 390
 391	return 0;
 392}
 393
 394static int pnv_php_get_adapter_state(struct hotplug_slot *slot, u8 *state)
 395{
 396	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 397	uint8_t presence = OPAL_PCI_SLOT_EMPTY;
 398	int ret;
 399
 400	/*
 401	 * Retrieve presence status from firmware. If we can't
 402	 * get that, it will fail back to be empty.
 403	 */
 404	ret = pnv_pci_get_presence_state(php_slot->id, &presence);
 405	if (ret >= 0) {
 406		*state = presence;
 407		ret = 0;
 408	} else {
 409		SLOT_WARN(php_slot, "Error %d getting presence\n", ret);
 410	}
 411
 412	return ret;
 413}
 414
 415static int pnv_php_get_attention_state(struct hotplug_slot *slot, u8 *state)
 416{
 417	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 418
 419	*state = php_slot->attention_state;
 420	return 0;
 421}
 422
 423static int pnv_php_set_attention_state(struct hotplug_slot *slot, u8 state)
 424{
 425	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 426	struct pci_dev *bridge = php_slot->pdev;
 427	u16 new, mask;
 428
 429	php_slot->attention_state = state;
 430	if (!bridge)
 431		return 0;
 432
 433	mask = PCI_EXP_SLTCTL_AIC;
 434
 435	if (state)
 436		new = PCI_EXP_SLTCTL_ATTN_IND_ON;
 437	else
 438		new = PCI_EXP_SLTCTL_ATTN_IND_OFF;
 439
 440	pcie_capability_clear_and_set_word(bridge, PCI_EXP_SLTCTL, mask, new);
 441
 442	return 0;
 443}
 444
 445static int pnv_php_enable(struct pnv_php_slot *php_slot, bool rescan)
 446{
 447	struct hotplug_slot *slot = &php_slot->slot;
 448	uint8_t presence = OPAL_PCI_SLOT_EMPTY;
 449	uint8_t power_status = OPAL_PCI_SLOT_POWER_ON;
 450	int ret;
 451
 452	/* Check if the slot has been configured */
 453	if (php_slot->state != PNV_PHP_STATE_REGISTERED)
 454		return 0;
 455
 456	/* Retrieve slot presence status */
 457	ret = pnv_php_get_adapter_state(slot, &presence);
 458	if (ret)
 459		return ret;
 460
 461	/*
 462	 * Proceed if there have nothing behind the slot. However,
 463	 * we should leave the slot in registered state at the
 464	 * beginning. Otherwise, the PCI devices inserted afterwards
 465	 * won't be probed and populated.
 466	 */
 467	if (presence == OPAL_PCI_SLOT_EMPTY) {
 468		if (!php_slot->power_state_check) {
 469			php_slot->power_state_check = true;
 470
 471			return 0;
 472		}
 473
 474		goto scan;
 475	}
 476
 477	/*
 478	 * If the power supply to the slot is off, we can't detect
 479	 * adapter presence state. That means we have to turn the
 480	 * slot on before going to probe slot's presence state.
 481	 *
 482	 * On the first time, we don't change the power status to
 483	 * boost system boot with assumption that the firmware
 484	 * supplies consistent slot power status: empty slot always
 485	 * has its power off and non-empty slot has its power on.
 486	 */
 487	if (!php_slot->power_state_check) {
 488		php_slot->power_state_check = true;
 489
 490		ret = pnv_php_get_power_state(slot, &power_status);
 491		if (ret)
 492			return ret;
 493
 494		if (power_status != OPAL_PCI_SLOT_POWER_ON)
 495			return 0;
 496	}
 497
 498	/* Check the power status. Scan the slot if it is already on */
 499	ret = pnv_php_get_power_state(slot, &power_status);
 500	if (ret)
 501		return ret;
 502
 503	if (power_status == OPAL_PCI_SLOT_POWER_ON)
 504		goto scan;
 505
 506	/* Power is off, turn it on and then scan the slot */
 507	ret = pnv_php_set_slot_power_state(slot, OPAL_PCI_SLOT_POWER_ON);
 508	if (ret)
 509		return ret;
 510
 511scan:
 512	if (presence == OPAL_PCI_SLOT_PRESENT) {
 513		if (rescan) {
 514			pci_lock_rescan_remove();
 515			pci_hp_add_devices(php_slot->bus);
 516			pci_unlock_rescan_remove();
 517		}
 518
 519		/* Rescan for child hotpluggable slots */
 520		php_slot->state = PNV_PHP_STATE_POPULATED;
 521		if (rescan)
 522			pnv_php_register(php_slot->dn);
 523	} else {
 524		php_slot->state = PNV_PHP_STATE_POPULATED;
 525	}
 526
 527	return 0;
 528}
 529
 530static int pnv_php_reset_slot(struct hotplug_slot *slot, bool probe)
 531{
 532	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 533	struct pci_dev *bridge = php_slot->pdev;
 534	uint16_t sts;
 535
 536	/*
 537	 * The CAPI folks want pnv_php to drive OpenCAPI slots
 538	 * which don't have a bridge. Only claim to support
 539	 * reset_slot() if we have a bridge device (for now...)
 540	 */
 541	if (probe)
 542		return !bridge;
 543
 544	/* mask our interrupt while resetting the bridge */
 545	if (php_slot->irq > 0)
 546		disable_irq(php_slot->irq);
 547
 548	pci_bridge_secondary_bus_reset(bridge);
 549
 550	/* clear any state changes that happened due to the reset */
 551	pcie_capability_read_word(php_slot->pdev, PCI_EXP_SLTSTA, &sts);
 552	sts &= (PCI_EXP_SLTSTA_PDC | PCI_EXP_SLTSTA_DLLSC);
 553	pcie_capability_write_word(php_slot->pdev, PCI_EXP_SLTSTA, sts);
 554
 555	if (php_slot->irq > 0)
 556		enable_irq(php_slot->irq);
 557
 558	return 0;
 559}
 560
 561static int pnv_php_enable_slot(struct hotplug_slot *slot)
 562{
 563	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 564
 565	return pnv_php_enable(php_slot, true);
 566}
 567
 568static int pnv_php_disable_slot(struct hotplug_slot *slot)
 569{
 570	struct pnv_php_slot *php_slot = to_pnv_php_slot(slot);
 571	int ret;
 572
 573	/*
 574	 * Allow to disable a slot already in the registered state to
 575	 * cover cases where the slot couldn't be enabled and never
 576	 * reached the populated state
 577	 */
 578	if (php_slot->state != PNV_PHP_STATE_POPULATED &&
 579	    php_slot->state != PNV_PHP_STATE_REGISTERED)
 580		return 0;
 581
 582	/* Remove all devices behind the slot */
 583	pci_lock_rescan_remove();
 584	pci_hp_remove_devices(php_slot->bus);
 585	pci_unlock_rescan_remove();
 586
 587	/* Detach the child hotpluggable slots */
 588	pnv_php_unregister(php_slot->dn);
 589
 590	/* Notify firmware and remove device nodes */
 591	ret = pnv_php_set_slot_power_state(slot, OPAL_PCI_SLOT_POWER_OFF);
 592
 593	php_slot->state = PNV_PHP_STATE_REGISTERED;
 594	return ret;
 595}
 596
/*
 * Callback table installed in every slot's hotplug_slot (see
 * pnv_php_alloc_slot()), wiring the handlers defined above to the
 * corresponding hotplug_slot_ops entries.
 */
static const struct hotplug_slot_ops php_slot_ops = {
	.get_power_status	= pnv_php_get_power_state,
	.get_adapter_status	= pnv_php_get_adapter_state,
	.get_attention_status	= pnv_php_get_attention_state,
	.set_attention_status	= pnv_php_set_attention_state,
	.enable_slot		= pnv_php_enable_slot,
	.disable_slot		= pnv_php_disable_slot,
	.reset_slot		= pnv_php_reset_slot,
};
 606
 607static void pnv_php_release(struct pnv_php_slot *php_slot)
 608{
 609	unsigned long flags;
 610
 611	/* Remove from global or child list */
 612	spin_lock_irqsave(&pnv_php_lock, flags);
 613	list_del(&php_slot->link);
 614	spin_unlock_irqrestore(&pnv_php_lock, flags);
 615
 616	/* Detach from parent */
 617	pnv_php_put_slot(php_slot);
 618	pnv_php_put_slot(php_slot->parent);
 619}
 620
 621static struct pnv_php_slot *pnv_php_alloc_slot(struct device_node *dn)
 622{
 623	struct pnv_php_slot *php_slot;
 624	struct pci_bus *bus;
 625	const char *label;
 626	uint64_t id;
 627	int ret;
 628
 629	ret = of_property_read_string(dn, "ibm,slot-label", &label);
 630	if (ret)
 631		return NULL;
 632
 633	if (pnv_pci_get_slot_id(dn, &id))
 634		return NULL;
 635
 636	bus = pci_find_bus_by_node(dn);
 637	if (!bus)
 638		return NULL;
 639
 640	php_slot = kzalloc(sizeof(*php_slot), GFP_KERNEL);
 641	if (!php_slot)
 642		return NULL;
 643
 644	php_slot->name = kstrdup(label, GFP_KERNEL);
 645	if (!php_slot->name) {
 646		kfree(php_slot);
 647		return NULL;
 648	}
 649
 650	if (dn->child && PCI_DN(dn->child))
 651		php_slot->slot_no = PCI_SLOT(PCI_DN(dn->child)->devfn);
 652	else
 653		php_slot->slot_no = -1;   /* Placeholder slot */
 654
 655	kref_init(&php_slot->kref);
 656	php_slot->state	                = PNV_PHP_STATE_INITIALIZED;
 657	php_slot->dn	                = dn;
 658	php_slot->pdev	                = bus->self;
 659	php_slot->bus	                = bus;
 660	php_slot->id	                = id;
 661	php_slot->power_state_check     = false;
 662	php_slot->slot.ops              = &php_slot_ops;
 663
 664	INIT_LIST_HEAD(&php_slot->children);
 665	INIT_LIST_HEAD(&php_slot->link);
 666
 667	return php_slot;
 668}
 669
 670static int pnv_php_register_slot(struct pnv_php_slot *php_slot)
 671{
 672	struct pnv_php_slot *parent;
 673	struct device_node *dn = php_slot->dn;
 674	unsigned long flags;
 675	int ret;
 676
 677	/* Check if the slot is registered or not */
 678	parent = pnv_php_find_slot(php_slot->dn);
 679	if (parent) {
 680		pnv_php_put_slot(parent);
 681		return -EEXIST;
 682	}
 683
 684	/* Register PCI slot */
 685	ret = pci_hp_register(&php_slot->slot, php_slot->bus,
 686			      php_slot->slot_no, php_slot->name);
 687	if (ret) {
 688		SLOT_WARN(php_slot, "Error %d registering slot\n", ret);
 689		return ret;
 690	}
 691
 692	/* Attach to the parent's child list or global list */
 693	while ((dn = of_get_parent(dn))) {
 694		if (!PCI_DN(dn)) {
 695			of_node_put(dn);
 696			break;
 697		}
 698
 699		parent = pnv_php_find_slot(dn);
 700		if (parent) {
 701			of_node_put(dn);
 702			break;
 703		}
 704
 705		of_node_put(dn);
 706	}
 707
 708	spin_lock_irqsave(&pnv_php_lock, flags);
 709	php_slot->parent = parent;
 710	if (parent)
 711		list_add_tail(&php_slot->link, &parent->children);
 712	else
 713		list_add_tail(&php_slot->link, &pnv_php_slot_list);
 714	spin_unlock_irqrestore(&pnv_php_lock, flags);
 715
 716	php_slot->state = PNV_PHP_STATE_REGISTERED;
 717	return 0;
 718}
 719
 720static int pnv_php_enable_msix(struct pnv_php_slot *php_slot)
 721{
 722	struct pci_dev *pdev = php_slot->pdev;
 723	struct msix_entry entry;
 724	int nr_entries, ret;
 725	u16 pcie_flag;
 726
 727	/* Get total number of MSIx entries */
 728	nr_entries = pci_msix_vec_count(pdev);
 729	if (nr_entries < 0)
 730		return nr_entries;
 731
 732	/* Check hotplug MSIx entry is in range */
 733	pcie_capability_read_word(pdev, PCI_EXP_FLAGS, &pcie_flag);
 734	entry.entry = (pcie_flag & PCI_EXP_FLAGS_IRQ) >> 9;
 735	if (entry.entry >= nr_entries)
 736		return -ERANGE;
 737
 738	/* Enable MSIx */
 739	ret = pci_enable_msix_exact(pdev, &entry, 1);
 740	if (ret) {
 741		SLOT_WARN(php_slot, "Error %d enabling MSIx\n", ret);
 742		return ret;
 743	}
 744
 745	return entry.vector;
 746}
 747
 748static void pnv_php_event_handler(struct work_struct *work)
 749{
 750	struct pnv_php_event *event =
 751		container_of(work, struct pnv_php_event, work);
 752	struct pnv_php_slot *php_slot = event->php_slot;
 753
 754	if (event->added)
 755		pnv_php_enable_slot(&php_slot->slot);
 756	else
 757		pnv_php_disable_slot(&php_slot->slot);
 758
 759	kfree(event);
 760}
 761
 762static irqreturn_t pnv_php_interrupt(int irq, void *data)
 763{
 764	struct pnv_php_slot *php_slot = data;
 765	struct pci_dev *pchild, *pdev = php_slot->pdev;
 766	struct eeh_dev *edev;
 767	struct eeh_pe *pe;
 768	struct pnv_php_event *event;
 769	u16 sts, lsts;
 770	u8 presence;
 771	bool added;
 772	unsigned long flags;
 773	int ret;
 774
 775	pcie_capability_read_word(pdev, PCI_EXP_SLTSTA, &sts);
 776	sts &= (PCI_EXP_SLTSTA_PDC | PCI_EXP_SLTSTA_DLLSC);
 777	pcie_capability_write_word(pdev, PCI_EXP_SLTSTA, sts);
 778
 779	pci_dbg(pdev, "PCI slot [%s]: HP int! DLAct: %d, PresDet: %d\n",
 780			php_slot->name,
 781			!!(sts & PCI_EXP_SLTSTA_DLLSC),
 782			!!(sts & PCI_EXP_SLTSTA_PDC));
 783
 784	if (sts & PCI_EXP_SLTSTA_DLLSC) {
 785		pcie_capability_read_word(pdev, PCI_EXP_LNKSTA, &lsts);
 786		added = !!(lsts & PCI_EXP_LNKSTA_DLLLA);
 787	} else if (!(php_slot->flags & PNV_PHP_FLAG_BROKEN_PDC) &&
 788		   (sts & PCI_EXP_SLTSTA_PDC)) {
 789		ret = pnv_pci_get_presence_state(php_slot->id, &presence);
 790		if (ret) {
 791			SLOT_WARN(php_slot,
 792				  "PCI slot [%s] error %d getting presence (0x%04x), to retry the operation.\n",
 793				  php_slot->name, ret, sts);
 794			return IRQ_HANDLED;
 795		}
 796
 797		added = !!(presence == OPAL_PCI_SLOT_PRESENT);
 798	} else {
 799		pci_dbg(pdev, "PCI slot [%s]: Spurious IRQ?\n", php_slot->name);
 800		return IRQ_NONE;
 801	}
 802
 803	/* Freeze the removed PE to avoid unexpected error reporting */
 804	if (!added) {
 805		pchild = list_first_entry_or_null(&php_slot->bus->devices,
 806						  struct pci_dev, bus_list);
 807		edev = pchild ? pci_dev_to_eeh_dev(pchild) : NULL;
 808		pe = edev ? edev->pe : NULL;
 809		if (pe) {
 810			eeh_serialize_lock(&flags);
 811			eeh_pe_mark_isolated(pe);
 812			eeh_serialize_unlock(flags);
 813			eeh_pe_set_option(pe, EEH_OPT_FREEZE_PE);
 814		}
 815	}
 816
 817	/*
 818	 * The PE is left in frozen state if the event is missed. It's
 819	 * fine as the PCI devices (PE) aren't functional any more.
 820	 */
 821	event = kzalloc(sizeof(*event), GFP_ATOMIC);
 822	if (!event) {
 823		SLOT_WARN(php_slot,
 824			  "PCI slot [%s] missed hotplug event 0x%04x\n",
 825			  php_slot->name, sts);
 826		return IRQ_HANDLED;
 827	}
 828
 829	pci_info(pdev, "PCI slot [%s] %s (IRQ: %d)\n",
 830		 php_slot->name, added ? "added" : "removed", irq);
 831	INIT_WORK(&event->work, pnv_php_event_handler);
 832	event->added = added;
 833	event->php_slot = php_slot;
 834	queue_work(php_slot->wq, &event->work);
 835
 836	return IRQ_HANDLED;
 837}
 838
 839static void pnv_php_init_irq(struct pnv_php_slot *php_slot, int irq)
 840{
 841	struct pci_dev *pdev = php_slot->pdev;
 842	u32 broken_pdc = 0;
 843	u16 sts, ctrl;
 844	int ret;
 845
 846	/* Allocate workqueue */
 847	php_slot->wq = alloc_workqueue("pciehp-%s", 0, 0, php_slot->name);
 848	if (!php_slot->wq) {
 849		SLOT_WARN(php_slot, "Cannot alloc workqueue\n");
 850		pnv_php_disable_irq(php_slot, true);
 851		return;
 852	}
 853
 854	/* Check PDC (Presence Detection Change) is broken or not */
 855	ret = of_property_read_u32(php_slot->dn, "ibm,slot-broken-pdc",
 856				   &broken_pdc);
 857	if (!ret && broken_pdc)
 858		php_slot->flags |= PNV_PHP_FLAG_BROKEN_PDC;
 859
 860	/* Clear pending interrupts */
 861	pcie_capability_read_word(pdev, PCI_EXP_SLTSTA, &sts);
 862	if (php_slot->flags & PNV_PHP_FLAG_BROKEN_PDC)
 863		sts |= PCI_EXP_SLTSTA_DLLSC;
 864	else
 865		sts |= (PCI_EXP_SLTSTA_PDC | PCI_EXP_SLTSTA_DLLSC);
 866	pcie_capability_write_word(pdev, PCI_EXP_SLTSTA, sts);
 867
 868	/* Request the interrupt */
 869	ret = request_irq(irq, pnv_php_interrupt, IRQF_SHARED,
 870			  php_slot->name, php_slot);
 871	if (ret) {
 872		pnv_php_disable_irq(php_slot, true);
 873		SLOT_WARN(php_slot, "Error %d enabling IRQ %d\n", ret, irq);
 874		return;
 875	}
 876
 877	/* Enable the interrupts */
 878	pcie_capability_read_word(pdev, PCI_EXP_SLTCTL, &ctrl);
 879	if (php_slot->flags & PNV_PHP_FLAG_BROKEN_PDC) {
 880		ctrl &= ~PCI_EXP_SLTCTL_PDCE;
 881		ctrl |= (PCI_EXP_SLTCTL_HPIE |
 882			 PCI_EXP_SLTCTL_DLLSCE);
 883	} else {
 884		ctrl |= (PCI_EXP_SLTCTL_HPIE |
 885			 PCI_EXP_SLTCTL_PDCE |
 886			 PCI_EXP_SLTCTL_DLLSCE);
 887	}
 888	pcie_capability_write_word(pdev, PCI_EXP_SLTCTL, ctrl);
 889
 890	/* The interrupt is initialized successfully when @irq is valid */
 891	php_slot->irq = irq;
 892}
 893
 894static void pnv_php_enable_irq(struct pnv_php_slot *php_slot)
 895{
 896	struct pci_dev *pdev = php_slot->pdev;
 897	int irq, ret;
 898
 899	/*
 900	 * The MSI/MSIx interrupt might have been occupied by other
 901	 * drivers. Don't populate the surprise hotplug capability
 902	 * in that case.
 903	 */
 904	if (pci_dev_msi_enabled(pdev))
 905		return;
 906
 907	ret = pci_enable_device(pdev);
 908	if (ret) {
 909		SLOT_WARN(php_slot, "Error %d enabling device\n", ret);
 910		return;
 911	}
 912
 913	pci_set_master(pdev);
 914
 915	/* Enable MSIx interrupt */
 916	irq = pnv_php_enable_msix(php_slot);
 917	if (irq > 0) {
 918		pnv_php_init_irq(php_slot, irq);
 919		return;
 920	}
 921
 922	/*
 923	 * Use MSI if MSIx doesn't work. Fail back to legacy INTx
 924	 * if MSI doesn't work either
 925	 */
 926	ret = pci_enable_msi(pdev);
 927	if (!ret || pdev->irq) {
 928		irq = pdev->irq;
 929		pnv_php_init_irq(php_slot, irq);
 930	}
 931}
 932
 933static int pnv_php_register_one(struct device_node *dn)
 934{
 935	struct pnv_php_slot *php_slot;
 936	u32 prop32;
 937	int ret;
 938
 939	/* Check if it's hotpluggable slot */
 940	ret = of_property_read_u32(dn, "ibm,slot-pluggable", &prop32);
 941	if (ret || !prop32)
 942		return -ENXIO;
 943
 944	ret = of_property_read_u32(dn, "ibm,reset-by-firmware", &prop32);
 945	if (ret || !prop32)
 946		return -ENXIO;
 947
 948	php_slot = pnv_php_alloc_slot(dn);
 949	if (!php_slot)
 950		return -ENODEV;
 951
 952	ret = pnv_php_register_slot(php_slot);
 953	if (ret)
 954		goto free_slot;
 955
 956	ret = pnv_php_enable(php_slot, false);
 957	if (ret)
 958		goto unregister_slot;
 959
 960	/* Enable interrupt if the slot supports surprise hotplug */
 961	ret = of_property_read_u32(dn, "ibm,slot-surprise-pluggable", &prop32);
 962	if (!ret && prop32)
 963		pnv_php_enable_irq(php_slot);
 964
 965	return 0;
 966
 967unregister_slot:
 968	pnv_php_unregister_one(php_slot->dn);
 969free_slot:
 970	pnv_php_put_slot(php_slot);
 971	return ret;
 972}
 973
 974static void pnv_php_register(struct device_node *dn)
 975{
 976	struct device_node *child;
 977
 978	/*
 979	 * The parent slots should be registered before their
 980	 * child slots.
 981	 */
 982	for_each_child_of_node(dn, child) {
 983		pnv_php_register_one(child);
 984		pnv_php_register(child);
 985	}
 986}
 987
 988static void pnv_php_unregister_one(struct device_node *dn)
 989{
 990	struct pnv_php_slot *php_slot;
 991
 992	php_slot = pnv_php_find_slot(dn);
 993	if (!php_slot)
 994		return;
 995
 996	php_slot->state = PNV_PHP_STATE_OFFLINE;
 997	pci_hp_deregister(&php_slot->slot);
 998	pnv_php_release(php_slot);
 999	pnv_php_put_slot(php_slot);
1000}
1001
1002static void pnv_php_unregister(struct device_node *dn)
1003{
1004	struct device_node *child;
1005
1006	/* The child slots should go before their parent slots */
1007	for_each_child_of_node(dn, child) {
1008		pnv_php_unregister(child);
1009		pnv_php_unregister_one(child);
1010	}
1011}
1012
1013static int __init pnv_php_init(void)
1014{
1015	struct device_node *dn;
1016
1017	pr_info(DRIVER_DESC " version: " DRIVER_VERSION "\n");
1018	for_each_compatible_node(dn, NULL, "ibm,ioda2-phb")
1019		pnv_php_register(dn);
1020
1021	for_each_compatible_node(dn, NULL, "ibm,ioda3-phb")
1022		pnv_php_register(dn);
1023
1024	for_each_compatible_node(dn, NULL, "ibm,ioda2-npu2-opencapi-phb")
1025		pnv_php_register_one(dn); /* slot directly under the PHB */
1026	return 0;
1027}
1028
1029static void __exit pnv_php_exit(void)
1030{
1031	struct device_node *dn;
1032
1033	for_each_compatible_node(dn, NULL, "ibm,ioda2-phb")
1034		pnv_php_unregister(dn);
1035
1036	for_each_compatible_node(dn, NULL, "ibm,ioda3-phb")
1037		pnv_php_unregister(dn);
1038
1039	for_each_compatible_node(dn, NULL, "ibm,ioda2-npu2-opencapi-phb")
1040		pnv_php_unregister_one(dn); /* slot directly under the PHB */
1041}
1042
/* Module entry and exit points. */
module_init(pnv_php_init);
module_exit(pnv_php_exit);

/* Module metadata, built from the DRIVER_* strings defined at the top. */
MODULE_VERSION(DRIVER_VERSION);
MODULE_LICENSE("GPL v2");
MODULE_AUTHOR(DRIVER_AUTHOR);
MODULE_DESCRIPTION(DRIVER_DESC);