eeh_pe.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652
  1. /*
  2. * The file intends to implement PE based on the information from
  3. * platforms. Basically, there have 3 types of PEs: PHB/Bus/Device.
  4. * All the PEs should be organized as hierarchy tree. The first level
  5. * of the tree will be associated to existing PHBs since the particular
  6. * PE is only meaningful in one PHB domain.
  7. *
  8. * Copyright Benjamin Herrenschmidt & Gavin Shan, IBM Corporation 2012.
  9. *
  10. * This program is free software; you can redistribute it and/or modify
  11. * it under the terms of the GNU General Public License as published by
  12. * the Free Software Foundation; either version 2 of the License, or
  13. * (at your option) any later version.
  14. *
  15. * This program is distributed in the hope that it will be useful,
  16. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  17. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  18. * GNU General Public License for more details.
  19. *
  20. * You should have received a copy of the GNU General Public License
  21. * along with this program; if not, write to the Free Software
  22. * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  23. */
  24. #include <linux/export.h>
  25. #include <linux/gfp.h>
  26. #include <linux/init.h>
  27. #include <linux/kernel.h>
  28. #include <linux/pci.h>
  29. #include <linux/string.h>
  30. #include <asm/pci-bridge.h>
  31. #include <asm/ppc-pci.h>
  32. static LIST_HEAD(eeh_phb_pe);
  33. /**
  34. * eeh_pe_alloc - Allocate PE
  35. * @phb: PCI controller
  36. * @type: PE type
  37. *
  38. * Allocate PE instance dynamically.
  39. */
  40. static struct eeh_pe *eeh_pe_alloc(struct pci_controller *phb, int type)
  41. {
  42. struct eeh_pe *pe;
  43. /* Allocate PHB PE */
  44. pe = kzalloc(sizeof(struct eeh_pe), GFP_KERNEL);
  45. if (!pe) return NULL;
  46. /* Initialize PHB PE */
  47. pe->type = type;
  48. pe->phb = phb;
  49. INIT_LIST_HEAD(&pe->child_list);
  50. INIT_LIST_HEAD(&pe->child);
  51. INIT_LIST_HEAD(&pe->edevs);
  52. return pe;
  53. }
  54. /**
  55. * eeh_phb_pe_create - Create PHB PE
  56. * @phb: PCI controller
  57. *
  58. * The function should be called while the PHB is detected during
  59. * system boot or PCI hotplug in order to create PHB PE.
  60. */
  61. int eeh_phb_pe_create(struct pci_controller *phb)
  62. {
  63. struct eeh_pe *pe;
  64. /* Allocate PHB PE */
  65. pe = eeh_pe_alloc(phb, EEH_PE_PHB);
  66. if (!pe) {
  67. pr_err("%s: out of memory!\n", __func__);
  68. return -ENOMEM;
  69. }
  70. /* Put it into the list */
  71. eeh_lock();
  72. list_add_tail(&pe->child, &eeh_phb_pe);
  73. eeh_unlock();
  74. pr_debug("EEH: Add PE for PHB#%d\n", phb->global_number);
  75. return 0;
  76. }
  77. /**
  78. * eeh_phb_pe_get - Retrieve PHB PE based on the given PHB
  79. * @phb: PCI controller
  80. *
  81. * The overall PEs form hierarchy tree. The first layer of the
  82. * hierarchy tree is composed of PHB PEs. The function is used
  83. * to retrieve the corresponding PHB PE according to the given PHB.
  84. */
  85. static struct eeh_pe *eeh_phb_pe_get(struct pci_controller *phb)
  86. {
  87. struct eeh_pe *pe;
  88. list_for_each_entry(pe, &eeh_phb_pe, child) {
  89. /*
  90. * Actually, we needn't check the type since
  91. * the PE for PHB has been determined when that
  92. * was created.
  93. */
  94. if ((pe->type & EEH_PE_PHB) && pe->phb == phb)
  95. return pe;
  96. }
  97. return NULL;
  98. }
  99. /**
  100. * eeh_pe_next - Retrieve the next PE in the tree
  101. * @pe: current PE
  102. * @root: root PE
  103. *
  104. * The function is used to retrieve the next PE in the
  105. * hierarchy PE tree.
  106. */
  107. static struct eeh_pe *eeh_pe_next(struct eeh_pe *pe,
  108. struct eeh_pe *root)
  109. {
  110. struct list_head *next = pe->child_list.next;
  111. if (next == &pe->child_list) {
  112. while (1) {
  113. if (pe == root)
  114. return NULL;
  115. next = pe->child.next;
  116. if (next != &pe->parent->child_list)
  117. break;
  118. pe = pe->parent;
  119. }
  120. }
  121. return list_entry(next, struct eeh_pe, child);
  122. }
  123. /**
  124. * eeh_pe_traverse - Traverse PEs in the specified PHB
  125. * @root: root PE
  126. * @fn: callback
  127. * @flag: extra parameter to callback
  128. *
  129. * The function is used to traverse the specified PE and its
  130. * child PEs. The traversing is to be terminated once the
  131. * callback returns something other than NULL, or no more PEs
  132. * to be traversed.
  133. */
  134. static void *eeh_pe_traverse(struct eeh_pe *root,
  135. eeh_traverse_func fn, void *flag)
  136. {
  137. struct eeh_pe *pe;
  138. void *ret;
  139. for (pe = root; pe; pe = eeh_pe_next(pe, root)) {
  140. ret = fn(pe, flag);
  141. if (ret) return ret;
  142. }
  143. return NULL;
  144. }
  145. /**
  146. * eeh_pe_dev_traverse - Traverse the devices from the PE
  147. * @root: EEH PE
  148. * @fn: function callback
  149. * @flag: extra parameter to callback
  150. *
  151. * The function is used to traverse the devices of the specified
  152. * PE and its child PEs.
  153. */
  154. void *eeh_pe_dev_traverse(struct eeh_pe *root,
  155. eeh_traverse_func fn, void *flag)
  156. {
  157. struct eeh_pe *pe;
  158. struct eeh_dev *edev;
  159. void *ret;
  160. if (!root) {
  161. pr_warning("%s: Invalid PE %p\n", __func__, root);
  162. return NULL;
  163. }
  164. eeh_lock();
  165. /* Traverse root PE */
  166. for (pe = root; pe; pe = eeh_pe_next(pe, root)) {
  167. eeh_pe_for_each_dev(pe, edev) {
  168. ret = fn(edev, flag);
  169. if (ret) {
  170. eeh_unlock();
  171. return ret;
  172. }
  173. }
  174. }
  175. eeh_unlock();
  176. return NULL;
  177. }
  178. /**
  179. * __eeh_pe_get - Check the PE address
  180. * @data: EEH PE
  181. * @flag: EEH device
  182. *
  183. * For one particular PE, it can be identified by PE address
  184. * or tranditional BDF address. BDF address is composed of
  185. * Bus/Device/Function number. The extra data referred by flag
  186. * indicates which type of address should be used.
  187. */
  188. static void *__eeh_pe_get(void *data, void *flag)
  189. {
  190. struct eeh_pe *pe = (struct eeh_pe *)data;
  191. struct eeh_dev *edev = (struct eeh_dev *)flag;
  192. /* Unexpected PHB PE */
  193. if (pe->type & EEH_PE_PHB)
  194. return NULL;
  195. /* We prefer PE address */
  196. if (edev->pe_config_addr &&
  197. (edev->pe_config_addr == pe->addr))
  198. return pe;
  199. /* Try BDF address */
  200. if (edev->pe_config_addr &&
  201. (edev->config_addr == pe->config_addr))
  202. return pe;
  203. return NULL;
  204. }
  205. /**
  206. * eeh_pe_get - Search PE based on the given address
  207. * @edev: EEH device
  208. *
  209. * Search the corresponding PE based on the specified address which
  210. * is included in the eeh device. The function is used to check if
  211. * the associated PE has been created against the PE address. It's
  212. * notable that the PE address has 2 format: traditional PE address
  213. * which is composed of PCI bus/device/function number, or unified
  214. * PE address.
  215. */
  216. static struct eeh_pe *eeh_pe_get(struct eeh_dev *edev)
  217. {
  218. struct eeh_pe *root = eeh_phb_pe_get(edev->phb);
  219. struct eeh_pe *pe;
  220. pe = eeh_pe_traverse(root, __eeh_pe_get, edev);
  221. return pe;
  222. }
  223. /**
  224. * eeh_pe_get_parent - Retrieve the parent PE
  225. * @edev: EEH device
  226. *
  227. * The whole PEs existing in the system are organized as hierarchy
  228. * tree. The function is used to retrieve the parent PE according
  229. * to the parent EEH device.
  230. */
  231. static struct eeh_pe *eeh_pe_get_parent(struct eeh_dev *edev)
  232. {
  233. struct device_node *dn;
  234. struct eeh_dev *parent;
  235. /*
  236. * It might have the case for the indirect parent
  237. * EEH device already having associated PE, but
  238. * the direct parent EEH device doesn't have yet.
  239. */
  240. dn = edev->dn->parent;
  241. while (dn) {
  242. /* We're poking out of PCI territory */
  243. if (!PCI_DN(dn)) return NULL;
  244. parent = of_node_to_eeh_dev(dn);
  245. /* We're poking out of PCI territory */
  246. if (!parent) return NULL;
  247. if (parent->pe)
  248. return parent->pe;
  249. dn = dn->parent;
  250. }
  251. return NULL;
  252. }
  253. /**
  254. * eeh_add_to_parent_pe - Add EEH device to parent PE
  255. * @edev: EEH device
  256. *
  257. * Add EEH device to the parent PE. If the parent PE already
  258. * exists, the PE type will be changed to EEH_PE_BUS. Otherwise,
  259. * we have to create new PE to hold the EEH device and the new
  260. * PE will be linked to its parent PE as well.
  261. */
  262. int eeh_add_to_parent_pe(struct eeh_dev *edev)
  263. {
  264. struct eeh_pe *pe, *parent;
  265. eeh_lock();
  266. /*
  267. * Search the PE has been existing or not according
  268. * to the PE address. If that has been existing, the
  269. * PE should be composed of PCI bus and its subordinate
  270. * components.
  271. */
  272. pe = eeh_pe_get(edev);
  273. if (pe && !(pe->type & EEH_PE_INVALID)) {
  274. if (!edev->pe_config_addr) {
  275. eeh_unlock();
  276. pr_err("%s: PE with addr 0x%x already exists\n",
  277. __func__, edev->config_addr);
  278. return -EEXIST;
  279. }
  280. /* Mark the PE as type of PCI bus */
  281. pe->type = EEH_PE_BUS;
  282. edev->pe = pe;
  283. /* Put the edev to PE */
  284. list_add_tail(&edev->list, &pe->edevs);
  285. eeh_unlock();
  286. pr_debug("EEH: Add %s to Bus PE#%x\n",
  287. edev->dn->full_name, pe->addr);
  288. return 0;
  289. } else if (pe && (pe->type & EEH_PE_INVALID)) {
  290. list_add_tail(&edev->list, &pe->edevs);
  291. edev->pe = pe;
  292. /*
  293. * We're running to here because of PCI hotplug caused by
  294. * EEH recovery. We need clear EEH_PE_INVALID until the top.
  295. */
  296. parent = pe;
  297. while (parent) {
  298. if (!(parent->type & EEH_PE_INVALID))
  299. break;
  300. parent->type &= ~EEH_PE_INVALID;
  301. parent = parent->parent;
  302. }
  303. eeh_unlock();
  304. pr_debug("EEH: Add %s to Device PE#%x, Parent PE#%x\n",
  305. edev->dn->full_name, pe->addr, pe->parent->addr);
  306. return 0;
  307. }
  308. /* Create a new EEH PE */
  309. pe = eeh_pe_alloc(edev->phb, EEH_PE_DEVICE);
  310. if (!pe) {
  311. eeh_unlock();
  312. pr_err("%s: out of memory!\n", __func__);
  313. return -ENOMEM;
  314. }
  315. pe->addr = edev->pe_config_addr;
  316. pe->config_addr = edev->config_addr;
  317. /*
  318. * Put the new EEH PE into hierarchy tree. If the parent
  319. * can't be found, the newly created PE will be attached
  320. * to PHB directly. Otherwise, we have to associate the
  321. * PE with its parent.
  322. */
  323. parent = eeh_pe_get_parent(edev);
  324. if (!parent) {
  325. parent = eeh_phb_pe_get(edev->phb);
  326. if (!parent) {
  327. eeh_unlock();
  328. pr_err("%s: No PHB PE is found (PHB Domain=%d)\n",
  329. __func__, edev->phb->global_number);
  330. edev->pe = NULL;
  331. kfree(pe);
  332. return -EEXIST;
  333. }
  334. }
  335. pe->parent = parent;
  336. /*
  337. * Put the newly created PE into the child list and
  338. * link the EEH device accordingly.
  339. */
  340. list_add_tail(&pe->child, &parent->child_list);
  341. list_add_tail(&edev->list, &pe->edevs);
  342. edev->pe = pe;
  343. eeh_unlock();
  344. pr_debug("EEH: Add %s to Device PE#%x, Parent PE#%x\n",
  345. edev->dn->full_name, pe->addr, pe->parent->addr);
  346. return 0;
  347. }
  348. /**
  349. * eeh_rmv_from_parent_pe - Remove one EEH device from the associated PE
  350. * @edev: EEH device
  351. * @purge_pe: remove PE or not
  352. *
  353. * The PE hierarchy tree might be changed when doing PCI hotplug.
  354. * Also, the PCI devices or buses could be removed from the system
  355. * during EEH recovery. So we have to call the function remove the
  356. * corresponding PE accordingly if necessary.
  357. */
  358. int eeh_rmv_from_parent_pe(struct eeh_dev *edev, int purge_pe)
  359. {
  360. struct eeh_pe *pe, *parent, *child;
  361. int cnt;
  362. if (!edev->pe) {
  363. pr_warning("%s: No PE found for EEH device %s\n",
  364. __func__, edev->dn->full_name);
  365. return -EEXIST;
  366. }
  367. eeh_lock();
  368. /* Remove the EEH device */
  369. pe = edev->pe;
  370. edev->pe = NULL;
  371. list_del(&edev->list);
  372. /*
  373. * Check if the parent PE includes any EEH devices.
  374. * If not, we should delete that. Also, we should
  375. * delete the parent PE if it doesn't have associated
  376. * child PEs and EEH devices.
  377. */
  378. while (1) {
  379. parent = pe->parent;
  380. if (pe->type & EEH_PE_PHB)
  381. break;
  382. if (purge_pe) {
  383. if (list_empty(&pe->edevs) &&
  384. list_empty(&pe->child_list)) {
  385. list_del(&pe->child);
  386. kfree(pe);
  387. } else {
  388. break;
  389. }
  390. } else {
  391. if (list_empty(&pe->edevs)) {
  392. cnt = 0;
  393. list_for_each_entry(child, &pe->child_list, child) {
  394. if (!(child->type & EEH_PE_INVALID)) {
  395. cnt++;
  396. break;
  397. }
  398. }
  399. if (!cnt)
  400. pe->type |= EEH_PE_INVALID;
  401. else
  402. break;
  403. }
  404. }
  405. pe = parent;
  406. }
  407. eeh_unlock();
  408. return 0;
  409. }
  410. /**
  411. * __eeh_pe_state_mark - Mark the state for the PE
  412. * @data: EEH PE
  413. * @flag: state
  414. *
  415. * The function is used to mark the indicated state for the given
  416. * PE. Also, the associated PCI devices will be put into IO frozen
  417. * state as well.
  418. */
  419. static void *__eeh_pe_state_mark(void *data, void *flag)
  420. {
  421. struct eeh_pe *pe = (struct eeh_pe *)data;
  422. int state = *((int *)flag);
  423. struct eeh_dev *tmp;
  424. struct pci_dev *pdev;
  425. /*
  426. * Mark the PE with the indicated state. Also,
  427. * the associated PCI device will be put into
  428. * I/O frozen state to avoid I/O accesses from
  429. * the PCI device driver.
  430. */
  431. pe->state |= state;
  432. eeh_pe_for_each_dev(pe, tmp) {
  433. pdev = eeh_dev_to_pci_dev(tmp);
  434. if (pdev)
  435. pdev->error_state = pci_channel_io_frozen;
  436. }
  437. return NULL;
  438. }
  439. /**
  440. * eeh_pe_state_mark - Mark specified state for PE and its associated device
  441. * @pe: EEH PE
  442. *
  443. * EEH error affects the current PE and its child PEs. The function
  444. * is used to mark appropriate state for the affected PEs and the
  445. * associated devices.
  446. */
  447. void eeh_pe_state_mark(struct eeh_pe *pe, int state)
  448. {
  449. eeh_lock();
  450. eeh_pe_traverse(pe, __eeh_pe_state_mark, &state);
  451. eeh_unlock();
  452. }
  453. /**
  454. * __eeh_pe_state_clear - Clear state for the PE
  455. * @data: EEH PE
  456. * @flag: state
  457. *
  458. * The function is used to clear the indicated state from the
  459. * given PE. Besides, we also clear the check count of the PE
  460. * as well.
  461. */
  462. static void *__eeh_pe_state_clear(void *data, void *flag)
  463. {
  464. struct eeh_pe *pe = (struct eeh_pe *)data;
  465. int state = *((int *)flag);
  466. pe->state &= ~state;
  467. pe->check_count = 0;
  468. return NULL;
  469. }
  470. /**
  471. * eeh_pe_state_clear - Clear state for the PE and its children
  472. * @pe: PE
  473. * @state: state to be cleared
  474. *
  475. * When the PE and its children has been recovered from error,
  476. * we need clear the error state for that. The function is used
  477. * for the purpose.
  478. */
  479. void eeh_pe_state_clear(struct eeh_pe *pe, int state)
  480. {
  481. eeh_lock();
  482. eeh_pe_traverse(pe, __eeh_pe_state_clear, &state);
  483. eeh_unlock();
  484. }
  485. /**
  486. * eeh_restore_one_device_bars - Restore the Base Address Registers for one device
  487. * @data: EEH device
  488. * @flag: Unused
  489. *
  490. * Loads the PCI configuration space base address registers,
  491. * the expansion ROM base address, the latency timer, and etc.
  492. * from the saved values in the device node.
  493. */
  494. static void *eeh_restore_one_device_bars(void *data, void *flag)
  495. {
  496. int i;
  497. u32 cmd;
  498. struct eeh_dev *edev = (struct eeh_dev *)data;
  499. struct device_node *dn = eeh_dev_to_of_node(edev);
  500. for (i = 4; i < 10; i++)
  501. eeh_ops->write_config(dn, i*4, 4, edev->config_space[i]);
  502. /* 12 == Expansion ROM Address */
  503. eeh_ops->write_config(dn, 12*4, 4, edev->config_space[12]);
  504. #define BYTE_SWAP(OFF) (8*((OFF)/4)+3-(OFF))
  505. #define SAVED_BYTE(OFF) (((u8 *)(edev->config_space))[BYTE_SWAP(OFF)])
  506. eeh_ops->write_config(dn, PCI_CACHE_LINE_SIZE, 1,
  507. SAVED_BYTE(PCI_CACHE_LINE_SIZE));
  508. eeh_ops->write_config(dn, PCI_LATENCY_TIMER, 1,
  509. SAVED_BYTE(PCI_LATENCY_TIMER));
  510. /* max latency, min grant, interrupt pin and line */
  511. eeh_ops->write_config(dn, 15*4, 4, edev->config_space[15]);
  512. /*
  513. * Restore PERR & SERR bits, some devices require it,
  514. * don't touch the other command bits
  515. */
  516. eeh_ops->read_config(dn, PCI_COMMAND, 4, &cmd);
  517. if (edev->config_space[1] & PCI_COMMAND_PARITY)
  518. cmd |= PCI_COMMAND_PARITY;
  519. else
  520. cmd &= ~PCI_COMMAND_PARITY;
  521. if (edev->config_space[1] & PCI_COMMAND_SERR)
  522. cmd |= PCI_COMMAND_SERR;
  523. else
  524. cmd &= ~PCI_COMMAND_SERR;
  525. eeh_ops->write_config(dn, PCI_COMMAND, 4, cmd);
  526. return NULL;
  527. }
  528. /**
  529. * eeh_pe_restore_bars - Restore the PCI config space info
  530. * @pe: EEH PE
  531. *
  532. * This routine performs a recursive walk to the children
  533. * of this device as well.
  534. */
  535. void eeh_pe_restore_bars(struct eeh_pe *pe)
  536. {
  537. /*
  538. * We needn't take the EEH lock since eeh_pe_dev_traverse()
  539. * will take that.
  540. */
  541. eeh_pe_dev_traverse(pe, eeh_restore_one_device_bars, NULL);
  542. }
  543. /**
  544. * eeh_pe_bus_get - Retrieve PCI bus according to the given PE
  545. * @pe: EEH PE
  546. *
  547. * Retrieve the PCI bus according to the given PE. Basically,
  548. * there're 3 types of PEs: PHB/Bus/Device. For PHB PE, the
  549. * primary PCI bus will be retrieved. The parent bus will be
  550. * returned for BUS PE. However, we don't have associated PCI
  551. * bus for DEVICE PE.
  552. */
  553. struct pci_bus *eeh_pe_bus_get(struct eeh_pe *pe)
  554. {
  555. struct pci_bus *bus = NULL;
  556. struct eeh_dev *edev;
  557. struct pci_dev *pdev;
  558. eeh_lock();
  559. if (pe->type & EEH_PE_PHB) {
  560. bus = pe->phb->bus;
  561. } else if (pe->type & EEH_PE_BUS) {
  562. edev = list_first_entry(&pe->edevs, struct eeh_dev, list);
  563. pdev = eeh_dev_to_pci_dev(edev);
  564. if (pdev)
  565. bus = pdev->bus;
  566. }
  567. eeh_unlock();
  568. return bus;
  569. }