aerdrv.c 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353
  1. /*
  2. * drivers/pci/pcie/aer/aerdrv.c
  3. *
  4. * This file is subject to the terms and conditions of the GNU General Public
  5. * License. See the file "COPYING" in the main directory of this archive
  6. * for more details.
  7. *
  8. * This file implements the AER root port service driver. The driver will
  9. * register an irq handler. When root port triggers an AER interrupt, the irq
  10. * handler will collect root port status and schedule a work.
  11. *
  12. * Copyright (C) 2006 Intel Corp.
  13. * Tom Long Nguyen (tom.l.nguyen@intel.com)
  14. * Zhang Yanmin (yanmin.zhang@intel.com)
  15. *
  16. */
  17. #include <linux/module.h>
  18. #include <linux/pci.h>
  19. #include <linux/kernel.h>
  20. #include <linux/errno.h>
  21. #include <linux/pm.h>
  22. #include <linux/init.h>
  23. #include <linux/interrupt.h>
  24. #include <linux/delay.h>
  25. #include <linux/pcieport_if.h>
  26. #include "aerdrv.h"
  27. /*
  28. * Version Information
  29. */
  30. #define DRIVER_VERSION "v1.0"
  31. #define DRIVER_AUTHOR "tom.l.nguyen@intel.com"
  32. #define DRIVER_DESC "Root Port Advanced Error Reporting Driver"
  33. MODULE_AUTHOR(DRIVER_AUTHOR);
  34. MODULE_DESCRIPTION(DRIVER_DESC);
  35. MODULE_LICENSE("GPL");
  36. static int __devinit aer_probe (struct pcie_device *dev,
  37. const struct pcie_port_service_id *id );
  38. static void aer_remove(struct pcie_device *dev);
  39. static int aer_suspend(struct pcie_device *dev, pm_message_t state)
  40. {return 0;}
  41. static int aer_resume(struct pcie_device *dev) {return 0;}
  42. static pci_ers_result_t aer_error_detected(struct pci_dev *dev,
  43. enum pci_channel_state error);
  44. static void aer_error_resume(struct pci_dev *dev);
  45. static pci_ers_result_t aer_root_reset(struct pci_dev *dev);
  46. /*
  47. * PCI Express bus's AER Root service driver data structure
  48. */
  49. static struct pcie_port_service_id aer_id[] = {
  50. {
  51. .vendor = PCI_ANY_ID,
  52. .device = PCI_ANY_ID,
  53. .port_type = PCIE_RC_PORT,
  54. .service_type = PCIE_PORT_SERVICE_AER,
  55. },
  56. { /* end: all zeroes */ }
  57. };
  58. static struct pci_error_handlers aer_error_handlers = {
  59. .error_detected = aer_error_detected,
  60. .resume = aer_error_resume,
  61. };
  62. static struct pcie_port_service_driver aerdriver = {
  63. .name = "aer",
  64. .id_table = &aer_id[0],
  65. .probe = aer_probe,
  66. .remove = aer_remove,
  67. .suspend = aer_suspend,
  68. .resume = aer_resume,
  69. .err_handler = &aer_error_handlers,
  70. .reset_link = aer_root_reset,
  71. };
  /* Non-zero once AER has been disabled; checked by aer_service_init(). */
  static int pcie_aer_disable;

  /**
   * pci_no_aer - disable the AER root service driver
   *
   * Sets the disable flag so that a later aer_service_init() refuses to
   * register the driver.
   */
  void pci_no_aer(void)
  {
      /* has priority over 'forceload' */
      pcie_aer_disable = 1;
  }
  77. /**
  78. * aer_irq - Root Port's ISR
  79. * @irq: IRQ assigned to Root Port
  80. * @context: pointer to Root Port data structure
  81. *
  82. * Invoked when Root Port detects AER messages.
  83. **/
  84. static irqreturn_t aer_irq(int irq, void *context)
  85. {
  86. unsigned int status, id;
  87. struct pcie_device *pdev = (struct pcie_device *)context;
  88. struct aer_rpc *rpc = get_service_data(pdev);
  89. int next_prod_idx;
  90. unsigned long flags;
  91. int pos;
  92. pos = pci_find_aer_capability(pdev->port);
  93. /*
  94. * Must lock access to Root Error Status Reg, Root Error ID Reg,
  95. * and Root error producer/consumer index
  96. */
  97. spin_lock_irqsave(&rpc->e_lock, flags);
  98. /* Read error status */
  99. pci_read_config_dword(pdev->port, pos + PCI_ERR_ROOT_STATUS, &status);
  100. if (!(status & ROOT_ERR_STATUS_MASKS)) {
  101. spin_unlock_irqrestore(&rpc->e_lock, flags);
  102. return IRQ_NONE;
  103. }
  104. /* Read error source and clear error status */
  105. pci_read_config_dword(pdev->port, pos + PCI_ERR_ROOT_COR_SRC, &id);
  106. pci_write_config_dword(pdev->port, pos + PCI_ERR_ROOT_STATUS, status);
  107. /* Store error source for later DPC handler */
  108. next_prod_idx = rpc->prod_idx + 1;
  109. if (next_prod_idx == AER_ERROR_SOURCES_MAX)
  110. next_prod_idx = 0;
  111. if (next_prod_idx == rpc->cons_idx) {
  112. /*
  113. * Error Storm Condition - possibly the same error occurred.
  114. * Drop the error.
  115. */
  116. spin_unlock_irqrestore(&rpc->e_lock, flags);
  117. return IRQ_HANDLED;
  118. }
  119. rpc->e_sources[rpc->prod_idx].status = status;
  120. rpc->e_sources[rpc->prod_idx].id = id;
  121. rpc->prod_idx = next_prod_idx;
  122. spin_unlock_irqrestore(&rpc->e_lock, flags);
  123. /* Invoke DPC handler */
  124. schedule_work(&rpc->dpc_handler);
  125. return IRQ_HANDLED;
  126. }
  127. /**
  128. * aer_alloc_rpc - allocate Root Port data structure
  129. * @dev: pointer to the pcie_dev data structure
  130. *
  131. * Invoked when Root Port's AER service is loaded.
  132. **/
  133. static struct aer_rpc* aer_alloc_rpc(struct pcie_device *dev)
  134. {
  135. struct aer_rpc *rpc;
  136. if (!(rpc = kzalloc(sizeof(struct aer_rpc),
  137. GFP_KERNEL)))
  138. return NULL;
  139. /*
  140. * Initialize Root lock access, e_lock, to Root Error Status Reg,
  141. * Root Error ID Reg, and Root error producer/consumer index.
  142. */
  143. spin_lock_init(&rpc->e_lock);
  144. rpc->rpd = dev;
  145. INIT_WORK(&rpc->dpc_handler, aer_isr);
  146. rpc->prod_idx = rpc->cons_idx = 0;
  147. mutex_init(&rpc->rpc_mutex);
  148. init_waitqueue_head(&rpc->wait_release);
  149. /* Use PCIE bus function to store rpc into PCIE device */
  150. set_service_data(dev, rpc);
  151. return rpc;
  152. }
  153. /**
  154. * aer_remove - clean up resources
  155. * @dev: pointer to the pcie_dev data structure
  156. *
  157. * Invoked when PCI Express bus unloads or AER probe fails.
  158. **/
  159. static void aer_remove(struct pcie_device *dev)
  160. {
  161. struct aer_rpc *rpc = get_service_data(dev);
  162. if (rpc) {
  163. /* If register interrupt service, it must be free. */
  164. if (rpc->isr)
  165. free_irq(dev->irq, dev);
  166. wait_event(rpc->wait_release, rpc->prod_idx == rpc->cons_idx);
  167. aer_delete_rootport(rpc);
  168. set_service_data(dev, NULL);
  169. }
  170. }
  171. /**
  172. * aer_probe - initialize resources
  173. * @dev: pointer to the pcie_dev data structure
  174. * @id: pointer to the service id data structure
  175. *
  176. * Invoked when PCI Express bus loads AER service driver.
  177. **/
  178. static int __devinit aer_probe (struct pcie_device *dev,
  179. const struct pcie_port_service_id *id )
  180. {
  181. int status;
  182. struct aer_rpc *rpc;
  183. struct device *device = &dev->device;
  184. /* Init */
  185. if ((status = aer_init(dev)))
  186. return status;
  187. /* Alloc rpc data structure */
  188. if (!(rpc = aer_alloc_rpc(dev))) {
  189. printk(KERN_DEBUG "%s: Alloc rpc fails on PCIE device[%s]\n",
  190. __FUNCTION__, device->bus_id);
  191. aer_remove(dev);
  192. return -ENOMEM;
  193. }
  194. /* Request IRQ ISR */
  195. if ((status = request_irq(dev->irq, aer_irq, IRQF_SHARED, "aerdrv",
  196. dev))) {
  197. printk(KERN_DEBUG "%s: Request ISR fails on PCIE device[%s]\n",
  198. __FUNCTION__, device->bus_id);
  199. aer_remove(dev);
  200. return status;
  201. }
  202. rpc->isr = 1;
  203. aer_enable_rootport(rpc);
  204. return status;
  205. }
  206. /**
  207. * aer_root_reset - reset link on Root Port
  208. * @dev: pointer to Root Port's pci_dev data structure
  209. *
  210. * Invoked by Port Bus driver when performing link reset at Root Port.
  211. **/
  212. static pci_ers_result_t aer_root_reset(struct pci_dev *dev)
  213. {
  214. u16 p2p_ctrl;
  215. u32 status;
  216. int pos;
  217. pos = pci_find_aer_capability(dev);
  218. /* Disable Root's interrupt in response to error messages */
  219. pci_write_config_dword(dev, pos + PCI_ERR_ROOT_COMMAND, 0);
  220. /* Assert Secondary Bus Reset */
  221. pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &p2p_ctrl);
  222. p2p_ctrl |= PCI_CB_BRIDGE_CTL_CB_RESET;
  223. pci_write_config_word(dev, PCI_BRIDGE_CONTROL, p2p_ctrl);
  224. /* De-assert Secondary Bus Reset */
  225. p2p_ctrl &= ~PCI_CB_BRIDGE_CTL_CB_RESET;
  226. pci_write_config_word(dev, PCI_BRIDGE_CONTROL, p2p_ctrl);
  227. /*
  228. * System software must wait for at least 100ms from the end
  229. * of a reset of one or more device before it is permitted
  230. * to issue Configuration Requests to those devices.
  231. */
  232. msleep(200);
  233. printk(KERN_DEBUG "Complete link reset at Root[%s]\n", dev->dev.bus_id);
  234. /* Enable Root Port's interrupt in response to error messages */
  235. pci_read_config_dword(dev, pos + PCI_ERR_ROOT_STATUS, &status);
  236. pci_write_config_dword(dev, pos + PCI_ERR_ROOT_STATUS, status);
  237. pci_write_config_dword(dev,
  238. pos + PCI_ERR_ROOT_COMMAND,
  239. ROOT_PORT_INTR_ON_MESG_MASK);
  240. return PCI_ERS_RESULT_RECOVERED;
  241. }
  242. /**
  243. * aer_error_detected - update severity status
  244. * @dev: pointer to Root Port's pci_dev data structure
  245. * @error: error severity being notified by port bus
  246. *
  247. * Invoked by Port Bus driver during error recovery.
  248. **/
  249. static pci_ers_result_t aer_error_detected(struct pci_dev *dev,
  250. enum pci_channel_state error)
  251. {
  252. /* Root Port has no impact. Always recovers. */
  253. return PCI_ERS_RESULT_CAN_RECOVER;
  254. }
  255. /**
  256. * aer_error_resume - clean up corresponding error status bits
  257. * @dev: pointer to Root Port's pci_dev data structure
  258. *
  259. * Invoked by Port Bus driver during nonfatal recovery.
  260. **/
  261. static void aer_error_resume(struct pci_dev *dev)
  262. {
  263. int pos;
  264. u32 status, mask;
  265. u16 reg16;
  266. /* Clean up Root device status */
  267. pos = pci_find_capability(dev, PCI_CAP_ID_EXP);
  268. pci_read_config_word(dev, pos + PCI_EXP_DEVSTA, &reg16);
  269. pci_write_config_word(dev, pos + PCI_EXP_DEVSTA, reg16);
  270. /* Clean AER Root Error Status */
  271. pos = pci_find_aer_capability(dev);
  272. pci_read_config_dword(dev, pos + PCI_ERR_UNCOR_STATUS, &status);
  273. pci_read_config_dword(dev, pos + PCI_ERR_UNCOR_SEVER, &mask);
  274. if (dev->error_state == pci_channel_io_normal)
  275. status &= ~mask; /* Clear corresponding nonfatal bits */
  276. else
  277. status &= mask; /* Clear corresponding fatal bits */
  278. pci_write_config_dword(dev, pos + PCI_ERR_UNCOR_STATUS, status);
  279. }
  280. /**
  281. * aer_service_init - register AER root service driver
  282. *
  283. * Invoked when AER root service driver is loaded.
  284. **/
  285. static int __init aer_service_init(void)
  286. {
  287. if (pcie_aer_disable)
  288. return -ENXIO;
  289. return pcie_port_service_register(&aerdriver);
  290. }
  291. /**
  292. * aer_service_exit - unregister AER root service driver
  293. *
  294. * Invoked when AER root service driver is unloaded.
  295. **/
  296. static void __exit aer_service_exit(void)
  297. {
  298. pcie_port_service_unregister(&aerdriver);
  299. }
  /* Module entry and exit points. */
  module_init(aer_service_init);
  module_exit(aer_service_exit);