iosapic.c 30 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114
  1. /*
  2. * I/O SAPIC support.
  3. *
  4. * Copyright (C) 1999 Intel Corp.
  5. * Copyright (C) 1999 Asit Mallick <asit.k.mallick@intel.com>
  6. * Copyright (C) 2000-2002 J.I. Lee <jung-ik.lee@intel.com>
  7. * Copyright (C) 1999-2000, 2002-2003 Hewlett-Packard Co.
  8. * David Mosberger-Tang <davidm@hpl.hp.com>
  9. * Copyright (C) 1999 VA Linux Systems
  10. * Copyright (C) 1999,2000 Walt Drummond <drummond@valinux.com>
  11. *
  12. * 00/04/19 D. Mosberger Rewritten to mirror more closely the x86 I/O APIC code.
  13. * In particular, we now have separate handlers for edge
  14. * and level triggered interrupts.
  15. * 00/10/27 Asit Mallick, Goutham Rao <goutham.rao@intel.com> IRQ vector allocation
  16. * PCI to vector mapping, shared PCI interrupts.
  17. * 00/10/27 D. Mosberger Document things a bit more to make them more understandable.
  18. * Clean up much of the old IOSAPIC cruft.
  19. * 01/07/27 J.I. Lee PCI irq routing, Platform/Legacy interrupts and fixes for
  20. * ACPI S5(SoftOff) support.
  21. * 02/01/23 J.I. Lee iosapic pgm fixes for PCI irq routing from _PRT
  22. * 02/01/07 E. Focht <efocht@ess.nec.de> Redirectable interrupt vectors in
  23. * iosapic_set_affinity(), initializations for
  24. * /proc/irq/#/smp_affinity
  25. * 02/04/02 P. Diefenbaugh Cleaned up ACPI PCI IRQ routing.
  26. * 02/04/18 J.I. Lee bug fix in iosapic_init_pci_irq
  27. * 02/04/30 J.I. Lee bug fix in find_iosapic to fix ACPI PCI IRQ to IOSAPIC mapping
  28. * error
  29. * 02/07/29 T. Kochi Allocate interrupt vectors dynamically
  30. * 02/08/04 T. Kochi Cleaned up terminology (irq, global system interrupt, vector, etc.)
  31. * 02/09/20 D. Mosberger Simplified by taking advantage of ACPI's pci_irq code.
  32. * 03/02/19 B. Helgaas Make pcat_compat system-wide, not per-IOSAPIC.
  33. * Remove iosapic_address & gsi_base from external interfaces.
  34. * Rationalize __init/__devinit attributes.
  35. * 04/12/04 Ashok Raj <ashok.raj@intel.com> Intel Corporation 2004
  36. * Updated to work with irq migration necessary for CPU Hotplug
  37. */
  38. /*
  39. * Here is what the interrupt logic between a PCI device and the kernel looks like:
  40. *
  41. * (1) A PCI device raises one of the four interrupt pins (INTA, INTB, INTC, INTD). The
  42. * device is uniquely identified by its bus- and slot-number (the function
  43. * number does not matter here because all functions share the same interrupt
  44. * lines).
  45. *
  46. * (2) The motherboard routes the interrupt line to a pin on an IOSAPIC controller.
  47. * Multiple interrupt lines may have to share the same IOSAPIC pin (if they're level
  48. * triggered and use the same polarity). Each interrupt line has a unique Global
  49. * System Interrupt (GSI) number which can be calculated as the sum of the controller's
  50. * base GSI number and the IOSAPIC pin number to which the line connects.
  51. *
  52. * (3) The IOSAPIC uses internal routing table entries (RTEs) to map the IOSAPIC pin
  53. * into the IA-64 interrupt vector. This interrupt vector is then sent to the CPU.
  54. *
  55. * (4) The kernel recognizes an interrupt as an IRQ. The IRQ interface is used as
  56. * architecture-independent interrupt handling mechanism in Linux. As an
  57. * IRQ is a number, we have to have IA-64 interrupt vector number <-> IRQ number
  58. * mapping. On smaller systems, we use one-to-one mapping between IA-64 vector and
  59. * IRQ. A platform can implement platform_irq_to_vector(irq) and
  60. * platform_local_vector_to_irq(vector) APIs to differentiate the mapping.
  61. * Please see also include/asm-ia64/hw_irq.h for those APIs.
  62. *
  63. * To sum up, there are three levels of mappings involved:
  64. *
  65. * PCI pin -> global system interrupt (GSI) -> IA-64 vector <-> IRQ
  66. *
  67. * Note: The term "IRQ" is loosely used everywhere in Linux kernel to describe interrupts.
  68. * Now we use "IRQ" only for Linux IRQ's. ISA IRQ (isa_irq) is the only exception in this
  69. * source code.
  70. */
  71. #include <linux/config.h>
  72. #include <linux/acpi.h>
  73. #include <linux/init.h>
  74. #include <linux/irq.h>
  75. #include <linux/kernel.h>
  76. #include <linux/list.h>
  77. #include <linux/pci.h>
  78. #include <linux/smp.h>
  79. #include <linux/smp_lock.h>
  80. #include <linux/string.h>
  81. #include <linux/bootmem.h>
  82. #include <asm/delay.h>
  83. #include <asm/hw_irq.h>
  84. #include <asm/io.h>
  85. #include <asm/iosapic.h>
  86. #include <asm/machvec.h>
  87. #include <asm/processor.h>
  88. #include <asm/ptrace.h>
  89. #include <asm/system.h>
  90. #undef DEBUG_INTERRUPT_ROUTING
  91. #ifdef DEBUG_INTERRUPT_ROUTING
  92. #define DBG(fmt...) printk(fmt)
  93. #else
  94. #define DBG(fmt...)
  95. #endif
/* Number of struct iosapic_rte_info entries that fit in one page. */
#define NR_PREALLOCATE_RTE_ENTRIES	(PAGE_SIZE / sizeof(struct iosapic_rte_info))
/* Bit in iosapic_rte_info.flags: the entry was taken from free_rte_list. */
#define RTE_PREALLOCATED	(1)

/* Taken around lookups/updates of the vector tables and RTE programming below. */
static DEFINE_SPINLOCK(iosapic_lock);
  99. /* These tables map IA-64 vectors to the IOSAPIC pin that generates this vector. */
  100. struct iosapic_rte_info {
  101. struct list_head rte_list; /* node in list of RTEs sharing the same vector */
  102. char __iomem *addr; /* base address of IOSAPIC */
  103. unsigned int gsi_base; /* first GSI assigned to this IOSAPIC */
  104. char rte_index; /* IOSAPIC RTE index */
  105. int refcnt; /* reference counter */
  106. unsigned int flags; /* flags */
  107. } ____cacheline_aligned;
/*
 * Per-vector bookkeeping, indexed by IA-64 vector number.  low32 and dest
 * cache the values last written to the RTE(s) attached to the vector.
 */
static struct iosapic_intr_info {
	struct list_head rtes;		/* RTEs using this vector (empty => not an IOSAPIC interrupt) */
	int		count;		/* # of RTEs that shares this vector */
	u32		low32;		/* current value of low word of Redirection table entry */
	unsigned int	dest;		/* destination CPU physical ID */
	unsigned char	dmode	: 3;	/* delivery mode (see iosapic.h) */
	unsigned char	polarity: 1;	/* interrupt polarity (see iosapic.h) */
	unsigned char	trigger	: 1;	/* trigger mode (see iosapic.h) */
} iosapic_intr_info[IA64_NUM_VECTORS];
/*
 * Table of known IOSAPIC controllers.  A controller covers the GSI range
 * [gsi_base, gsi_base + num_rte), which is what find_iosapic() tests.
 */
static struct iosapic {
	char __iomem	*addr;		/* base address of IOSAPIC */
	unsigned int 	gsi_base;	/* first GSI assigned to this IOSAPIC */
	unsigned short 	num_rte;	/* number of RTE in this IOSAPIC */
	int		rtes_inuse;	/* # of RTEs in use on this IOSAPIC */
#ifdef CONFIG_NUMA
	unsigned short	node;		/* numa node association via pxm */
#endif
} iosapic_lists[NR_IOSAPICS];
static unsigned char pcat_compat __devinitdata;	/* 8259 compatibility flag */

/*
 * While this is zero and free_rte_list is empty, iosapic_alloc_rte() refills
 * the free list from bootmem.  (Where the flag gets set is not in this part
 * of the file.)
 */
static int iosapic_kmalloc_ok;
/* Pool of unused struct iosapic_rte_info entries, linked through rte_list. */
static LIST_HEAD(free_rte_list);
  129. /*
  130. * Find an IOSAPIC associated with a GSI
  131. */
  132. static inline int
  133. find_iosapic (unsigned int gsi)
  134. {
  135. int i;
  136. for (i = 0; i < NR_IOSAPICS; i++) {
  137. if ((unsigned) (gsi - iosapic_lists[i].gsi_base) < iosapic_lists[i].num_rte)
  138. return i;
  139. }
  140. return -1;
  141. }
  142. static inline int
  143. _gsi_to_vector (unsigned int gsi)
  144. {
  145. struct iosapic_intr_info *info;
  146. struct iosapic_rte_info *rte;
  147. for (info = iosapic_intr_info; info < iosapic_intr_info + IA64_NUM_VECTORS; ++info)
  148. list_for_each_entry(rte, &info->rtes, rte_list)
  149. if (rte->gsi_base + rte->rte_index == gsi)
  150. return info - iosapic_intr_info;
  151. return -1;
  152. }
/*
 * Translate GSI number to the corresponding IA-64 interrupt vector.  If no
 * entry exists, return -1.
 *
 * This is a plain wrapper around _gsi_to_vector() and does not take
 * iosapic_lock itself; gsi_to_irq() is the variant that does.
 */
inline int
gsi_to_vector (unsigned int gsi)
{
	return _gsi_to_vector(gsi);
}
  162. int
  163. gsi_to_irq (unsigned int gsi)
  164. {
  165. unsigned long flags;
  166. int irq;
  167. /*
  168. * XXX fix me: this assumes an identity mapping vetween IA-64 vector and Linux irq
  169. * numbers...
  170. */
  171. spin_lock_irqsave(&iosapic_lock, flags);
  172. {
  173. irq = _gsi_to_vector(gsi);
  174. }
  175. spin_unlock_irqrestore(&iosapic_lock, flags);
  176. return irq;
  177. }
  178. static struct iosapic_rte_info *gsi_vector_to_rte(unsigned int gsi, unsigned int vec)
  179. {
  180. struct iosapic_rte_info *rte;
  181. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list)
  182. if (rte->gsi_base + rte->rte_index == gsi)
  183. return rte;
  184. return NULL;
  185. }
/*
 * Program the redirection table entry for @gsi so that it delivers @vector
 * to @dest, optionally masked.
 *
 * Polarity, trigger and delivery mode are taken from
 * iosapic_intr_info[@vector]; the resulting low word and destination are
 * cached back into that entry.  Does nothing if @gsi is not on @vector's
 * RTE list.  Takes no lock itself.
 */
static void
set_rte (unsigned int gsi, unsigned int vector, unsigned int dest, int mask)
{
	unsigned long pol, trigger, dmode;
	u32 low32, high32;
	char __iomem *addr;
	int rte_index;
	char redir;
	struct iosapic_rte_info *rte;

	DBG(KERN_DEBUG"IOSAPIC: routing vector %d to 0x%x\n", vector, dest);

	rte = gsi_vector_to_rte(gsi, vector);
	if (!rte)
		return;		/* not an IOSAPIC interrupt */

	rte_index = rte->rte_index;
	addr	= rte->addr;
	pol     = iosapic_intr_info[vector].polarity;
	trigger = iosapic_intr_info[vector].trigger;
	dmode   = iosapic_intr_info[vector].dmode;

	/* lowest-priority delivery is recorded as "redirected" in the affinity info */
	redir = (dmode == IOSAPIC_LOWEST_PRIORITY) ? 1 : 0;

#ifdef CONFIG_SMP
	{
		unsigned int irq;

		/* reverse-map the vector to its irq; only the first match is updated */
		for (irq = 0; irq < NR_IRQS; ++irq)
			if (irq_to_vector(irq) == vector) {
				set_irq_affinity_info(irq, (int)(dest & 0xffff), redir);
				break;
			}
	}
#endif

	low32 = ((pol << IOSAPIC_POLARITY_SHIFT) |
		 (trigger << IOSAPIC_TRIGGER_SHIFT) |
		 (dmode << IOSAPIC_DELIVERY_SHIFT) |
		 ((mask ? 1 : 0) << IOSAPIC_MASK_SHIFT) |
		 vector);

	/* dest contains both id and eid */
	high32 = (dest << IOSAPIC_DEST_SHIFT);

	/* high word (destination) is written before the low word (vector/mask) */
	iosapic_write(addr, IOSAPIC_RTE_HIGH(rte_index), high32);
	iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
	iosapic_intr_info[vector].low32 = low32;
	iosapic_intr_info[vector].dest = dest;
}
/*
 * Empty handler used to fill hw_interrupt_type slots that need no action
 * (see the iosapic_*_irq aliases that are #defined to nop).
 */
static void
nop (unsigned int vector)
{
	/* do nothing... */
}
  232. static void
  233. mask_irq (unsigned int irq)
  234. {
  235. unsigned long flags;
  236. char __iomem *addr;
  237. u32 low32;
  238. int rte_index;
  239. ia64_vector vec = irq_to_vector(irq);
  240. struct iosapic_rte_info *rte;
  241. if (list_empty(&iosapic_intr_info[vec].rtes))
  242. return; /* not an IOSAPIC interrupt! */
  243. spin_lock_irqsave(&iosapic_lock, flags);
  244. {
  245. /* set only the mask bit */
  246. low32 = iosapic_intr_info[vec].low32 |= IOSAPIC_MASK;
  247. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list) {
  248. addr = rte->addr;
  249. rte_index = rte->rte_index;
  250. iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
  251. }
  252. }
  253. spin_unlock_irqrestore(&iosapic_lock, flags);
  254. }
  255. static void
  256. unmask_irq (unsigned int irq)
  257. {
  258. unsigned long flags;
  259. char __iomem *addr;
  260. u32 low32;
  261. int rte_index;
  262. ia64_vector vec = irq_to_vector(irq);
  263. struct iosapic_rte_info *rte;
  264. if (list_empty(&iosapic_intr_info[vec].rtes))
  265. return; /* not an IOSAPIC interrupt! */
  266. spin_lock_irqsave(&iosapic_lock, flags);
  267. {
  268. low32 = iosapic_intr_info[vec].low32 &= ~IOSAPIC_MASK;
  269. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list) {
  270. addr = rte->addr;
  271. rte_index = rte->rte_index;
  272. iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
  273. }
  274. }
  275. spin_unlock_irqrestore(&iosapic_lock, flags);
  276. }
/*
 * Retarget @irq to the first CPU in @mask.
 *
 * @irq may carry the IA64_IRQ_REDIRECTED bit; it selects lowest-priority
 * delivery instead of fixed delivery and is stripped before the vector
 * lookup.  An empty @mask or a vector without RTEs is silently ignored.
 * Every RTE sharing the vector is reprogrammed with the new destination.
 * Without CONFIG_SMP the function body is empty.
 */
static void
iosapic_set_affinity (unsigned int irq, cpumask_t mask)
{
#ifdef CONFIG_SMP
	unsigned long flags;
	u32 high32, low32;
	int dest, rte_index;
	char __iomem *addr;
	int redir = (irq & IA64_IRQ_REDIRECTED) ? 1 : 0;
	ia64_vector vec;
	struct iosapic_rte_info *rte;

	irq &= (~IA64_IRQ_REDIRECTED);
	vec = irq_to_vector(irq);

	if (cpus_empty(mask))
		return;

	/* only the first CPU of the mask is used as the destination */
	dest = cpu_physical_id(first_cpu(mask));

	if (list_empty(&iosapic_intr_info[vec].rtes))
		return;			/* not an IOSAPIC interrupt */

	set_irq_affinity_info(irq, dest, redir);

	/* dest contains both id and eid */
	high32 = dest << IOSAPIC_DEST_SHIFT;

	spin_lock_irqsave(&iosapic_lock, flags);
	{
		/* start from the cached low word with the 3-bit delivery field cleared */
		low32 = iosapic_intr_info[vec].low32 & ~(7 << IOSAPIC_DELIVERY_SHIFT);

		if (redir)
			/* change delivery mode to lowest priority */
			low32 |= (IOSAPIC_LOWEST_PRIORITY << IOSAPIC_DELIVERY_SHIFT);
		else
			/* change delivery mode to fixed */
			low32 |= (IOSAPIC_FIXED << IOSAPIC_DELIVERY_SHIFT);

		iosapic_intr_info[vec].low32 = low32;
		iosapic_intr_info[vec].dest = dest;
		list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list) {
			addr = rte->addr;
			rte_index = rte->rte_index;
			iosapic_write(addr, IOSAPIC_RTE_HIGH(rte_index), high32);
			iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
		}
	}
	spin_unlock_irqrestore(&iosapic_lock, flags);
#endif
}
/*
 * Handlers for level-triggered interrupts.
 */

/*
 * .startup hook for level-triggered interrupts: unmask the irq.
 * Always returns 0.
 */
static unsigned int
iosapic_startup_level_irq (unsigned int irq)
{
	unmask_irq(irq);
	return 0;
}
  328. static void
  329. iosapic_end_level_irq (unsigned int irq)
  330. {
  331. ia64_vector vec = irq_to_vector(irq);
  332. struct iosapic_rte_info *rte;
  333. move_irq(irq);
  334. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list)
  335. iosapic_eoi(rte->addr, vec);
  336. }
/* Level-triggered hooks that are plain aliases of the generic helpers. */
#define iosapic_shutdown_level_irq	mask_irq
#define iosapic_enable_level_irq	unmask_irq
#define iosapic_disable_level_irq	mask_irq
#define iosapic_ack_level_irq		nop

/* Interrupt-controller operations installed for level-triggered IOSAPIC vectors. */
struct hw_interrupt_type irq_type_iosapic_level = {
	.typename =	"IO-SAPIC-level",
	.startup =	iosapic_startup_level_irq,
	.shutdown =	iosapic_shutdown_level_irq,
	.enable =	iosapic_enable_level_irq,
	.disable =	iosapic_disable_level_irq,
	.ack =		iosapic_ack_level_irq,
	.end =		iosapic_end_level_irq,
	.set_affinity =	iosapic_set_affinity
};
/*
 * Handlers for edge-triggered interrupts.
 */

/*
 * .startup hook for edge-triggered interrupts: unmask the irq.
 * Always returns 0 (see the comment in the body).
 */
static unsigned int
iosapic_startup_edge_irq (unsigned int irq)
{
	unmask_irq(irq);
	/*
	 * IOSAPIC simply drops interrupts pended while the
	 * corresponding pin was masked, so we can't know if an
	 * interrupt is pending already.  Let's hope not...
	 */
	return 0;
}
  365. static void
  366. iosapic_ack_edge_irq (unsigned int irq)
  367. {
  368. irq_desc_t *idesc = irq_descp(irq);
  369. move_irq(irq);
  370. /*
  371. * Once we have recorded IRQ_PENDING already, we can mask the
  372. * interrupt for real. This prevents IRQ storms from unhandled
  373. * devices.
  374. */
  375. if ((idesc->status & (IRQ_PENDING|IRQ_DISABLED)) == (IRQ_PENDING|IRQ_DISABLED))
  376. mask_irq(irq);
  377. }
/* Edge-triggered hooks that are plain aliases of the generic helpers. */
#define iosapic_enable_edge_irq		unmask_irq
#define iosapic_disable_edge_irq	nop
#define iosapic_end_edge_irq		nop

/*
 * Interrupt-controller operations installed for edge-triggered IOSAPIC
 * vectors.  Both .disable and .shutdown resolve to nop, so neither touches
 * the RTE; masking is done from iosapic_ack_edge_irq().
 */
struct hw_interrupt_type irq_type_iosapic_edge = {
	.typename =	"IO-SAPIC-edge",
	.startup =	iosapic_startup_edge_irq,
	.shutdown =	iosapic_disable_edge_irq,
	.enable =	iosapic_enable_edge_irq,
	.disable =	iosapic_disable_edge_irq,
	.ack =		iosapic_ack_edge_irq,
	.end =		iosapic_end_edge_irq,
	.set_affinity =	iosapic_set_affinity
};
/*
 * Read the raw 32-bit version register of the IOSAPIC mapped at @addr.
 * The value is returned undecoded; the field layout is given in the body.
 */
unsigned int
iosapic_version (char __iomem *addr)
{
	/*
	 * IOSAPIC Version Register return 32 bit structure like:
	 * {
	 *	unsigned int version   : 8;
	 *	unsigned int reserved1 : 8;
	 *	unsigned int max_redir : 8;
	 *	unsigned int reserved2 : 8;
	 * }
	 */
	return iosapic_read(addr, IOSAPIC_VERSION);
}
  405. static int iosapic_find_sharable_vector (unsigned long trigger, unsigned long pol)
  406. {
  407. int i, vector = -1, min_count = -1;
  408. struct iosapic_intr_info *info;
  409. /*
  410. * shared vectors for edge-triggered interrupts are not
  411. * supported yet
  412. */
  413. if (trigger == IOSAPIC_EDGE)
  414. return -1;
  415. for (i = IA64_FIRST_DEVICE_VECTOR; i <= IA64_LAST_DEVICE_VECTOR; i++) {
  416. info = &iosapic_intr_info[i];
  417. if (info->trigger == trigger && info->polarity == pol &&
  418. (info->dmode == IOSAPIC_FIXED || info->dmode == IOSAPIC_LOWEST_PRIORITY)) {
  419. if (min_count == -1 || info->count < min_count) {
  420. vector = i;
  421. min_count = info->count;
  422. }
  423. }
  424. }
  425. return vector;
  426. }
  427. /*
  428. * if the given vector is already owned by other,
  429. * assign a new vector for the other and make the vector available
  430. */
  431. static void __init
  432. iosapic_reassign_vector (int vector)
  433. {
  434. int new_vector;
  435. if (!list_empty(&iosapic_intr_info[vector].rtes)) {
  436. new_vector = assign_irq_vector(AUTO_ASSIGN);
  437. if (new_vector < 0)
  438. panic("%s: out of interrupt vectors!\n", __FUNCTION__);
  439. printk(KERN_INFO "Reassigning vector %d to %d\n", vector, new_vector);
  440. memcpy(&iosapic_intr_info[new_vector], &iosapic_intr_info[vector],
  441. sizeof(struct iosapic_intr_info));
  442. INIT_LIST_HEAD(&iosapic_intr_info[new_vector].rtes);
  443. list_move(iosapic_intr_info[vector].rtes.next, &iosapic_intr_info[new_vector].rtes);
  444. memset(&iosapic_intr_info[vector], 0, sizeof(struct iosapic_intr_info));
  445. iosapic_intr_info[vector].low32 = IOSAPIC_MASK;
  446. INIT_LIST_HEAD(&iosapic_intr_info[vector].rtes);
  447. }
  448. }
  449. static struct iosapic_rte_info *iosapic_alloc_rte (void)
  450. {
  451. int i;
  452. struct iosapic_rte_info *rte;
  453. int preallocated = 0;
  454. if (!iosapic_kmalloc_ok && list_empty(&free_rte_list)) {
  455. rte = alloc_bootmem(sizeof(struct iosapic_rte_info) * NR_PREALLOCATE_RTE_ENTRIES);
  456. if (!rte)
  457. return NULL;
  458. for (i = 0; i < NR_PREALLOCATE_RTE_ENTRIES; i++, rte++)
  459. list_add(&rte->rte_list, &free_rte_list);
  460. }
  461. if (!list_empty(&free_rte_list)) {
  462. rte = list_entry(free_rte_list.next, struct iosapic_rte_info, rte_list);
  463. list_del(&rte->rte_list);
  464. preallocated++;
  465. } else {
  466. rte = kmalloc(sizeof(struct iosapic_rte_info), GFP_ATOMIC);
  467. if (!rte)
  468. return NULL;
  469. }
  470. memset(rte, 0, sizeof(struct iosapic_rte_info));
  471. if (preallocated)
  472. rte->flags |= RTE_PREALLOCATED;
  473. return rte;
  474. }
  475. static void iosapic_free_rte (struct iosapic_rte_info *rte)
  476. {
  477. if (rte->flags & RTE_PREALLOCATED)
  478. list_add_tail(&rte->rte_list, &free_rte_list);
  479. else
  480. kfree(rte);
  481. }
  482. static inline int vector_is_shared (int vector)
  483. {
  484. return (iosapic_intr_info[vector].count > 1);
  485. }
/*
 * Record that @gsi is routed to @vector and select the matching
 * interrupt-controller operations for the vector.
 *
 * If @gsi is not yet on the vector's RTE list, a descriptor is allocated,
 * filled in and appended, and the per-vector and per-IOSAPIC counters are
 * bumped.  If it is already there and the vector is shared, the requested
 * trigger/polarity must match what is recorded.  Nothing is written to the
 * hardware here.  Takes no lock itself.
 *
 * Returns 0 on success, -ENODEV if no IOSAPIC covers @gsi, -ENOMEM if no
 * descriptor could be allocated, -EINVAL on a trigger/polarity mismatch.
 */
static int
register_intr (unsigned int gsi, int vector, unsigned char delivery,
	       unsigned long polarity, unsigned long trigger)
{
	irq_desc_t *idesc;
	struct hw_interrupt_type *irq_type;
	int rte_index;
	int index;
	unsigned long gsi_base;
	void __iomem *iosapic_address;
	struct iosapic_rte_info *rte;

	index = find_iosapic(gsi);
	if (index < 0) {
		printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n", __FUNCTION__, gsi);
		return -ENODEV;
	}

	iosapic_address = iosapic_lists[index].addr;
	gsi_base = iosapic_lists[index].gsi_base;

	rte = gsi_vector_to_rte(gsi, vector);
	if (!rte) {
		rte = iosapic_alloc_rte();
		if (!rte) {
			printk(KERN_WARNING "%s: cannot allocate memory\n", __FUNCTION__);
			return -ENOMEM;
		}

		/* pin number is the GSI's offset within this IOSAPIC's range */
		rte_index = gsi - gsi_base;
		rte->rte_index	= rte_index;
		rte->addr	= iosapic_address;
		rte->gsi_base	= gsi_base;
		rte->refcnt++;
		list_add_tail(&rte->rte_list, &iosapic_intr_info[vector].rtes);
		iosapic_intr_info[vector].count++;
		iosapic_lists[index].rtes_inuse++;
	}
	else if (vector_is_shared(vector)) {
		struct iosapic_intr_info *info = &iosapic_intr_info[vector];
		if (info->trigger != trigger || info->polarity != polarity) {
			printk (KERN_WARNING "%s: cannot override the interrupt\n", __FUNCTION__);
			return -EINVAL;
		}
	}

	/*
	 * Reached for a new RTE, for an existing RTE on a non-shared vector,
	 * and for a shared vector whose attributes matched: (re)record them.
	 */
	iosapic_intr_info[vector].polarity = polarity;
	iosapic_intr_info[vector].dmode    = delivery;
	iosapic_intr_info[vector].trigger  = trigger;

	if (trigger == IOSAPIC_EDGE)
		irq_type = &irq_type_iosapic_edge;
	else
		irq_type = &irq_type_iosapic_level;

	idesc = irq_descp(vector);
	if (idesc->handler != irq_type) {
		/* warn only when replacing a real handler type, not the placeholder */
		if (idesc->handler != &no_irq_type)
			printk(KERN_WARNING "%s: changing vector %d from %s to %s\n",
			       __FUNCTION__, vector, idesc->handler->typename, irq_type->typename);
		idesc->handler = irq_type;
	}
	return 0;
}
/*
 * Choose the physical CPU id that the RTE for (@gsi, @vector) should target.
 *
 * On SMP the choice is made in this order: the destination already recorded
 * for a vector that has RTEs; the current CPU if XTP redirection is enabled
 * or the current CPU is not yet online; with CONFIG_NUMA, an online CPU of
 * the IOSAPIC's node picked by (vector % number of online CPUs in the node);
 * otherwise the next online CPU in round-robin order (the position is kept
 * in a function-local static).  On UP the current CPU is returned.
 */
static unsigned int
get_target_cpu (unsigned int gsi, int vector)
{
#ifdef CONFIG_SMP
	static int cpu = -1;

	/*
	 * In case of vector shared by multiple RTEs, all RTEs that
	 * share the vector need to use the same destination CPU.
	 */
	if (!list_empty(&iosapic_intr_info[vector].rtes))
		return iosapic_intr_info[vector].dest;

	/*
	 * If the platform supports redirection via XTP, let it
	 * distribute interrupts.
	 */
	if (smp_int_redirect & SMP_IRQ_REDIRECTION)
		return cpu_physical_id(smp_processor_id());

	/*
	 * Some interrupts (ACPI SCI, for instance) are registered
	 * before the BSP is marked as online.
	 */
	if (!cpu_online(smp_processor_id()))
		return cpu_physical_id(smp_processor_id());

#ifdef CONFIG_NUMA
	{
		int num_cpus, cpu_index, iosapic_index, numa_cpu, i = 0;
		cpumask_t cpu_mask;

		iosapic_index = find_iosapic(gsi);
		/* a node value of MAX_NUMNODES is treated as "no node known" */
		if (iosapic_index < 0 ||
		    iosapic_lists[iosapic_index].node == MAX_NUMNODES)
			goto skip_numa_setup;

		cpu_mask = node_to_cpumask(iosapic_lists[iosapic_index].node);

		/* drop offline CPUs from the node's mask */
		for_each_cpu_mask(numa_cpu, cpu_mask) {
			if (!cpu_online(numa_cpu))
				cpu_clear(numa_cpu, cpu_mask);
		}

		num_cpus = cpus_weight(cpu_mask);

		if (!num_cpus)
			goto skip_numa_setup;

		/* Use vector assignment to distribute across cpus in node */
		cpu_index = vector % num_cpus;

		/* walk to the cpu_index'th set bit of the mask */
		for (numa_cpu = first_cpu(cpu_mask) ; i < cpu_index ; i++)
			numa_cpu = next_cpu(numa_cpu, cpu_mask);

		if (numa_cpu != NR_CPUS)
			return cpu_physical_id(numa_cpu);
	}
skip_numa_setup:
#endif
	/*
	 * Otherwise, round-robin interrupt vectors across all the
	 * processors.  (It'd be nice if we could be smarter in the
	 * case of NUMA.)
	 */
	do {
		if (++cpu >= NR_CPUS)
			cpu = 0;
	} while (!cpu_online(cpu));

	return cpu_physical_id(cpu);
#else
	return cpu_physical_id(smp_processor_id());
#endif
}
  605. /*
  606. * ACPI can describe IOSAPIC interrupts via static tables and namespace
  607. * methods. This provides an interface to register those interrupts and
  608. * program the IOSAPIC RTE.
  609. */
  610. int
  611. iosapic_register_intr (unsigned int gsi,
  612. unsigned long polarity, unsigned long trigger)
  613. {
  614. int vector, mask = 1, err;
  615. unsigned int dest;
  616. unsigned long flags;
  617. struct iosapic_rte_info *rte;
  618. u32 low32;
  619. again:
  620. /*
  621. * If this GSI has already been registered (i.e., it's a
  622. * shared interrupt, or we lost a race to register it),
  623. * don't touch the RTE.
  624. */
  625. spin_lock_irqsave(&iosapic_lock, flags);
  626. {
  627. vector = gsi_to_vector(gsi);
  628. if (vector > 0) {
  629. rte = gsi_vector_to_rte(gsi, vector);
  630. rte->refcnt++;
  631. spin_unlock_irqrestore(&iosapic_lock, flags);
  632. return vector;
  633. }
  634. }
  635. spin_unlock_irqrestore(&iosapic_lock, flags);
  636. /* If vector is running out, we try to find a sharable vector */
  637. vector = assign_irq_vector(AUTO_ASSIGN);
  638. if (vector < 0) {
  639. vector = iosapic_find_sharable_vector(trigger, polarity);
  640. if (vector < 0)
  641. return -ENOSPC;
  642. }
  643. spin_lock_irqsave(&irq_descp(vector)->lock, flags);
  644. spin_lock(&iosapic_lock);
  645. {
  646. if (gsi_to_vector(gsi) > 0) {
  647. if (list_empty(&iosapic_intr_info[vector].rtes))
  648. free_irq_vector(vector);
  649. spin_unlock(&iosapic_lock);
  650. spin_unlock_irqrestore(&irq_descp(vector)->lock, flags);
  651. goto again;
  652. }
  653. dest = get_target_cpu(gsi, vector);
  654. err = register_intr(gsi, vector, IOSAPIC_LOWEST_PRIORITY,
  655. polarity, trigger);
  656. if (err < 0) {
  657. spin_unlock(&iosapic_lock);
  658. spin_unlock_irqrestore(&irq_descp(vector)->lock, flags);
  659. return err;
  660. }
  661. /*
  662. * If the vector is shared and already unmasked for
  663. * other interrupt sources, don't mask it.
  664. */
  665. low32 = iosapic_intr_info[vector].low32;
  666. if (vector_is_shared(vector) && !(low32 & IOSAPIC_MASK))
  667. mask = 0;
  668. set_rte(gsi, vector, dest, mask);
  669. }
  670. spin_unlock(&iosapic_lock);
  671. spin_unlock_irqrestore(&irq_descp(vector)->lock, flags);
  672. printk(KERN_INFO "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d\n",
  673. gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
  674. (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
  675. cpu_logical_id(dest), dest, vector);
  676. return vector;
  677. }
/*
 * Drop one reference on the registration of @gsi.
 *
 * When the last reference goes away the RTE is masked in hardware, its
 * descriptor is unlinked and freed, and the per-vector and per-IOSAPIC
 * counters are decremented.  If that leaves the vector without any RTE,
 * the vector's bookkeeping is reset, the irq descriptor's handler is set
 * back to no_irq_type and the vector is freed.  An unbalanced call (GSI not
 * registered) is logged and otherwise ignored.
 */
void
iosapic_unregister_intr (unsigned int gsi)
{
	unsigned long flags;
	int irq, vector, index;
	irq_desc_t *idesc;
	u32 low32;
	unsigned long trigger, polarity;
	unsigned int dest;
	struct iosapic_rte_info *rte;

	/*
	 * If the irq associated with the gsi is not found,
	 * iosapic_unregister_intr() is unbalanced. We need to check
	 * this again after getting locks.
	 */
	irq = gsi_to_irq(gsi);
	if (irq < 0) {
		printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n", gsi);
		WARN_ON(1);
		return;
	}
	vector = irq_to_vector(irq);

	idesc = irq_descp(irq);
	/* lock order: irq descriptor lock first, then iosapic_lock */
	spin_lock_irqsave(&idesc->lock, flags);
	spin_lock(&iosapic_lock);
	{
		if ((rte = gsi_vector_to_rte(gsi, vector)) == NULL) {
			printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n", gsi);
			WARN_ON(1);
			goto out;
		}

		/* other users remain: keep the RTE as it is */
		if (--rte->refcnt > 0)
			goto out;

		/* Mask the interrupt */
		low32 = iosapic_intr_info[vector].low32 | IOSAPIC_MASK;
		iosapic_write(rte->addr, IOSAPIC_RTE_LOW(rte->rte_index), low32);

		/* Remove the rte entry from the list */
		list_del(&rte->rte_list);
		iosapic_intr_info[vector].count--;
		iosapic_free_rte(rte);
		/* NOTE(review): index is used unchecked; assumes the IOSAPIC that served @gsi is still listed */
		index = find_iosapic(gsi);
		iosapic_lists[index].rtes_inuse--;
		WARN_ON(iosapic_lists[index].rtes_inuse < 0);

		/* fetched before the entry may be cleared below, for the log message */
		trigger	 = iosapic_intr_info[vector].trigger;
		polarity = iosapic_intr_info[vector].polarity;
		dest     = iosapic_intr_info[vector].dest;
		printk(KERN_INFO "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d unregistered\n",
		       gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
		       (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
		       cpu_logical_id(dest), dest, vector);

		if (list_empty(&iosapic_intr_info[vector].rtes)) {
			/* Sanity check */
			BUG_ON(iosapic_intr_info[vector].count);

			/* Clear the interrupt controller descriptor */
			idesc->handler = &no_irq_type;

			/* Clear the interrupt information */
			memset(&iosapic_intr_info[vector], 0, sizeof(struct iosapic_intr_info));
			iosapic_intr_info[vector].low32 |= IOSAPIC_MASK;
			INIT_LIST_HEAD(&iosapic_intr_info[vector].rtes);

			if (idesc->action) {
				printk(KERN_ERR "interrupt handlers still exist on IRQ %u\n", irq);
				WARN_ON(1);
			}

			/* Free the interrupt vector */
			free_irq_vector(vector);
		}
	}
 out:
	spin_unlock(&iosapic_lock);
	spin_unlock_irqrestore(&idesc->lock, flags);
}
  749. /*
  750. * ACPI calls this when it finds an entry for a platform interrupt.
  751. * Note that the irq_base and IOSAPIC address must be set in iosapic_init().
  752. */
  753. int __init
  754. iosapic_register_platform_intr (u32 int_type, unsigned int gsi,
  755. int iosapic_vector, u16 eid, u16 id,
  756. unsigned long polarity, unsigned long trigger)
  757. {
  758. static const char * const name[] = {"unknown", "PMI", "INIT", "CPEI"};
  759. unsigned char delivery;
  760. int vector, mask = 0;
  761. unsigned int dest = ((id << 8) | eid) & 0xffff;
  762. switch (int_type) {
  763. case ACPI_INTERRUPT_PMI:
  764. vector = iosapic_vector;
  765. /*
  766. * since PMI vector is alloc'd by FW(ACPI) not by kernel,
  767. * we need to make sure the vector is available
  768. */
  769. iosapic_reassign_vector(vector);
  770. delivery = IOSAPIC_PMI;
  771. break;
  772. case ACPI_INTERRUPT_INIT:
  773. vector = assign_irq_vector(AUTO_ASSIGN);
  774. if (vector < 0)
  775. panic("%s: out of interrupt vectors!\n", __FUNCTION__);
  776. delivery = IOSAPIC_INIT;
  777. break;
  778. case ACPI_INTERRUPT_CPEI:
  779. vector = IA64_CPE_VECTOR;
  780. delivery = IOSAPIC_LOWEST_PRIORITY;
  781. mask = 1;
  782. break;
  783. default:
  784. printk(KERN_ERR "iosapic_register_platform_irq(): invalid int type 0x%x\n", int_type);
  785. return -1;
  786. }
  787. register_intr(gsi, vector, delivery, polarity, trigger);
  788. printk(KERN_INFO "PLATFORM int %s (0x%x): GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d\n",
  789. int_type < ARRAY_SIZE(name) ? name[int_type] : "unknown",
  790. int_type, gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
  791. (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
  792. cpu_logical_id(dest), dest, vector);
  793. set_rte(gsi, vector, dest, mask);
  794. return vector;
  795. }
  796. /*
  797. * ACPI calls this when it finds an entry for a legacy ISA IRQ override.
  798. * Note that the gsi_base and IOSAPIC address must be set in iosapic_init().
  799. */
  800. void __init
  801. iosapic_override_isa_irq (unsigned int isa_irq, unsigned int gsi,
  802. unsigned long polarity,
  803. unsigned long trigger)
  804. {
  805. int vector;
  806. unsigned int dest = cpu_physical_id(smp_processor_id());
  807. vector = isa_irq_to_vector(isa_irq);
  808. register_intr(gsi, vector, IOSAPIC_LOWEST_PRIORITY, polarity, trigger);
  809. DBG("ISA: IRQ %u -> GSI %u (%s,%s) -> CPU %d (0x%04x) vector %d\n",
  810. isa_irq, gsi, trigger == IOSAPIC_EDGE ? "edge" : "level",
  811. polarity == IOSAPIC_POL_HIGH ? "high" : "low",
  812. cpu_logical_id(dest), dest, vector);
  813. set_rte(gsi, vector, dest, 1);
  814. }
  815. void __init
  816. iosapic_system_init (int system_pcat_compat)
  817. {
  818. int vector;
  819. for (vector = 0; vector < IA64_NUM_VECTORS; ++vector) {
  820. iosapic_intr_info[vector].low32 = IOSAPIC_MASK;
  821. INIT_LIST_HEAD(&iosapic_intr_info[vector].rtes); /* mark as unused */
  822. }
  823. pcat_compat = system_pcat_compat;
  824. if (pcat_compat) {
  825. /*
  826. * Disable the compatibility mode interrupts (8259 style), needs IN/OUT support
  827. * enabled.
  828. */
  829. printk(KERN_INFO "%s: Disabling PC-AT compatible 8259 interrupts\n", __FUNCTION__);
  830. outb(0xff, 0xA1);
  831. outb(0xff, 0x21);
  832. }
  833. }
  834. static inline int
  835. iosapic_alloc (void)
  836. {
  837. int index;
  838. for (index = 0; index < NR_IOSAPICS; index++)
  839. if (!iosapic_lists[index].addr)
  840. return index;
  841. printk(KERN_WARNING "%s: failed to allocate iosapic\n", __FUNCTION__);
  842. return -1;
  843. }
  844. static inline void
  845. iosapic_free (int index)
  846. {
  847. memset(&iosapic_lists[index], 0, sizeof(iosapic_lists[0]));
  848. }
  849. static inline int
  850. iosapic_check_gsi_range (unsigned int gsi_base, unsigned int ver)
  851. {
  852. int index;
  853. unsigned int gsi_end, base, end;
  854. /* check gsi range */
  855. gsi_end = gsi_base + ((ver >> 16) & 0xff);
  856. for (index = 0; index < NR_IOSAPICS; index++) {
  857. if (!iosapic_lists[index].addr)
  858. continue;
  859. base = iosapic_lists[index].gsi_base;
  860. end = base + iosapic_lists[index].num_rte - 1;
  861. if (gsi_base < base && gsi_end < base)
  862. continue;/* OK */
  863. if (gsi_base > end && gsi_end > end)
  864. continue; /* OK */
  865. return -EBUSY;
  866. }
  867. return 0;
  868. }
  869. int __devinit
  870. iosapic_init (unsigned long phys_addr, unsigned int gsi_base)
  871. {
  872. int num_rte, err, index;
  873. unsigned int isa_irq, ver;
  874. char __iomem *addr;
  875. unsigned long flags;
  876. spin_lock_irqsave(&iosapic_lock, flags);
  877. {
  878. addr = ioremap(phys_addr, 0);
  879. ver = iosapic_version(addr);
  880. if ((err = iosapic_check_gsi_range(gsi_base, ver))) {
  881. iounmap(addr);
  882. spin_unlock_irqrestore(&iosapic_lock, flags);
  883. return err;
  884. }
  885. /*
  886. * The MAX_REDIR register holds the highest input pin
  887. * number (starting from 0).
  888. * We add 1 so that we can use it for number of pins (= RTEs)
  889. */
  890. num_rte = ((ver >> 16) & 0xff) + 1;
  891. index = iosapic_alloc();
  892. iosapic_lists[index].addr = addr;
  893. iosapic_lists[index].gsi_base = gsi_base;
  894. iosapic_lists[index].num_rte = num_rte;
  895. #ifdef CONFIG_NUMA
  896. iosapic_lists[index].node = MAX_NUMNODES;
  897. #endif
  898. }
  899. spin_unlock_irqrestore(&iosapic_lock, flags);
  900. if ((gsi_base == 0) && pcat_compat) {
  901. /*
  902. * Map the legacy ISA devices into the IOSAPIC data. Some of these may
  903. * get reprogrammed later on with data from the ACPI Interrupt Source
  904. * Override table.
  905. */
  906. for (isa_irq = 0; isa_irq < 16; ++isa_irq)
  907. iosapic_override_isa_irq(isa_irq, isa_irq, IOSAPIC_POL_HIGH, IOSAPIC_EDGE);
  908. }
  909. return 0;
  910. }
  #ifdef CONFIG_HOTPLUG
  /*
   * Unregister the IOSAPIC that find_iosapic() reports for 'gsi_base'.
   *
   * Returns -EBUSY (and leaves everything in place) while any of its RTEs
   * are still in use.  Otherwise the register window is unmapped and the
   * iosapic_lists[] slot is cleared, and 0 is returned.
   *
   * Note: when no IOSAPIC is found only a warning is logged; the return
   * value is still 0.
   */
  int
  iosapic_remove (unsigned int gsi_base)
  {
      unsigned long flags;
      int err = 0;
      int slot;

      spin_lock_irqsave(&iosapic_lock, flags);

      slot = find_iosapic(gsi_base);
      if (slot < 0) {
          printk(KERN_WARNING "%s: No IOSAPIC for GSI base %u\n",
                 __FUNCTION__, gsi_base);
      } else if (iosapic_lists[slot].rtes_inuse) {
          err = -EBUSY;
          printk(KERN_WARNING "%s: IOSAPIC for GSI base %u is busy\n",
                 __FUNCTION__, gsi_base);
      } else {
          iounmap(iosapic_lists[slot].addr);
          iosapic_free(slot);
      }

      spin_unlock_irqrestore(&iosapic_lock, flags);
      return err;
  }
  #endif /* CONFIG_HOTPLUG */
  #ifdef CONFIG_NUMA
  /*
   * Record 'node' as the node of the IOSAPIC that find_iosapic() reports for
   * 'gsi_base'.  If there is no such IOSAPIC a warning is logged and nothing
   * is changed.
   */
  void __devinit
  map_iosapic_to_node(unsigned int gsi_base, int node)
  {
      int slot = find_iosapic(gsi_base);

      if (slot >= 0) {
          iosapic_lists[slot].node = node;
      } else {
          printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n",
                 __FUNCTION__, gsi_base);
      }
  }
  #endif
  954. static int __init iosapic_enable_kmalloc (void)
  955. {
  956. iosapic_kmalloc_ok = 1;
  957. return 0;
  958. }
  959. core_initcall (iosapic_enable_kmalloc);