iosapic.c 30 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116
  1. /*
  2. * I/O SAPIC support.
  3. *
  4. * Copyright (C) 1999 Intel Corp.
  5. * Copyright (C) 1999 Asit Mallick <asit.k.mallick@intel.com>
  6. * Copyright (C) 2000-2002 J.I. Lee <jung-ik.lee@intel.com>
  7. * Copyright (C) 1999-2000, 2002-2003 Hewlett-Packard Co.
  8. * David Mosberger-Tang <davidm@hpl.hp.com>
  9. * Copyright (C) 1999 VA Linux Systems
  10. * Copyright (C) 1999,2000 Walt Drummond <drummond@valinux.com>
  11. *
  12. * 00/04/19 D. Mosberger Rewritten to mirror more closely the x86 I/O APIC code.
  13. * In particular, we now have separate handlers for edge
  14. * and level triggered interrupts.
  15. * 00/10/27 Asit Mallick, Goutham Rao <goutham.rao@intel.com> IRQ vector allocation
  16. * PCI to vector mapping, shared PCI interrupts.
  17. * 00/10/27 D. Mosberger Document things a bit more to make them more understandable.
  18. * Clean up much of the old IOSAPIC cruft.
  19. * 01/07/27 J.I. Lee PCI irq routing, Platform/Legacy interrupts and fixes for
  20. * ACPI S5(SoftOff) support.
  21. * 02/01/23 J.I. Lee iosapic pgm fixes for PCI irq routing from _PRT
  22. * 02/01/07 E. Focht <efocht@ess.nec.de> Redirectable interrupt vectors in
  23. * iosapic_set_affinity(), initializations for
  24. * /proc/irq/#/smp_affinity
  25. * 02/04/02 P. Diefenbaugh Cleaned up ACPI PCI IRQ routing.
  26. * 02/04/18 J.I. Lee bug fix in iosapic_init_pci_irq
  27. * 02/04/30 J.I. Lee bug fix in find_iosapic to fix ACPI PCI IRQ to IOSAPIC mapping
  28. * error
  29. * 02/07/29 T. Kochi Allocate interrupt vectors dynamically
  30. * 02/08/04 T. Kochi Cleaned up terminology (irq, global system interrupt, vector, etc.)
  31. * 02/09/20 D. Mosberger Simplified by taking advantage of ACPI's pci_irq code.
  32. * 03/02/19 B. Helgaas Make pcat_compat system-wide, not per-IOSAPIC.
  33. * Remove iosapic_address & gsi_base from external interfaces.
  34. * Rationalize __init/__devinit attributes.
  35. * 04/12/04 Ashok Raj <ashok.raj@intel.com> Intel Corporation 2004
  36. * Updated to work with irq migration necessary for CPU Hotplug
  37. */
  38. /*
  39. * Here is what the interrupt logic between a PCI device and the kernel looks like:
  40. *
  41. * (1) A PCI device raises one of the four interrupt pins (INTA, INTB, INTC, INTD). The
  42. * device is uniquely identified by its bus- and slot-number (the function
  43. * number does not matter here because all functions share the same interrupt
  44. * lines).
  45. *
  46. * (2) The motherboard routes the interrupt line to a pin on an IOSAPIC controller.
  47. * Multiple interrupt lines may have to share the same IOSAPIC pin (if they're level
  48. * triggered and use the same polarity). Each interrupt line has a unique Global
  49. * System Interrupt (GSI) number which can be calculated as the sum of the controller's
  50. * base GSI number and the IOSAPIC pin number to which the line connects.
  51. *
  52. * (3) The IOSAPIC uses internal routing table entries (RTEs) to map the IOSAPIC pin
  53. * into the IA-64 interrupt vector. This interrupt vector is then sent to the CPU.
  54. *
  55. * (4) The kernel recognizes an interrupt as an IRQ. The IRQ interface is used as an
  56. * architecture-independent interrupt handling mechanism in Linux. As an
  57. * IRQ is a number, we have to have IA-64 interrupt vector number <-> IRQ number
  58. * mapping. On smaller systems, we use one-to-one mapping between IA-64 vector and
  59. * IRQ. A platform can implement platform_irq_to_vector(irq) and
  60. * platform_local_vector_to_irq(vector) APIs to differentiate the mapping.
  61. * Please see also include/asm-ia64/hw_irq.h for those APIs.
  62. *
  63. * To sum up, there are three levels of mappings involved:
  64. *
  65. * PCI pin -> global system interrupt (GSI) -> IA-64 vector <-> IRQ
  66. *
  67. * Note: The term "IRQ" is loosely used everywhere in Linux kernel to describe interrupts.
  68. * Now we use "IRQ" only for Linux IRQ's. ISA IRQ (isa_irq) is the only exception in this
  69. * source code.
  70. */
  71. #include <linux/config.h>
  72. #include <linux/acpi.h>
  73. #include <linux/init.h>
  74. #include <linux/irq.h>
  75. #include <linux/kernel.h>
  76. #include <linux/list.h>
  77. #include <linux/pci.h>
  78. #include <linux/smp.h>
  79. #include <linux/smp_lock.h>
  80. #include <linux/string.h>
  81. #include <linux/bootmem.h>
  82. #include <asm/delay.h>
  83. #include <asm/hw_irq.h>
  84. #include <asm/io.h>
  85. #include <asm/iosapic.h>
  86. #include <asm/machvec.h>
  87. #include <asm/processor.h>
  88. #include <asm/ptrace.h>
  89. #include <asm/system.h>
  /*
   * Interrupt-routing debug output.  DEBUG_INTERRUPT_ROUTING is forcibly
   * undefined here, so DBG() expands to nothing unless the #undef below is
   * replaced by a #define.
   */
  #undef DEBUG_INTERRUPT_ROUTING

  #ifndef DEBUG_INTERRUPT_ROUTING
  #define DBG(fmt...)
  #else
  #define DBG(fmt...) printk(fmt)
  #endif

  /* Number of RTE descriptors that fit in one page; used as the size of a bootmem refill. */
  #define NR_PREALLOCATE_RTE_ENTRIES (PAGE_SIZE / sizeof(struct iosapic_rte_info))

  /* Bit in iosapic_rte_info.flags: the descriptor belongs to the preallocated pool. */
  #define RTE_PREALLOCATED (1)

  /* Lock taken around iosapic_intr_info[] updates and RTE programming in this file. */
  static DEFINE_SPINLOCK(iosapic_lock);
  99. /* These tables map IA-64 vectors to the IOSAPIC pin that generates this vector. */
  100. struct iosapic_rte_info {
  101. struct list_head rte_list; /* node in list of RTEs sharing the same vector */
  102. char __iomem *addr; /* base address of IOSAPIC */
  103. unsigned int gsi_base; /* first GSI assigned to this IOSAPIC */
  104. char rte_index; /* IOSAPIC RTE index */
  105. int refcnt; /* reference counter */
  106. unsigned int flags; /* flags */
  107. } ____cacheline_aligned;
  108. static struct iosapic_intr_info {
  109. struct list_head rtes; /* RTEs using this vector (empty => not an IOSAPIC interrupt) */
  110. int count; /* # of RTEs that shares this vector */
  111. u32 low32; /* current value of low word of Redirection table entry */
  112. unsigned int dest; /* destination CPU physical ID */
  113. unsigned char dmode : 3; /* delivery mode (see iosapic.h) */
  114. unsigned char polarity: 1; /* interrupt polarity (see iosapic.h) */
  115. unsigned char trigger : 1; /* trigger mode (see iosapic.h) */
  116. } iosapic_intr_info[IA64_NUM_VECTORS];
  117. static struct iosapic {
  118. char __iomem *addr; /* base address of IOSAPIC */
  119. unsigned int gsi_base; /* first GSI assigned to this IOSAPIC */
  120. unsigned short num_rte; /* number of RTE in this IOSAPIC */
  121. int rtes_inuse; /* # of RTEs in use on this IOSAPIC */
  122. #ifdef CONFIG_NUMA
  123. unsigned short node; /* numa node association via pxm */
  124. #endif
  125. } iosapic_lists[NR_IOSAPICS];
  126. static unsigned char pcat_compat __devinitdata; /* 8259 compatibility flag */
  127. static int iosapic_kmalloc_ok;
  128. static LIST_HEAD(free_rte_list);
  129. /*
  130. * Find an IOSAPIC associated with a GSI
  131. */
  132. static inline int
  133. find_iosapic (unsigned int gsi)
  134. {
  135. int i;
  136. for (i = 0; i < NR_IOSAPICS; i++) {
  137. if ((unsigned) (gsi - iosapic_lists[i].gsi_base) < iosapic_lists[i].num_rte)
  138. return i;
  139. }
  140. return -1;
  141. }
  142. static inline int
  143. _gsi_to_vector (unsigned int gsi)
  144. {
  145. struct iosapic_intr_info *info;
  146. struct iosapic_rte_info *rte;
  147. for (info = iosapic_intr_info; info < iosapic_intr_info + IA64_NUM_VECTORS; ++info)
  148. list_for_each_entry(rte, &info->rtes, rte_list)
  149. if (rte->gsi_base + rte->rte_index == gsi)
  150. return info - iosapic_intr_info;
  151. return -1;
  152. }
  /*
   * Map a GSI number to the IA-64 interrupt vector it is routed to.
   * Returns -1 when no routing entry exists for the GSI.
   */
  inline int
  gsi_to_vector (unsigned int gsi)
  {
      int vector = _gsi_to_vector(gsi);

      return vector;
  }
  162. int
  163. gsi_to_irq (unsigned int gsi)
  164. {
  165. unsigned long flags;
  166. int irq;
  167. /*
  168. * XXX fix me: this assumes an identity mapping vetween IA-64 vector and Linux irq
  169. * numbers...
  170. */
  171. spin_lock_irqsave(&iosapic_lock, flags);
  172. {
  173. irq = _gsi_to_vector(gsi);
  174. }
  175. spin_unlock_irqrestore(&iosapic_lock, flags);
  176. return irq;
  177. }
  178. static struct iosapic_rte_info *gsi_vector_to_rte(unsigned int gsi, unsigned int vec)
  179. {
  180. struct iosapic_rte_info *rte;
  181. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list)
  182. if (rte->gsi_base + rte->rte_index == gsi)
  183. return rte;
  184. return NULL;
  185. }
  186. static void
  187. set_rte (unsigned int gsi, unsigned int vector, unsigned int dest, int mask)
  188. {
  189. unsigned long pol, trigger, dmode;
  190. u32 low32, high32;
  191. char __iomem *addr;
  192. int rte_index;
  193. char redir;
  194. struct iosapic_rte_info *rte;
  195. DBG(KERN_DEBUG"IOSAPIC: routing vector %d to 0x%x\n", vector, dest);
  196. rte = gsi_vector_to_rte(gsi, vector);
  197. if (!rte)
  198. return; /* not an IOSAPIC interrupt */
  199. rte_index = rte->rte_index;
  200. addr = rte->addr;
  201. pol = iosapic_intr_info[vector].polarity;
  202. trigger = iosapic_intr_info[vector].trigger;
  203. dmode = iosapic_intr_info[vector].dmode;
  204. redir = (dmode == IOSAPIC_LOWEST_PRIORITY) ? 1 : 0;
  205. #ifdef CONFIG_SMP
  206. {
  207. unsigned int irq;
  208. for (irq = 0; irq < NR_IRQS; ++irq)
  209. if (irq_to_vector(irq) == vector) {
  210. set_irq_affinity_info(irq, (int)(dest & 0xffff), redir);
  211. break;
  212. }
  213. }
  214. #endif
  215. low32 = ((pol << IOSAPIC_POLARITY_SHIFT) |
  216. (trigger << IOSAPIC_TRIGGER_SHIFT) |
  217. (dmode << IOSAPIC_DELIVERY_SHIFT) |
  218. ((mask ? 1 : 0) << IOSAPIC_MASK_SHIFT) |
  219. vector);
  220. /* dest contains both id and eid */
  221. high32 = (dest << IOSAPIC_DEST_SHIFT);
  222. iosapic_write(addr, IOSAPIC_RTE_HIGH(rte_index), high32);
  223. iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
  224. iosapic_intr_info[vector].low32 = low32;
  225. iosapic_intr_info[vector].dest = dest;
  226. }
  /*
   * Placeholder for interrupt-controller operations that need no action.
   */
  static void
  nop (unsigned int vector)
  {
      /* intentionally empty */
  }
  232. static void
  233. mask_irq (unsigned int irq)
  234. {
  235. unsigned long flags;
  236. char __iomem *addr;
  237. u32 low32;
  238. int rte_index;
  239. ia64_vector vec = irq_to_vector(irq);
  240. struct iosapic_rte_info *rte;
  241. if (list_empty(&iosapic_intr_info[vec].rtes))
  242. return; /* not an IOSAPIC interrupt! */
  243. spin_lock_irqsave(&iosapic_lock, flags);
  244. {
  245. /* set only the mask bit */
  246. low32 = iosapic_intr_info[vec].low32 |= IOSAPIC_MASK;
  247. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list) {
  248. addr = rte->addr;
  249. rte_index = rte->rte_index;
  250. iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
  251. }
  252. }
  253. spin_unlock_irqrestore(&iosapic_lock, flags);
  254. }
  255. static void
  256. unmask_irq (unsigned int irq)
  257. {
  258. unsigned long flags;
  259. char __iomem *addr;
  260. u32 low32;
  261. int rte_index;
  262. ia64_vector vec = irq_to_vector(irq);
  263. struct iosapic_rte_info *rte;
  264. if (list_empty(&iosapic_intr_info[vec].rtes))
  265. return; /* not an IOSAPIC interrupt! */
  266. spin_lock_irqsave(&iosapic_lock, flags);
  267. {
  268. low32 = iosapic_intr_info[vec].low32 &= ~IOSAPIC_MASK;
  269. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list) {
  270. addr = rte->addr;
  271. rte_index = rte->rte_index;
  272. iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
  273. }
  274. }
  275. spin_unlock_irqrestore(&iosapic_lock, flags);
  276. }
  277. static void
  278. iosapic_set_affinity (unsigned int irq, cpumask_t mask)
  279. {
  280. #ifdef CONFIG_SMP
  281. unsigned long flags;
  282. u32 high32, low32;
  283. int dest, rte_index;
  284. char __iomem *addr;
  285. int redir = (irq & IA64_IRQ_REDIRECTED) ? 1 : 0;
  286. ia64_vector vec;
  287. struct iosapic_rte_info *rte;
  288. irq &= (~IA64_IRQ_REDIRECTED);
  289. vec = irq_to_vector(irq);
  290. if (cpus_empty(mask))
  291. return;
  292. dest = cpu_physical_id(first_cpu(mask));
  293. if (list_empty(&iosapic_intr_info[vec].rtes))
  294. return; /* not an IOSAPIC interrupt */
  295. set_irq_affinity_info(irq, dest, redir);
  296. /* dest contains both id and eid */
  297. high32 = dest << IOSAPIC_DEST_SHIFT;
  298. spin_lock_irqsave(&iosapic_lock, flags);
  299. {
  300. low32 = iosapic_intr_info[vec].low32 & ~(7 << IOSAPIC_DELIVERY_SHIFT);
  301. if (redir)
  302. /* change delivery mode to lowest priority */
  303. low32 |= (IOSAPIC_LOWEST_PRIORITY << IOSAPIC_DELIVERY_SHIFT);
  304. else
  305. /* change delivery mode to fixed */
  306. low32 |= (IOSAPIC_FIXED << IOSAPIC_DELIVERY_SHIFT);
  307. iosapic_intr_info[vec].low32 = low32;
  308. iosapic_intr_info[vec].dest = dest;
  309. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list) {
  310. addr = rte->addr;
  311. rte_index = rte->rte_index;
  312. iosapic_write(addr, IOSAPIC_RTE_HIGH(rte_index), high32);
  313. iosapic_write(addr, IOSAPIC_RTE_LOW(rte_index), low32);
  314. }
  315. }
  316. spin_unlock_irqrestore(&iosapic_lock, flags);
  317. #endif
  318. }
  /*
   * Handlers for level-triggered interrupts.
   */

  /* Start a level-triggered irq by unmasking it; always returns 0. */
  static unsigned int
  iosapic_startup_level_irq (unsigned int irq)
  {
      unmask_irq(irq);

      return 0;
  }
  328. static void
  329. iosapic_end_level_irq (unsigned int irq)
  330. {
  331. ia64_vector vec = irq_to_vector(irq);
  332. struct iosapic_rte_info *rte;
  333. move_irq(irq);
  334. list_for_each_entry(rte, &iosapic_intr_info[vec].rtes, rte_list)
  335. iosapic_eoi(rte->addr, vec);
  336. }
  337. #define iosapic_shutdown_level_irq mask_irq
  338. #define iosapic_enable_level_irq unmask_irq
  339. #define iosapic_disable_level_irq mask_irq
  340. #define iosapic_ack_level_irq nop
  341. struct hw_interrupt_type irq_type_iosapic_level = {
  342. .typename = "IO-SAPIC-level",
  343. .startup = iosapic_startup_level_irq,
  344. .shutdown = iosapic_shutdown_level_irq,
  345. .enable = iosapic_enable_level_irq,
  346. .disable = iosapic_disable_level_irq,
  347. .ack = iosapic_ack_level_irq,
  348. .end = iosapic_end_level_irq,
  349. .set_affinity = iosapic_set_affinity
  350. };
  /*
   * Handlers for edge-triggered interrupts.
   */

  /* Start an edge-triggered irq by unmasking it; always returns 0. */
  static unsigned int
  iosapic_startup_edge_irq (unsigned int irq)
  {
      unmask_irq(irq);

      /*
       * The IOSAPIC simply drops interrupts that were pended while the
       * pin was masked, so there is no way to tell whether one is
       * already pending.  Let's hope not...
       */
      return 0;
  }
  365. static void
  366. iosapic_ack_edge_irq (unsigned int irq)
  367. {
  368. irq_desc_t *idesc = irq_descp(irq);
  369. move_irq(irq);
  370. /*
  371. * Once we have recorded IRQ_PENDING already, we can mask the
  372. * interrupt for real. This prevents IRQ storms from unhandled
  373. * devices.
  374. */
  375. if ((idesc->status & (IRQ_PENDING|IRQ_DISABLED)) == (IRQ_PENDING|IRQ_DISABLED))
  376. mask_irq(irq);
  377. }
  378. #define iosapic_enable_edge_irq unmask_irq
  379. #define iosapic_disable_edge_irq nop
  380. #define iosapic_end_edge_irq nop
  381. struct hw_interrupt_type irq_type_iosapic_edge = {
  382. .typename = "IO-SAPIC-edge",
  383. .startup = iosapic_startup_edge_irq,
  384. .shutdown = iosapic_disable_edge_irq,
  385. .enable = iosapic_enable_edge_irq,
  386. .disable = iosapic_disable_edge_irq,
  387. .ack = iosapic_ack_edge_irq,
  388. .end = iosapic_end_edge_irq,
  389. .set_affinity = iosapic_set_affinity
  390. };
  391. unsigned int
  392. iosapic_version (char __iomem *addr)
  393. {
  394. /*
  395. * IOSAPIC Version Register return 32 bit structure like:
  396. * {
  397. * unsigned int version : 8;
  398. * unsigned int reserved1 : 8;
  399. * unsigned int max_redir : 8;
  400. * unsigned int reserved2 : 8;
  401. * }
  402. */
  403. return iosapic_read(addr, IOSAPIC_VERSION);
  404. }
  405. static int iosapic_find_sharable_vector (unsigned long trigger, unsigned long pol)
  406. {
  407. int i, vector = -1, min_count = -1;
  408. struct iosapic_intr_info *info;
  409. /*
  410. * shared vectors for edge-triggered interrupts are not
  411. * supported yet
  412. */
  413. if (trigger == IOSAPIC_EDGE)
  414. return -1;
  415. for (i = IA64_FIRST_DEVICE_VECTOR; i <= IA64_LAST_DEVICE_VECTOR; i++) {
  416. info = &iosapic_intr_info[i];
  417. if (info->trigger == trigger && info->polarity == pol &&
  418. (info->dmode == IOSAPIC_FIXED || info->dmode == IOSAPIC_LOWEST_PRIORITY)) {
  419. if (min_count == -1 || info->count < min_count) {
  420. vector = i;
  421. min_count = info->count;
  422. }
  423. }
  424. }
  425. return vector;
  426. }
  427. /*
  428. * if the given vector is already owned by other,
  429. * assign a new vector for the other and make the vector available
  430. */
  431. static void __init
  432. iosapic_reassign_vector (int vector)
  433. {
  434. int new_vector;
  435. if (!list_empty(&iosapic_intr_info[vector].rtes)) {
  436. new_vector = assign_irq_vector(AUTO_ASSIGN);
  437. if (new_vector < 0)
  438. panic("%s: out of interrupt vectors!\n", __FUNCTION__);
  439. printk(KERN_INFO "Reassigning vector %d to %d\n", vector, new_vector);
  440. memcpy(&iosapic_intr_info[new_vector], &iosapic_intr_info[vector],
  441. sizeof(struct iosapic_intr_info));
  442. INIT_LIST_HEAD(&iosapic_intr_info[new_vector].rtes);
  443. list_move(iosapic_intr_info[vector].rtes.next, &iosapic_intr_info[new_vector].rtes);
  444. memset(&iosapic_intr_info[vector], 0, sizeof(struct iosapic_intr_info));
  445. iosapic_intr_info[vector].low32 = IOSAPIC_MASK;
  446. INIT_LIST_HEAD(&iosapic_intr_info[vector].rtes);
  447. }
  448. }
  449. static struct iosapic_rte_info *iosapic_alloc_rte (void)
  450. {
  451. int i;
  452. struct iosapic_rte_info *rte;
  453. int preallocated = 0;
  454. if (!iosapic_kmalloc_ok && list_empty(&free_rte_list)) {
  455. rte = alloc_bootmem(sizeof(struct iosapic_rte_info) * NR_PREALLOCATE_RTE_ENTRIES);
  456. if (!rte)
  457. return NULL;
  458. for (i = 0; i < NR_PREALLOCATE_RTE_ENTRIES; i++, rte++)
  459. list_add(&rte->rte_list, &free_rte_list);
  460. }
  461. if (!list_empty(&free_rte_list)) {
  462. rte = list_entry(free_rte_list.next, struct iosapic_rte_info, rte_list);
  463. list_del(&rte->rte_list);
  464. preallocated++;
  465. } else {
  466. rte = kmalloc(sizeof(struct iosapic_rte_info), GFP_ATOMIC);
  467. if (!rte)
  468. return NULL;
  469. }
  470. memset(rte, 0, sizeof(struct iosapic_rte_info));
  471. if (preallocated)
  472. rte->flags |= RTE_PREALLOCATED;
  473. return rte;
  474. }
  475. static void iosapic_free_rte (struct iosapic_rte_info *rte)
  476. {
  477. if (rte->flags & RTE_PREALLOCATED)
  478. list_add_tail(&rte->rte_list, &free_rte_list);
  479. else
  480. kfree(rte);
  481. }
  482. static inline int vector_is_shared (int vector)
  483. {
  484. return (iosapic_intr_info[vector].count > 1);
  485. }
  486. static int
  487. register_intr (unsigned int gsi, int vector, unsigned char delivery,
  488. unsigned long polarity, unsigned long trigger)
  489. {
  490. irq_desc_t *idesc;
  491. struct hw_interrupt_type *irq_type;
  492. int rte_index;
  493. int index;
  494. unsigned long gsi_base;
  495. void __iomem *iosapic_address;
  496. struct iosapic_rte_info *rte;
  497. index = find_iosapic(gsi);
  498. if (index < 0) {
  499. printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n", __FUNCTION__, gsi);
  500. return -ENODEV;
  501. }
  502. iosapic_address = iosapic_lists[index].addr;
  503. gsi_base = iosapic_lists[index].gsi_base;
  504. rte = gsi_vector_to_rte(gsi, vector);
  505. if (!rte) {
  506. rte = iosapic_alloc_rte();
  507. if (!rte) {
  508. printk(KERN_WARNING "%s: cannot allocate memory\n", __FUNCTION__);
  509. return -ENOMEM;
  510. }
  511. rte_index = gsi - gsi_base;
  512. rte->rte_index = rte_index;
  513. rte->addr = iosapic_address;
  514. rte->gsi_base = gsi_base;
  515. rte->refcnt++;
  516. list_add_tail(&rte->rte_list, &iosapic_intr_info[vector].rtes);
  517. iosapic_intr_info[vector].count++;
  518. iosapic_lists[index].rtes_inuse++;
  519. }
  520. else if (vector_is_shared(vector)) {
  521. struct iosapic_intr_info *info = &iosapic_intr_info[vector];
  522. if (info->trigger != trigger || info->polarity != polarity) {
  523. printk (KERN_WARNING "%s: cannot override the interrupt\n", __FUNCTION__);
  524. return -EINVAL;
  525. }
  526. }
  527. iosapic_intr_info[vector].polarity = polarity;
  528. iosapic_intr_info[vector].dmode = delivery;
  529. iosapic_intr_info[vector].trigger = trigger;
  530. if (trigger == IOSAPIC_EDGE)
  531. irq_type = &irq_type_iosapic_edge;
  532. else
  533. irq_type = &irq_type_iosapic_level;
  534. idesc = irq_descp(vector);
  535. if (idesc->handler != irq_type) {
  536. if (idesc->handler != &no_irq_type)
  537. printk(KERN_WARNING "%s: changing vector %d from %s to %s\n",
  538. __FUNCTION__, vector, idesc->handler->typename, irq_type->typename);
  539. idesc->handler = irq_type;
  540. }
  541. return 0;
  542. }
  /*
   * Choose the destination CPU (as a physical ID) for a GSI that is about
   * to be routed to @vector.
   *
   * On SMP the choice is, in order:
   *   1. the destination already recorded for the vector, if it has RTEs;
   *   2. the current CPU, if XTP redirection is enabled or the current CPU
   *      is not yet marked online;
   *   3. (NUMA) an online CPU on the IOSAPIC's node, selected by
   *      vector modulo the number of online CPUs on that node;
   *   4. the next online CPU in round-robin order.
   * On UP the current CPU is always returned.
   */
  static unsigned int
  get_target_cpu (unsigned int gsi, int vector)
  {
  #ifdef CONFIG_SMP
      /* Last CPU handed out by the round-robin fallback. */
      static int rr_cpu = -1;

      /*
       * When a vector is shared by several RTEs, all of them must use
       * the same destination CPU.
       */
      if (!list_empty(&iosapic_intr_info[vector].rtes))
          return iosapic_intr_info[vector].dest;

      /*
       * If the platform supports redirection via XTP, let it
       * distribute interrupts.
       */
      if (smp_int_redirect & SMP_IRQ_REDIRECTION)
          return cpu_physical_id(smp_processor_id());

      /*
       * Some interrupts (ACPI SCI, for instance) are registered
       * before the BSP is marked as online.
       */
      if (!cpu_online(smp_processor_id()))
          return cpu_physical_id(smp_processor_id());

  #ifdef CONFIG_NUMA
      {
          int num_cpus, cpu_index, iosapic_index, numa_cpu, i = 0;
          cpumask_t cpu_mask;

          iosapic_index = find_iosapic(gsi);
          if (iosapic_index < 0 ||
              iosapic_lists[iosapic_index].node == MAX_NUMNODES)
              goto skip_numa_setup;

          cpu_mask = node_to_cpumask(iosapic_lists[iosapic_index].node);

          /* Keep only the node's online CPUs. */
          for_each_cpu_mask(numa_cpu, cpu_mask) {
              if (!cpu_online(numa_cpu))
                  cpu_clear(numa_cpu, cpu_mask);
          }

          num_cpus = cpus_weight(cpu_mask);
          if (!num_cpus)
              goto skip_numa_setup;

          /* Use vector assignment to distribute across cpus in node */
          cpu_index = vector % num_cpus;

          numa_cpu = first_cpu(cpu_mask);
          while (i < cpu_index) {
              numa_cpu = next_cpu(numa_cpu, cpu_mask);
              i++;
          }

          if (numa_cpu != NR_CPUS)
              return cpu_physical_id(numa_cpu);
      }
  skip_numa_setup:
  #endif
      /*
       * Otherwise, round-robin interrupt vectors across all the
       * processors.  (It'd be nice if we could be smarter in the
       * case of NUMA.)
       */
      do {
          if (++rr_cpu >= NR_CPUS)
              rr_cpu = 0;
      } while (!cpu_online(rr_cpu));

      return cpu_physical_id(rr_cpu);
  #else
      return cpu_physical_id(smp_processor_id());
  #endif
  }
  605. /*
  606. * ACPI can describe IOSAPIC interrupts via static tables and namespace
  607. * methods. This provides an interface to register those interrupts and
  608. * program the IOSAPIC RTE.
  609. */
  610. int
  611. iosapic_register_intr (unsigned int gsi,
  612. unsigned long polarity, unsigned long trigger)
  613. {
  614. int vector, mask = 1, err;
  615. unsigned int dest;
  616. unsigned long flags;
  617. struct iosapic_rte_info *rte;
  618. u32 low32;
  619. again:
  620. /*
  621. * If this GSI has already been registered (i.e., it's a
  622. * shared interrupt, or we lost a race to register it),
  623. * don't touch the RTE.
  624. */
  625. spin_lock_irqsave(&iosapic_lock, flags);
  626. {
  627. vector = gsi_to_vector(gsi);
  628. if (vector > 0) {
  629. rte = gsi_vector_to_rte(gsi, vector);
  630. rte->refcnt++;
  631. spin_unlock_irqrestore(&iosapic_lock, flags);
  632. return vector;
  633. }
  634. }
  635. spin_unlock_irqrestore(&iosapic_lock, flags);
  636. /* If vector is running out, we try to find a sharable vector */
  637. vector = assign_irq_vector(AUTO_ASSIGN);
  638. if (vector < 0) {
  639. vector = iosapic_find_sharable_vector(trigger, polarity);
  640. if (vector < 0)
  641. return -ENOSPC;
  642. }
  643. spin_lock_irqsave(&irq_descp(vector)->lock, flags);
  644. spin_lock(&iosapic_lock);
  645. {
  646. if (gsi_to_vector(gsi) > 0) {
  647. if (list_empty(&iosapic_intr_info[vector].rtes))
  648. free_irq_vector(vector);
  649. spin_unlock(&iosapic_lock);
  650. spin_unlock_irqrestore(&irq_descp(vector)->lock, flags);
  651. goto again;
  652. }
  653. dest = get_target_cpu(gsi, vector);
  654. err = register_intr(gsi, vector, IOSAPIC_LOWEST_PRIORITY,
  655. polarity, trigger);
  656. if (err < 0) {
  657. spin_unlock(&iosapic_lock);
  658. spin_unlock_irqrestore(&irq_descp(vector)->lock, flags);
  659. return err;
  660. }
  661. /*
  662. * If the vector is shared and already unmasked for
  663. * other interrupt sources, don't mask it.
  664. */
  665. low32 = iosapic_intr_info[vector].low32;
  666. if (vector_is_shared(vector) && !(low32 & IOSAPIC_MASK))
  667. mask = 0;
  668. set_rte(gsi, vector, dest, mask);
  669. }
  670. spin_unlock(&iosapic_lock);
  671. spin_unlock_irqrestore(&irq_descp(vector)->lock, flags);
  672. printk(KERN_INFO "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d\n",
  673. gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
  674. (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
  675. cpu_logical_id(dest), dest, vector);
  676. return vector;
  677. }
  #ifdef CONFIG_ACPI_DEALLOCATE_IRQ
  /*
   * Undo one iosapic_register_intr() call for @gsi.
   *
   * The GSI's reference count is dropped; when it reaches zero the pin is
   * masked, its RTE descriptor is unlinked and freed, and the owning
   * IOSAPIC's in-use count is decremented.  When the last RTE of the vector
   * goes away, the per-vector info and the irq descriptor's handler are
   * reset and the vector is freed.  An unbalanced call (GSI not registered)
   * is reported and otherwise ignored.
   */
  void
  iosapic_unregister_intr (unsigned int gsi)
  {
      unsigned long flags;
      int irq, vector, index;
      irq_desc_t *idesc;
      u32 low32;
      unsigned long trigger, polarity;
      unsigned int dest;
      struct iosapic_rte_info *rte;

      /*
       * If the irq associated with the gsi is not found,
       * iosapic_unregister_intr() is unbalanced. We need to check
       * this again after getting locks.
       */
      irq = gsi_to_irq(gsi);
      if (irq < 0) {
          printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n", gsi);
          WARN_ON(1);
          return;
      }
      vector = irq_to_vector(irq);

      idesc = irq_descp(irq);
      spin_lock_irqsave(&idesc->lock, flags);
      spin_lock(&iosapic_lock);
      {
          rte = gsi_vector_to_rte(gsi, vector);
          if (rte == NULL) {
              printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n", gsi);
              WARN_ON(1);
              goto out;
          }

          /* Other registrations of this GSI are still outstanding. */
          if (--rte->refcnt > 0)
              goto out;

          /* Mask the interrupt */
          low32 = iosapic_intr_info[vector].low32 | IOSAPIC_MASK;
          iosapic_write(rte->addr, IOSAPIC_RTE_LOW(rte->rte_index), low32);

          /* Remove the rte entry from the list */
          list_del(&rte->rte_list);
          iosapic_intr_info[vector].count--;
          iosapic_free_rte(rte);

          /*
           * Update the owning IOSAPIC's usage count.  The lookup result
           * is checked so that a failed lookup (-1) can never be used
           * as an array index.
           */
          index = find_iosapic(gsi);
          if (index >= 0) {
              iosapic_lists[index].rtes_inuse--;
              WARN_ON(iosapic_lists[index].rtes_inuse < 0);
          } else {
              WARN_ON(1);
          }

          trigger = iosapic_intr_info[vector].trigger;
          polarity = iosapic_intr_info[vector].polarity;
          dest = iosapic_intr_info[vector].dest;
          printk(KERN_INFO "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d unregistered\n",
                 gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
                 (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
                 cpu_logical_id(dest), dest, vector);

          if (list_empty(&iosapic_intr_info[vector].rtes)) {
              /* Sanity check */
              BUG_ON(iosapic_intr_info[vector].count);

              /* Clear the interrupt controller descriptor */
              idesc->handler = &no_irq_type;

              /* Clear the interrupt information */
              memset(&iosapic_intr_info[vector], 0, sizeof(struct iosapic_intr_info));
              iosapic_intr_info[vector].low32 |= IOSAPIC_MASK;
              INIT_LIST_HEAD(&iosapic_intr_info[vector].rtes);

              if (idesc->action) {
                  printk(KERN_ERR "interrupt handlers still exist on IRQ %u\n", irq);
                  WARN_ON(1);
              }

              /* Free the interrupt vector */
              free_irq_vector(vector);
          }
      }
  out:
      spin_unlock(&iosapic_lock);
      spin_unlock_irqrestore(&idesc->lock, flags);
  }
  #endif /* CONFIG_ACPI_DEALLOCATE_IRQ */
  751. /*
  752. * ACPI calls this when it finds an entry for a platform interrupt.
  753. * Note that the irq_base and IOSAPIC address must be set in iosapic_init().
  754. */
  755. int __init
  756. iosapic_register_platform_intr (u32 int_type, unsigned int gsi,
  757. int iosapic_vector, u16 eid, u16 id,
  758. unsigned long polarity, unsigned long trigger)
  759. {
  760. static const char * const name[] = {"unknown", "PMI", "INIT", "CPEI"};
  761. unsigned char delivery;
  762. int vector, mask = 0;
  763. unsigned int dest = ((id << 8) | eid) & 0xffff;
  764. switch (int_type) {
  765. case ACPI_INTERRUPT_PMI:
  766. vector = iosapic_vector;
  767. /*
  768. * since PMI vector is alloc'd by FW(ACPI) not by kernel,
  769. * we need to make sure the vector is available
  770. */
  771. iosapic_reassign_vector(vector);
  772. delivery = IOSAPIC_PMI;
  773. break;
  774. case ACPI_INTERRUPT_INIT:
  775. vector = assign_irq_vector(AUTO_ASSIGN);
  776. if (vector < 0)
  777. panic("%s: out of interrupt vectors!\n", __FUNCTION__);
  778. delivery = IOSAPIC_INIT;
  779. break;
  780. case ACPI_INTERRUPT_CPEI:
  781. vector = IA64_CPE_VECTOR;
  782. delivery = IOSAPIC_LOWEST_PRIORITY;
  783. mask = 1;
  784. break;
  785. default:
  786. printk(KERN_ERR "iosapic_register_platform_irq(): invalid int type 0x%x\n", int_type);
  787. return -1;
  788. }
  789. register_intr(gsi, vector, delivery, polarity, trigger);
  790. printk(KERN_INFO "PLATFORM int %s (0x%x): GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d\n",
  791. int_type < ARRAY_SIZE(name) ? name[int_type] : "unknown",
  792. int_type, gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
  793. (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
  794. cpu_logical_id(dest), dest, vector);
  795. set_rte(gsi, vector, dest, mask);
  796. return vector;
  797. }
  798. /*
  799. * ACPI calls this when it finds an entry for a legacy ISA IRQ override.
  800. * Note that the gsi_base and IOSAPIC address must be set in iosapic_init().
  801. */
  802. void __init
  803. iosapic_override_isa_irq (unsigned int isa_irq, unsigned int gsi,
  804. unsigned long polarity,
  805. unsigned long trigger)
  806. {
  807. int vector;
  808. unsigned int dest = cpu_physical_id(smp_processor_id());
  809. vector = isa_irq_to_vector(isa_irq);
  810. register_intr(gsi, vector, IOSAPIC_LOWEST_PRIORITY, polarity, trigger);
  811. DBG("ISA: IRQ %u -> GSI %u (%s,%s) -> CPU %d (0x%04x) vector %d\n",
  812. isa_irq, gsi, trigger == IOSAPIC_EDGE ? "edge" : "level",
  813. polarity == IOSAPIC_POL_HIGH ? "high" : "low",
  814. cpu_logical_id(dest), dest, vector);
  815. set_rte(gsi, vector, dest, 1);
  816. }
  817. void __init
  818. iosapic_system_init (int system_pcat_compat)
  819. {
  820. int vector;
  821. for (vector = 0; vector < IA64_NUM_VECTORS; ++vector) {
  822. iosapic_intr_info[vector].low32 = IOSAPIC_MASK;
  823. INIT_LIST_HEAD(&iosapic_intr_info[vector].rtes); /* mark as unused */
  824. }
  825. pcat_compat = system_pcat_compat;
  826. if (pcat_compat) {
  827. /*
  828. * Disable the compatibility mode interrupts (8259 style), needs IN/OUT support
  829. * enabled.
  830. */
  831. printk(KERN_INFO "%s: Disabling PC-AT compatible 8259 interrupts\n", __FUNCTION__);
  832. outb(0xff, 0xA1);
  833. outb(0xff, 0x21);
  834. }
  835. }
  836. static inline int
  837. iosapic_alloc (void)
  838. {
  839. int index;
  840. for (index = 0; index < NR_IOSAPICS; index++)
  841. if (!iosapic_lists[index].addr)
  842. return index;
  843. printk(KERN_WARNING "%s: failed to allocate iosapic\n", __FUNCTION__);
  844. return -1;
  845. }
  846. static inline void
  847. iosapic_free (int index)
  848. {
  849. memset(&iosapic_lists[index], 0, sizeof(iosapic_lists[0]));
  850. }
  851. static inline int
  852. iosapic_check_gsi_range (unsigned int gsi_base, unsigned int ver)
  853. {
  854. int index;
  855. unsigned int gsi_end, base, end;
  856. /* check gsi range */
  857. gsi_end = gsi_base + ((ver >> 16) & 0xff);
  858. for (index = 0; index < NR_IOSAPICS; index++) {
  859. if (!iosapic_lists[index].addr)
  860. continue;
  861. base = iosapic_lists[index].gsi_base;
  862. end = base + iosapic_lists[index].num_rte - 1;
  863. if (gsi_base < base && gsi_end < base)
  864. continue;/* OK */
  865. if (gsi_base > end && gsi_end > end)
  866. continue; /* OK */
  867. return -EBUSY;
  868. }
  869. return 0;
  870. }
  871. int __devinit
  872. iosapic_init (unsigned long phys_addr, unsigned int gsi_base)
  873. {
  874. int num_rte, err, index;
  875. unsigned int isa_irq, ver;
  876. char __iomem *addr;
  877. unsigned long flags;
  878. spin_lock_irqsave(&iosapic_lock, flags);
  879. {
  880. addr = ioremap(phys_addr, 0);
  881. ver = iosapic_version(addr);
  882. if ((err = iosapic_check_gsi_range(gsi_base, ver))) {
  883. iounmap(addr);
  884. spin_unlock_irqrestore(&iosapic_lock, flags);
  885. return err;
  886. }
  887. /*
  888. * The MAX_REDIR register holds the highest input pin
  889. * number (starting from 0).
  890. * We add 1 so that we can use it for number of pins (= RTEs)
  891. */
  892. num_rte = ((ver >> 16) & 0xff) + 1;
  893. index = iosapic_alloc();
  894. iosapic_lists[index].addr = addr;
  895. iosapic_lists[index].gsi_base = gsi_base;
  896. iosapic_lists[index].num_rte = num_rte;
  897. #ifdef CONFIG_NUMA
  898. iosapic_lists[index].node = MAX_NUMNODES;
  899. #endif
  900. }
  901. spin_unlock_irqrestore(&iosapic_lock, flags);
  902. if ((gsi_base == 0) && pcat_compat) {
  903. /*
  904. * Map the legacy ISA devices into the IOSAPIC data. Some of these may
  905. * get reprogrammed later on with data from the ACPI Interrupt Source
  906. * Override table.
  907. */
  908. for (isa_irq = 0; isa_irq < 16; ++isa_irq)
  909. iosapic_override_isa_irq(isa_irq, isa_irq, IOSAPIC_POL_HIGH, IOSAPIC_EDGE);
  910. }
  911. return 0;
  912. }
  913. #ifdef CONFIG_HOTPLUG
  914. int
  915. iosapic_remove (unsigned int gsi_base)
  916. {
  917. int index, err = 0;
  918. unsigned long flags;
  919. spin_lock_irqsave(&iosapic_lock, flags);
  920. {
  921. index = find_iosapic(gsi_base);
  922. if (index < 0) {
  923. printk(KERN_WARNING "%s: No IOSAPIC for GSI base %u\n",
  924. __FUNCTION__, gsi_base);
  925. goto out;
  926. }
  927. if (iosapic_lists[index].rtes_inuse) {
  928. err = -EBUSY;
  929. printk(KERN_WARNING "%s: IOSAPIC for GSI base %u is busy\n",
  930. __FUNCTION__, gsi_base);
  931. goto out;
  932. }
  933. iounmap(iosapic_lists[index].addr);
  934. iosapic_free(index);
  935. }
  936. out:
  937. spin_unlock_irqrestore(&iosapic_lock, flags);
  938. return err;
  939. }
  940. #endif /* CONFIG_HOTPLUG */
  941. #ifdef CONFIG_NUMA
  942. void __devinit
  943. map_iosapic_to_node(unsigned int gsi_base, int node)
  944. {
  945. int index;
  946. index = find_iosapic(gsi_base);
  947. if (index < 0) {
  948. printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n",
  949. __FUNCTION__, gsi_base);
  950. return;
  951. }
  952. iosapic_lists[index].node = node;
  953. return;
  954. }
  955. #endif
  956. static int __init iosapic_enable_kmalloc (void)
  957. {
  958. iosapic_kmalloc_ok = 1;
  959. return 0;
  960. }
  961. core_initcall (iosapic_enable_kmalloc);