iosapic.c 29 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142
  1. /*
  2. * I/O SAPIC support.
  3. *
  4. * Copyright (C) 1999 Intel Corp.
  5. * Copyright (C) 1999 Asit Mallick <asit.k.mallick@intel.com>
  6. * Copyright (C) 2000-2002 J.I. Lee <jung-ik.lee@intel.com>
  7. * Copyright (C) 1999-2000, 2002-2003 Hewlett-Packard Co.
  8. * David Mosberger-Tang <davidm@hpl.hp.com>
  9. * Copyright (C) 1999 VA Linux Systems
  10. * Copyright (C) 1999,2000 Walt Drummond <drummond@valinux.com>
  11. *
  12. * 00/04/19 D. Mosberger Rewritten to mirror more closely the x86 I/O
  13. * APIC code. In particular, we now have separate
  14. * handlers for edge and level triggered
  15. * interrupts.
  16. * 00/10/27 Asit Mallick, Goutham Rao <goutham.rao@intel.com> IRQ vector
  17. * allocation PCI to vector mapping, shared PCI
  18. * interrupts.
  19. * 00/10/27 D. Mosberger Document things a bit more to make them more
  20. * understandable. Clean up much of the old
  21. * IOSAPIC cruft.
  22. * 01/07/27 J.I. Lee PCI irq routing, Platform/Legacy interrupts
  23. * and fixes for ACPI S5(SoftOff) support.
  24. * 02/01/23 J.I. Lee iosapic pgm fixes for PCI irq routing from _PRT
  25. * 02/01/07 E. Focht <efocht@ess.nec.de> Redirectable interrupt
  26. * vectors in iosapic_set_affinity(),
  27. * initializations for /proc/irq/#/smp_affinity
  28. * 02/04/02 P. Diefenbaugh Cleaned up ACPI PCI IRQ routing.
  29. * 02/04/18 J.I. Lee bug fix in iosapic_init_pci_irq
  30. * 02/04/30 J.I. Lee bug fix in find_iosapic to fix ACPI PCI IRQ to
  31. * IOSAPIC mapping error
  32. * 02/07/29 T. Kochi Allocate interrupt vectors dynamically
  33. * 02/08/04 T. Kochi Cleaned up terminology (irq, global system
  34. * interrupt, vector, etc.)
  35. * 02/09/20 D. Mosberger Simplified by taking advantage of ACPI's
  36. * pci_irq code.
  37. * 03/02/19 B. Helgaas Make pcat_compat system-wide, not per-IOSAPIC.
  38. * Remove iosapic_address & gsi_base from
  39. * external interfaces. Rationalize
  40. * __init/__devinit attributes.
  41. * 04/12/04 Ashok Raj <ashok.raj@intel.com> Intel Corporation 2004
  42. * Updated to work with irq migration necessary
  43. * for CPU Hotplug
  44. */
  45. /*
  46. * Here is what the interrupt logic between a PCI device and the kernel looks
  47. * like:
  48. *
  49. * (1) A PCI device raises one of the four interrupt pins (INTA, INTB, INTC,
  50. * INTD). The device is uniquely identified by its bus-, and slot-number
  51. * (the function number does not matter here because all functions share
  52. * the same interrupt lines).
  53. *
  54. * (2) The motherboard routes the interrupt line to a pin on an IOSAPIC
  55. * controller. Multiple interrupt lines may have to share the same
  56. * IOSAPIC pin (if they're level triggered and use the same polarity).
  57. * Each interrupt line has a unique Global System Interrupt (GSI) number
  58. * which can be calculated as the sum of the controller's base GSI number
  59. * and the IOSAPIC pin number to which the line connects.
  60. *
  61. * (3) The IOSAPIC uses internal routing table entries (RTEs) to map the
  62. * IOSAPIC pin into the IA-64 interrupt vector. This interrupt vector is then
  63. * sent to the CPU.
  64. *
  65. * (4) The kernel recognizes an interrupt as an IRQ. The IRQ interface is
  66. * used as an architecture-independent interrupt handling mechanism in Linux.
  67. * As an IRQ is a number, we need an
  68. * IA-64 interrupt vector number <-> IRQ number mapping. On smaller
  69. * systems, we use one-to-one mapping between IA-64 vector and IRQ. A
  70. * platform can implement platform_irq_to_vector(irq) and
  71. * platform_local_vector_to_irq(vector) APIs to differentiate the mapping.
  72. * Please see also arch/ia64/include/asm/hw_irq.h for those APIs.
  73. *
  74. * To sum up, there are three levels of mappings involved:
  75. *
  76. * PCI pin -> global system interrupt (GSI) -> IA-64 vector <-> IRQ
  77. *
  78. * Note: The term "IRQ" is loosely used everywhere in Linux kernel to
  79. * describe interrupts. Now we use "IRQ" only for Linux IRQ's. ISA IRQ
  80. * (isa_irq) is the only exception in this source code.
  81. */
  82. #include <linux/acpi.h>
  83. #include <linux/init.h>
  84. #include <linux/irq.h>
  85. #include <linux/kernel.h>
  86. #include <linux/list.h>
  87. #include <linux/pci.h>
  88. #include <linux/slab.h>
  89. #include <linux/smp.h>
  90. #include <linux/string.h>
  91. #include <linux/bootmem.h>
  92. #include <asm/delay.h>
  93. #include <asm/hw_irq.h>
  94. #include <asm/io.h>
  95. #include <asm/iosapic.h>
  96. #include <asm/machvec.h>
  97. #include <asm/processor.h>
  98. #include <asm/ptrace.h>
  /*
   * Interrupt-routing debug output.  DEBUG_INTERRUPT_ROUTING is explicitly
   * undefined below, so DBG() normally expands to nothing; when the symbol
   * is defined instead, DBG() forwards its arguments to printk().
   */
  #undef DEBUG_INTERRUPT_ROUTING

  #ifdef DEBUG_INTERRUPT_ROUTING
  # define DBG(fmt...)	printk(fmt)
  #else
  # define DBG(fmt...)
  #endif

  /*
   * Taken (with interrupts disabled) by gsi_to_irq() and by the
   * register/unregister paths around the GSI <-> IRQ <-> RTE bookkeeping.
   */
  static DEFINE_SPINLOCK(iosapic_lock);
  106. /*
  107. * These tables map IA-64 vectors to the IOSAPIC pin that generates this
  108. * vector.
  109. */
  110. #define NO_REF_RTE 0
  111. static struct iosapic {
  112. char __iomem *addr; /* base address of IOSAPIC */
  113. unsigned int gsi_base; /* GSI base */
  114. unsigned short num_rte; /* # of RTEs on this IOSAPIC */
  115. int rtes_inuse; /* # of RTEs in use on this IOSAPIC */
  116. #ifdef CONFIG_NUMA
  117. unsigned short node; /* numa node association via pxm */
  118. #endif
  119. spinlock_t lock; /* lock for indirect reg access */
  120. } iosapic_lists[NR_IOSAPICS];
  121. struct iosapic_rte_info {
  122. struct list_head rte_list; /* RTEs sharing the same vector */
  123. char rte_index; /* IOSAPIC RTE index */
  124. int refcnt; /* reference counter */
  125. struct iosapic *iosapic;
  126. } ____cacheline_aligned;
  127. static struct iosapic_intr_info {
  128. struct list_head rtes; /* RTEs using this vector (empty =>
  129. * not an IOSAPIC interrupt) */
  130. int count; /* # of registered RTEs */
  131. u32 low32; /* current value of low word of
  132. * Redirection table entry */
  133. unsigned int dest; /* destination CPU physical ID */
  134. unsigned char dmode : 3; /* delivery mode (see iosapic.h) */
  135. unsigned char polarity: 1; /* interrupt polarity
  136. * (see iosapic.h) */
  137. unsigned char trigger : 1; /* trigger mode (see iosapic.h) */
  138. } iosapic_intr_info[NR_IRQS];
  139. static unsigned char pcat_compat; /* 8259 compatibility flag */
  140. static inline void
  141. iosapic_write(struct iosapic *iosapic, unsigned int reg, u32 val)
  142. {
  143. unsigned long flags;
  144. spin_lock_irqsave(&iosapic->lock, flags);
  145. __iosapic_write(iosapic->addr, reg, val);
  146. spin_unlock_irqrestore(&iosapic->lock, flags);
  147. }
  148. /*
  149. * Find an IOSAPIC associated with a GSI
  150. */
  151. static inline int
  152. find_iosapic (unsigned int gsi)
  153. {
  154. int i;
  155. for (i = 0; i < NR_IOSAPICS; i++) {
  156. if ((unsigned) (gsi - iosapic_lists[i].gsi_base) <
  157. iosapic_lists[i].num_rte)
  158. return i;
  159. }
  160. return -1;
  161. }
  162. static inline int __gsi_to_irq(unsigned int gsi)
  163. {
  164. int irq;
  165. struct iosapic_intr_info *info;
  166. struct iosapic_rte_info *rte;
  167. for (irq = 0; irq < NR_IRQS; irq++) {
  168. info = &iosapic_intr_info[irq];
  169. list_for_each_entry(rte, &info->rtes, rte_list)
  170. if (rte->iosapic->gsi_base + rte->rte_index == gsi)
  171. return irq;
  172. }
  173. return -1;
  174. }
  175. int
  176. gsi_to_irq (unsigned int gsi)
  177. {
  178. unsigned long flags;
  179. int irq;
  180. spin_lock_irqsave(&iosapic_lock, flags);
  181. irq = __gsi_to_irq(gsi);
  182. spin_unlock_irqrestore(&iosapic_lock, flags);
  183. return irq;
  184. }
  185. static struct iosapic_rte_info *find_rte(unsigned int irq, unsigned int gsi)
  186. {
  187. struct iosapic_rte_info *rte;
  188. list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list)
  189. if (rte->iosapic->gsi_base + rte->rte_index == gsi)
  190. return rte;
  191. return NULL;
  192. }
  193. static void
  194. set_rte (unsigned int gsi, unsigned int irq, unsigned int dest, int mask)
  195. {
  196. unsigned long pol, trigger, dmode;
  197. u32 low32, high32;
  198. int rte_index;
  199. char redir;
  200. struct iosapic_rte_info *rte;
  201. ia64_vector vector = irq_to_vector(irq);
  202. DBG(KERN_DEBUG"IOSAPIC: routing vector %d to 0x%x\n", vector, dest);
  203. rte = find_rte(irq, gsi);
  204. if (!rte)
  205. return; /* not an IOSAPIC interrupt */
  206. rte_index = rte->rte_index;
  207. pol = iosapic_intr_info[irq].polarity;
  208. trigger = iosapic_intr_info[irq].trigger;
  209. dmode = iosapic_intr_info[irq].dmode;
  210. redir = (dmode == IOSAPIC_LOWEST_PRIORITY) ? 1 : 0;
  211. #ifdef CONFIG_SMP
  212. set_irq_affinity_info(irq, (int)(dest & 0xffff), redir);
  213. #endif
  214. low32 = ((pol << IOSAPIC_POLARITY_SHIFT) |
  215. (trigger << IOSAPIC_TRIGGER_SHIFT) |
  216. (dmode << IOSAPIC_DELIVERY_SHIFT) |
  217. ((mask ? 1 : 0) << IOSAPIC_MASK_SHIFT) |
  218. vector);
  219. /* dest contains both id and eid */
  220. high32 = (dest << IOSAPIC_DEST_SHIFT);
  221. iosapic_write(rte->iosapic, IOSAPIC_RTE_HIGH(rte_index), high32);
  222. iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte_index), low32);
  223. iosapic_intr_info[irq].low32 = low32;
  224. iosapic_intr_info[irq].dest = dest;
  225. }
  /*
   * Placeholder irq_chip callback for operations that need no hardware
   * access (used below for the level "ack" and the edge "disable"/"shutdown"
   * hooks).
   */
  static void
  iosapic_nop (struct irq_data *data)
  {
  	/* intentionally empty */
  }
  #ifdef CONFIG_KEXEC
  /*
   * Quiesce every IOSAPIC pin known to this file: for each RTE of each IRQ,
   * write a masked low word carrying the IRQ's vector and then issue an EOI
   * for that vector on the owning controller.
   */
  void
  kexec_disable_iosapic(void)
  {
  	struct iosapic_rte_info *rte;
  	ia64_vector vec;
  	int irq;

  	for (irq = 0; irq < NR_IRQS; irq++) {
  		struct iosapic_intr_info *info = &iosapic_intr_info[irq];

  		vec = irq_to_vector(irq);

  		list_for_each_entry(rte, &info->rtes, rte_list) {
  			iosapic_write(rte->iosapic,
  				      IOSAPIC_RTE_LOW(rte->rte_index),
  				      IOSAPIC_MASK|vec);
  			iosapic_eoi(rte->iosapic->addr, vec);
  		}
  	}
  }
  #endif
  252. static void
  253. mask_irq (struct irq_data *data)
  254. {
  255. unsigned int irq = data->irq;
  256. u32 low32;
  257. int rte_index;
  258. struct iosapic_rte_info *rte;
  259. if (!iosapic_intr_info[irq].count)
  260. return; /* not an IOSAPIC interrupt! */
  261. /* set only the mask bit */
  262. low32 = iosapic_intr_info[irq].low32 |= IOSAPIC_MASK;
  263. list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) {
  264. rte_index = rte->rte_index;
  265. iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte_index), low32);
  266. }
  267. }
  268. static void
  269. unmask_irq (struct irq_data *data)
  270. {
  271. unsigned int irq = data->irq;
  272. u32 low32;
  273. int rte_index;
  274. struct iosapic_rte_info *rte;
  275. if (!iosapic_intr_info[irq].count)
  276. return; /* not an IOSAPIC interrupt! */
  277. low32 = iosapic_intr_info[irq].low32 &= ~IOSAPIC_MASK;
  278. list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) {
  279. rte_index = rte->rte_index;
  280. iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte_index), low32);
  281. }
  282. }
  283. static int
  284. iosapic_set_affinity(struct irq_data *data, const struct cpumask *mask,
  285. bool force)
  286. {
  287. #ifdef CONFIG_SMP
  288. unsigned int irq = data->irq;
  289. u32 high32, low32;
  290. int cpu, dest, rte_index;
  291. int redir = (irq & IA64_IRQ_REDIRECTED) ? 1 : 0;
  292. struct iosapic_rte_info *rte;
  293. struct iosapic *iosapic;
  294. irq &= (~IA64_IRQ_REDIRECTED);
  295. cpu = cpumask_first_and(cpu_online_mask, mask);
  296. if (cpu >= nr_cpu_ids)
  297. return -1;
  298. if (irq_prepare_move(irq, cpu))
  299. return -1;
  300. dest = cpu_physical_id(cpu);
  301. if (!iosapic_intr_info[irq].count)
  302. return -1; /* not an IOSAPIC interrupt */
  303. set_irq_affinity_info(irq, dest, redir);
  304. /* dest contains both id and eid */
  305. high32 = dest << IOSAPIC_DEST_SHIFT;
  306. low32 = iosapic_intr_info[irq].low32 & ~(7 << IOSAPIC_DELIVERY_SHIFT);
  307. if (redir)
  308. /* change delivery mode to lowest priority */
  309. low32 |= (IOSAPIC_LOWEST_PRIORITY << IOSAPIC_DELIVERY_SHIFT);
  310. else
  311. /* change delivery mode to fixed */
  312. low32 |= (IOSAPIC_FIXED << IOSAPIC_DELIVERY_SHIFT);
  313. low32 &= IOSAPIC_VECTOR_MASK;
  314. low32 |= irq_to_vector(irq);
  315. iosapic_intr_info[irq].low32 = low32;
  316. iosapic_intr_info[irq].dest = dest;
  317. list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) {
  318. iosapic = rte->iosapic;
  319. rte_index = rte->rte_index;
  320. iosapic_write(iosapic, IOSAPIC_RTE_HIGH(rte_index), high32);
  321. iosapic_write(iosapic, IOSAPIC_RTE_LOW(rte_index), low32);
  322. }
  323. #endif
  324. return 0;
  325. }
  /*
   * Handlers for level-triggered interrupts.
   */

  /* .irq_startup hook: unmask the interrupt; always returns 0. */
  static unsigned int
  iosapic_startup_level_irq (struct irq_data *data)
  {
  	unmask_irq(data);

  	return 0;
  }
  335. static void
  336. iosapic_unmask_level_irq (struct irq_data *data)
  337. {
  338. unsigned int irq = data->irq;
  339. ia64_vector vec = irq_to_vector(irq);
  340. struct iosapic_rte_info *rte;
  341. int do_unmask_irq = 0;
  342. irq_complete_move(irq);
  343. if (unlikely(irqd_is_setaffinity_pending(data))) {
  344. do_unmask_irq = 1;
  345. mask_irq(data);
  346. } else
  347. unmask_irq(data);
  348. list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list)
  349. iosapic_eoi(rte->iosapic->addr, vec);
  350. if (unlikely(do_unmask_irq)) {
  351. irq_move_masked_irq(data);
  352. unmask_irq(data);
  353. }
  354. }
  355. #define iosapic_shutdown_level_irq mask_irq
  356. #define iosapic_enable_level_irq unmask_irq
  357. #define iosapic_disable_level_irq mask_irq
  358. #define iosapic_ack_level_irq iosapic_nop
  359. static struct irq_chip irq_type_iosapic_level = {
  360. .name = "IO-SAPIC-level",
  361. .irq_startup = iosapic_startup_level_irq,
  362. .irq_shutdown = iosapic_shutdown_level_irq,
  363. .irq_enable = iosapic_enable_level_irq,
  364. .irq_disable = iosapic_disable_level_irq,
  365. .irq_ack = iosapic_ack_level_irq,
  366. .irq_mask = mask_irq,
  367. .irq_unmask = iosapic_unmask_level_irq,
  368. .irq_set_affinity = iosapic_set_affinity
  369. };
  /*
   * Handlers for edge-triggered interrupts.
   */

  /* .irq_startup hook: unmask the interrupt; always returns 0. */
  static unsigned int
  iosapic_startup_edge_irq (struct irq_data *data)
  {
  	unmask_irq(data);

  	/*
  	 * IOSAPIC simply drops interrupts pended while the
  	 * corresponding pin was masked, so we can't know if an
  	 * interrupt is pending already.  Let's hope not...
  	 */
  	return 0;
  }
  384. static void
  385. iosapic_ack_edge_irq (struct irq_data *data)
  386. {
  387. irq_complete_move(data->irq);
  388. irq_move_irq(data);
  389. }
  390. #define iosapic_enable_edge_irq unmask_irq
  391. #define iosapic_disable_edge_irq iosapic_nop
  392. static struct irq_chip irq_type_iosapic_edge = {
  393. .name = "IO-SAPIC-edge",
  394. .irq_startup = iosapic_startup_edge_irq,
  395. .irq_shutdown = iosapic_disable_edge_irq,
  396. .irq_enable = iosapic_enable_edge_irq,
  397. .irq_disable = iosapic_disable_edge_irq,
  398. .irq_ack = iosapic_ack_edge_irq,
  399. .irq_mask = mask_irq,
  400. .irq_unmask = unmask_irq,
  401. .irq_set_affinity = iosapic_set_affinity
  402. };
  403. static unsigned int
  404. iosapic_version (char __iomem *addr)
  405. {
  406. /*
  407. * IOSAPIC Version Register return 32 bit structure like:
  408. * {
  409. * unsigned int version : 8;
  410. * unsigned int reserved1 : 8;
  411. * unsigned int max_redir : 8;
  412. * unsigned int reserved2 : 8;
  413. * }
  414. */
  415. return __iosapic_read(addr, IOSAPIC_VERSION);
  416. }
  417. static int iosapic_find_sharable_irq(unsigned long trigger, unsigned long pol)
  418. {
  419. int i, irq = -ENOSPC, min_count = -1;
  420. struct iosapic_intr_info *info;
  421. /*
  422. * shared vectors for edge-triggered interrupts are not
  423. * supported yet
  424. */
  425. if (trigger == IOSAPIC_EDGE)
  426. return -EINVAL;
  427. for (i = 0; i < NR_IRQS; i++) {
  428. info = &iosapic_intr_info[i];
  429. if (info->trigger == trigger && info->polarity == pol &&
  430. (info->dmode == IOSAPIC_FIXED ||
  431. info->dmode == IOSAPIC_LOWEST_PRIORITY) &&
  432. can_request_irq(i, IRQF_SHARED)) {
  433. if (min_count == -1 || info->count < min_count) {
  434. irq = i;
  435. min_count = info->count;
  436. }
  437. }
  438. }
  439. return irq;
  440. }
  441. /*
  442. * if the given vector is already owned by other,
  443. * assign a new vector for the other and make the vector available
  444. */
  445. static void __init
  446. iosapic_reassign_vector (int irq)
  447. {
  448. int new_irq;
  449. if (iosapic_intr_info[irq].count) {
  450. new_irq = create_irq();
  451. if (new_irq < 0)
  452. panic("%s: out of interrupt vectors!\n", __func__);
  453. printk(KERN_INFO "Reassigning vector %d to %d\n",
  454. irq_to_vector(irq), irq_to_vector(new_irq));
  455. memcpy(&iosapic_intr_info[new_irq], &iosapic_intr_info[irq],
  456. sizeof(struct iosapic_intr_info));
  457. INIT_LIST_HEAD(&iosapic_intr_info[new_irq].rtes);
  458. list_move(iosapic_intr_info[irq].rtes.next,
  459. &iosapic_intr_info[new_irq].rtes);
  460. memset(&iosapic_intr_info[irq], 0,
  461. sizeof(struct iosapic_intr_info));
  462. iosapic_intr_info[irq].low32 = IOSAPIC_MASK;
  463. INIT_LIST_HEAD(&iosapic_intr_info[irq].rtes);
  464. }
  465. }
  466. static inline int irq_is_shared (int irq)
  467. {
  468. return (iosapic_intr_info[irq].count > 1);
  469. }
  470. struct irq_chip*
  471. ia64_native_iosapic_get_irq_chip(unsigned long trigger)
  472. {
  473. if (trigger == IOSAPIC_EDGE)
  474. return &irq_type_iosapic_edge;
  475. else
  476. return &irq_type_iosapic_level;
  477. }
  478. static int
  479. register_intr (unsigned int gsi, int irq, unsigned char delivery,
  480. unsigned long polarity, unsigned long trigger)
  481. {
  482. struct irq_chip *chip, *irq_type;
  483. int index;
  484. struct iosapic_rte_info *rte;
  485. index = find_iosapic(gsi);
  486. if (index < 0) {
  487. printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n",
  488. __func__, gsi);
  489. return -ENODEV;
  490. }
  491. rte = find_rte(irq, gsi);
  492. if (!rte) {
  493. rte = kzalloc(sizeof (*rte), GFP_ATOMIC);
  494. if (!rte) {
  495. printk(KERN_WARNING "%s: cannot allocate memory\n",
  496. __func__);
  497. return -ENOMEM;
  498. }
  499. rte->iosapic = &iosapic_lists[index];
  500. rte->rte_index = gsi - rte->iosapic->gsi_base;
  501. rte->refcnt++;
  502. list_add_tail(&rte->rte_list, &iosapic_intr_info[irq].rtes);
  503. iosapic_intr_info[irq].count++;
  504. iosapic_lists[index].rtes_inuse++;
  505. }
  506. else if (rte->refcnt == NO_REF_RTE) {
  507. struct iosapic_intr_info *info = &iosapic_intr_info[irq];
  508. if (info->count > 0 &&
  509. (info->trigger != trigger || info->polarity != polarity)){
  510. printk (KERN_WARNING
  511. "%s: cannot override the interrupt\n",
  512. __func__);
  513. return -EINVAL;
  514. }
  515. rte->refcnt++;
  516. iosapic_intr_info[irq].count++;
  517. iosapic_lists[index].rtes_inuse++;
  518. }
  519. iosapic_intr_info[irq].polarity = polarity;
  520. iosapic_intr_info[irq].dmode = delivery;
  521. iosapic_intr_info[irq].trigger = trigger;
  522. irq_type = iosapic_get_irq_chip(trigger);
  523. chip = irq_get_chip(irq);
  524. if (irq_type != NULL && chip != irq_type) {
  525. if (chip != &no_irq_chip)
  526. printk(KERN_WARNING
  527. "%s: changing vector %d from %s to %s\n",
  528. __func__, irq_to_vector(irq),
  529. chip->name, irq_type->name);
  530. chip = irq_type;
  531. }
  532. irq_set_chip_handler_name_locked(irq_get_irq_data(irq), chip,
  533. trigger == IOSAPIC_EDGE ? handle_edge_irq : handle_level_irq,
  534. NULL);
  535. return 0;
  536. }
  /*
   * Choose the destination CPU for the interrupt (@gsi, @irq) and return
   * its physical id.
   *
   * On SMP the first applicable rule wins:
   *  1. the IRQ already has registered RTEs: reuse its current destination;
   *  2. SMP_IRQ_REDIRECTION is set in smp_int_redirect: the current CPU;
   *  3. the current CPU is not marked online yet: the current CPU;
   *  4. (CONFIG_ACPI) cpe_vector > 0 and the IRQ's vector is
   *     IA64_CPEP_VECTOR: whatever get_cpei_target_cpu() returns;
   *  5. (CONFIG_NUMA) an online CPU of the IOSAPIC's node that is also in
   *     the IRQ's domain, selected by irq % (number of such CPUs);
   *  6. otherwise round-robin over the online CPUs in the IRQ's domain.
   *
   * Without CONFIG_SMP the current CPU is always returned.
   */
  static unsigned int
  get_target_cpu (unsigned int gsi, int irq)
  {
  #ifdef CONFIG_SMP
  	static int last_cpu = -1;	/* round-robin cursor, kept across calls */
  	extern int cpe_vector;
  	cpumask_t domain = irq_to_domain(irq);

  	/*
  	 * In case of vector shared by multiple RTEs, all RTEs that
  	 * share the vector need to use the same destination CPU.
  	 */
  	if (iosapic_intr_info[irq].count)
  		return iosapic_intr_info[irq].dest;

  	/*
  	 * If the platform supports redirection via XTP, let it
  	 * distribute interrupts.
  	 */
  	if (smp_int_redirect & SMP_IRQ_REDIRECTION)
  		return cpu_physical_id(smp_processor_id());

  	/*
  	 * Some interrupts (ACPI SCI, for instance) are registered
  	 * before the BSP is marked as online.
  	 */
  	if (!cpu_online(smp_processor_id()))
  		return cpu_physical_id(smp_processor_id());

  #ifdef CONFIG_ACPI
  	if (cpe_vector > 0 && irq_to_vector(irq) == IA64_CPEP_VECTOR)
  		return get_cpei_target_cpu();
  #endif

  #ifdef CONFIG_NUMA
  	{
  		int usable, pick, idx, candidate, seen = 0;
  		const struct cpumask *node_mask;

  		idx = find_iosapic(gsi);
  		if (idx < 0 || iosapic_lists[idx].node == MAX_NUMNODES)
  			goto skip_numa_setup;

  		node_mask = cpumask_of_node(iosapic_lists[idx].node);

  		/* count the online CPUs that are in both node and domain */
  		usable = 0;
  		for_each_cpu_and(candidate, node_mask, &domain) {
  			if (cpu_online(candidate))
  				usable++;
  		}

  		if (!usable)
  			goto skip_numa_setup;

  		/* Use irq assignment to distribute across cpus in node */
  		pick = irq % usable;

  		for_each_cpu_and(candidate, node_mask, &domain)
  			if (cpu_online(candidate) && seen++ >= pick)
  				break;

  		if (candidate < nr_cpu_ids)
  			return cpu_physical_id(candidate);
  	}
  skip_numa_setup:
  #endif
  	/*
  	 * Otherwise, round-robin interrupt vectors across all the
  	 * processors.  (It'd be nice if we could be smarter in the
  	 * case of NUMA.)
  	 */
  	do {
  		if (++last_cpu >= nr_cpu_ids)
  			last_cpu = 0;
  	} while (!cpu_online(last_cpu) || !cpumask_test_cpu(last_cpu, &domain));

  	return cpu_physical_id(last_cpu);
  #else  /* CONFIG_SMP */
  	return cpu_physical_id(smp_processor_id());
  #endif
  }
  606. static inline unsigned char choose_dmode(void)
  607. {
  608. #ifdef CONFIG_SMP
  609. if (smp_int_redirect & SMP_IRQ_REDIRECTION)
  610. return IOSAPIC_LOWEST_PRIORITY;
  611. #endif
  612. return IOSAPIC_FIXED;
  613. }
  614. /*
  615. * ACPI can describe IOSAPIC interrupts via static tables and namespace
  616. * methods. This provides an interface to register those interrupts and
  617. * program the IOSAPIC RTE.
  618. */
  619. int
  620. iosapic_register_intr (unsigned int gsi,
  621. unsigned long polarity, unsigned long trigger)
  622. {
  623. int irq, mask = 1, err;
  624. unsigned int dest;
  625. unsigned long flags;
  626. struct iosapic_rte_info *rte;
  627. u32 low32;
  628. unsigned char dmode;
  629. struct irq_desc *desc;
  630. /*
  631. * If this GSI has already been registered (i.e., it's a
  632. * shared interrupt, or we lost a race to register it),
  633. * don't touch the RTE.
  634. */
  635. spin_lock_irqsave(&iosapic_lock, flags);
  636. irq = __gsi_to_irq(gsi);
  637. if (irq > 0) {
  638. rte = find_rte(irq, gsi);
  639. if(iosapic_intr_info[irq].count == 0) {
  640. assign_irq_vector(irq);
  641. irq_init_desc(irq);
  642. } else if (rte->refcnt != NO_REF_RTE) {
  643. rte->refcnt++;
  644. goto unlock_iosapic_lock;
  645. }
  646. } else
  647. irq = create_irq();
  648. /* If vector is running out, we try to find a sharable vector */
  649. if (irq < 0) {
  650. irq = iosapic_find_sharable_irq(trigger, polarity);
  651. if (irq < 0)
  652. goto unlock_iosapic_lock;
  653. }
  654. desc = irq_to_desc(irq);
  655. raw_spin_lock(&desc->lock);
  656. dest = get_target_cpu(gsi, irq);
  657. dmode = choose_dmode();
  658. err = register_intr(gsi, irq, dmode, polarity, trigger);
  659. if (err < 0) {
  660. raw_spin_unlock(&desc->lock);
  661. irq = err;
  662. goto unlock_iosapic_lock;
  663. }
  664. /*
  665. * If the vector is shared and already unmasked for other
  666. * interrupt sources, don't mask it.
  667. */
  668. low32 = iosapic_intr_info[irq].low32;
  669. if (irq_is_shared(irq) && !(low32 & IOSAPIC_MASK))
  670. mask = 0;
  671. set_rte(gsi, irq, dest, mask);
  672. printk(KERN_INFO "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d\n",
  673. gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
  674. (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
  675. cpu_logical_id(dest), dest, irq_to_vector(irq));
  676. raw_spin_unlock(&desc->lock);
  677. unlock_iosapic_lock:
  678. spin_unlock_irqrestore(&iosapic_lock, flags);
  679. return irq;
  680. }
  681. void
  682. iosapic_unregister_intr (unsigned int gsi)
  683. {
  684. unsigned long flags;
  685. int irq, index;
  686. u32 low32;
  687. unsigned long trigger, polarity;
  688. unsigned int dest;
  689. struct iosapic_rte_info *rte;
  690. /*
  691. * If the irq associated with the gsi is not found,
  692. * iosapic_unregister_intr() is unbalanced. We need to check
  693. * this again after getting locks.
  694. */
  695. irq = gsi_to_irq(gsi);
  696. if (irq < 0) {
  697. printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n",
  698. gsi);
  699. WARN_ON(1);
  700. return;
  701. }
  702. spin_lock_irqsave(&iosapic_lock, flags);
  703. if ((rte = find_rte(irq, gsi)) == NULL) {
  704. printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n",
  705. gsi);
  706. WARN_ON(1);
  707. goto out;
  708. }
  709. if (--rte->refcnt > 0)
  710. goto out;
  711. rte->refcnt = NO_REF_RTE;
  712. /* Mask the interrupt */
  713. low32 = iosapic_intr_info[irq].low32 | IOSAPIC_MASK;
  714. iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte->rte_index), low32);
  715. iosapic_intr_info[irq].count--;
  716. index = find_iosapic(gsi);
  717. iosapic_lists[index].rtes_inuse--;
  718. WARN_ON(iosapic_lists[index].rtes_inuse < 0);
  719. trigger = iosapic_intr_info[irq].trigger;
  720. polarity = iosapic_intr_info[irq].polarity;
  721. dest = iosapic_intr_info[irq].dest;
  722. printk(KERN_INFO
  723. "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d unregistered\n",
  724. gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
  725. (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
  726. cpu_logical_id(dest), dest, irq_to_vector(irq));
  727. if (iosapic_intr_info[irq].count == 0) {
  728. #ifdef CONFIG_SMP
  729. /* Clear affinity */
  730. cpumask_setall(irq_get_affinity_mask(irq));
  731. #endif
  732. /* Clear the interrupt information */
  733. iosapic_intr_info[irq].dest = 0;
  734. iosapic_intr_info[irq].dmode = 0;
  735. iosapic_intr_info[irq].polarity = 0;
  736. iosapic_intr_info[irq].trigger = 0;
  737. iosapic_intr_info[irq].low32 |= IOSAPIC_MASK;
  738. /* Destroy and reserve IRQ */
  739. destroy_and_reserve_irq(irq);
  740. }
  741. out:
  742. spin_unlock_irqrestore(&iosapic_lock, flags);
  743. }
  744. /*
  745. * ACPI calls this when it finds an entry for a platform interrupt.
  746. */
  747. int __init
  748. iosapic_register_platform_intr (u32 int_type, unsigned int gsi,
  749. int iosapic_vector, u16 eid, u16 id,
  750. unsigned long polarity, unsigned long trigger)
  751. {
  752. static const char * const name[] = {"unknown", "PMI", "INIT", "CPEI"};
  753. unsigned char delivery;
  754. int irq, vector, mask = 0;
  755. unsigned int dest = ((id << 8) | eid) & 0xffff;
  756. switch (int_type) {
  757. case ACPI_INTERRUPT_PMI:
  758. irq = vector = iosapic_vector;
  759. bind_irq_vector(irq, vector, CPU_MASK_ALL);
  760. /*
  761. * since PMI vector is alloc'd by FW(ACPI) not by kernel,
  762. * we need to make sure the vector is available
  763. */
  764. iosapic_reassign_vector(irq);
  765. delivery = IOSAPIC_PMI;
  766. break;
  767. case ACPI_INTERRUPT_INIT:
  768. irq = create_irq();
  769. if (irq < 0)
  770. panic("%s: out of interrupt vectors!\n", __func__);
  771. vector = irq_to_vector(irq);
  772. delivery = IOSAPIC_INIT;
  773. break;
  774. case ACPI_INTERRUPT_CPEI:
  775. irq = vector = IA64_CPE_VECTOR;
  776. BUG_ON(bind_irq_vector(irq, vector, CPU_MASK_ALL));
  777. delivery = IOSAPIC_FIXED;
  778. mask = 1;
  779. break;
  780. default:
  781. printk(KERN_ERR "%s: invalid int type 0x%x\n", __func__,
  782. int_type);
  783. return -1;
  784. }
  785. register_intr(gsi, irq, delivery, polarity, trigger);
  786. printk(KERN_INFO
  787. "PLATFORM int %s (0x%x): GSI %u (%s, %s) -> CPU %d (0x%04x)"
  788. " vector %d\n",
  789. int_type < ARRAY_SIZE(name) ? name[int_type] : "unknown",
  790. int_type, gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"),
  791. (polarity == IOSAPIC_POL_HIGH ? "high" : "low"),
  792. cpu_logical_id(dest), dest, vector);
  793. set_rte(gsi, irq, dest, mask);
  794. return vector;
  795. }
  796. /*
  797. * ACPI calls this when it finds an entry for a legacy ISA IRQ override.
  798. */
  799. void iosapic_override_isa_irq(unsigned int isa_irq, unsigned int gsi,
  800. unsigned long polarity, unsigned long trigger)
  801. {
  802. int vector, irq;
  803. unsigned int dest = cpu_physical_id(smp_processor_id());
  804. unsigned char dmode;
  805. irq = vector = isa_irq_to_vector(isa_irq);
  806. BUG_ON(bind_irq_vector(irq, vector, CPU_MASK_ALL));
  807. dmode = choose_dmode();
  808. register_intr(gsi, irq, dmode, polarity, trigger);
  809. DBG("ISA: IRQ %u -> GSI %u (%s,%s) -> CPU %d (0x%04x) vector %d\n",
  810. isa_irq, gsi, trigger == IOSAPIC_EDGE ? "edge" : "level",
  811. polarity == IOSAPIC_POL_HIGH ? "high" : "low",
  812. cpu_logical_id(dest), dest, vector);
  813. set_rte(gsi, irq, dest, 1);
  814. }
  815. void __init
  816. ia64_native_iosapic_pcat_compat_init(void)
  817. {
  818. if (pcat_compat) {
  819. /*
  820. * Disable the compatibility mode interrupts (8259 style),
  821. * needs IN/OUT support enabled.
  822. */
  823. printk(KERN_INFO
  824. "%s: Disabling PC-AT compatible 8259 interrupts\n",
  825. __func__);
  826. outb(0xff, 0xA1);
  827. outb(0xff, 0x21);
  828. }
  829. }
  830. void __init
  831. iosapic_system_init (int system_pcat_compat)
  832. {
  833. int irq;
  834. for (irq = 0; irq < NR_IRQS; ++irq) {
  835. iosapic_intr_info[irq].low32 = IOSAPIC_MASK;
  836. /* mark as unused */
  837. INIT_LIST_HEAD(&iosapic_intr_info[irq].rtes);
  838. iosapic_intr_info[irq].count = 0;
  839. }
  840. pcat_compat = system_pcat_compat;
  841. if (pcat_compat)
  842. iosapic_pcat_compat_init();
  843. }
  844. static inline int
  845. iosapic_alloc (void)
  846. {
  847. int index;
  848. for (index = 0; index < NR_IOSAPICS; index++)
  849. if (!iosapic_lists[index].addr)
  850. return index;
  851. printk(KERN_WARNING "%s: failed to allocate iosapic\n", __func__);
  852. return -1;
  853. }
  854. static inline void
  855. iosapic_free (int index)
  856. {
  857. memset(&iosapic_lists[index], 0, sizeof(iosapic_lists[0]));
  858. }
  859. static inline int
  860. iosapic_check_gsi_range (unsigned int gsi_base, unsigned int ver)
  861. {
  862. int index;
  863. unsigned int gsi_end, base, end;
  864. /* check gsi range */
  865. gsi_end = gsi_base + ((ver >> 16) & 0xff);
  866. for (index = 0; index < NR_IOSAPICS; index++) {
  867. if (!iosapic_lists[index].addr)
  868. continue;
  869. base = iosapic_lists[index].gsi_base;
  870. end = base + iosapic_lists[index].num_rte - 1;
  871. if (gsi_end < base || end < gsi_base)
  872. continue; /* OK */
  873. return -EBUSY;
  874. }
  875. return 0;
  876. }
  877. static int
  878. iosapic_delete_rte(unsigned int irq, unsigned int gsi)
  879. {
  880. struct iosapic_rte_info *rte, *temp;
  881. list_for_each_entry_safe(rte, temp, &iosapic_intr_info[irq].rtes,
  882. rte_list) {
  883. if (rte->iosapic->gsi_base + rte->rte_index == gsi) {
  884. if (rte->refcnt)
  885. return -EBUSY;
  886. list_del(&rte->rte_list);
  887. kfree(rte);
  888. return 0;
  889. }
  890. }
  891. return -EINVAL;
  892. }
  893. int iosapic_init(unsigned long phys_addr, unsigned int gsi_base)
  894. {
  895. int num_rte, err, index;
  896. unsigned int isa_irq, ver;
  897. char __iomem *addr;
  898. unsigned long flags;
  899. spin_lock_irqsave(&iosapic_lock, flags);
  900. index = find_iosapic(gsi_base);
  901. if (index >= 0) {
  902. spin_unlock_irqrestore(&iosapic_lock, flags);
  903. return -EBUSY;
  904. }
  905. addr = ioremap(phys_addr, 0);
  906. if (addr == NULL) {
  907. spin_unlock_irqrestore(&iosapic_lock, flags);
  908. return -ENOMEM;
  909. }
  910. ver = iosapic_version(addr);
  911. if ((err = iosapic_check_gsi_range(gsi_base, ver))) {
  912. iounmap(addr);
  913. spin_unlock_irqrestore(&iosapic_lock, flags);
  914. return err;
  915. }
  916. /*
  917. * The MAX_REDIR register holds the highest input pin number
  918. * (starting from 0). We add 1 so that we can use it for
  919. * number of pins (= RTEs)
  920. */
  921. num_rte = ((ver >> 16) & 0xff) + 1;
  922. index = iosapic_alloc();
  923. iosapic_lists[index].addr = addr;
  924. iosapic_lists[index].gsi_base = gsi_base;
  925. iosapic_lists[index].num_rte = num_rte;
  926. #ifdef CONFIG_NUMA
  927. iosapic_lists[index].node = MAX_NUMNODES;
  928. #endif
  929. spin_lock_init(&iosapic_lists[index].lock);
  930. spin_unlock_irqrestore(&iosapic_lock, flags);
  931. if ((gsi_base == 0) && pcat_compat) {
  932. /*
  933. * Map the legacy ISA devices into the IOSAPIC data. Some of
  934. * these may get reprogrammed later on with data from the ACPI
  935. * Interrupt Source Override table.
  936. */
  937. for (isa_irq = 0; isa_irq < 16; ++isa_irq)
  938. iosapic_override_isa_irq(isa_irq, isa_irq,
  939. IOSAPIC_POL_HIGH,
  940. IOSAPIC_EDGE);
  941. }
  942. return 0;
  943. }
  944. int iosapic_remove(unsigned int gsi_base)
  945. {
  946. int i, irq, index, err = 0;
  947. unsigned long flags;
  948. spin_lock_irqsave(&iosapic_lock, flags);
  949. index = find_iosapic(gsi_base);
  950. if (index < 0) {
  951. printk(KERN_WARNING "%s: No IOSAPIC for GSI base %u\n",
  952. __func__, gsi_base);
  953. goto out;
  954. }
  955. if (iosapic_lists[index].rtes_inuse) {
  956. err = -EBUSY;
  957. printk(KERN_WARNING "%s: IOSAPIC for GSI base %u is busy\n",
  958. __func__, gsi_base);
  959. goto out;
  960. }
  961. for (i = gsi_base; i < gsi_base + iosapic_lists[index].num_rte; i++) {
  962. irq = __gsi_to_irq(i);
  963. if (irq < 0)
  964. continue;
  965. err = iosapic_delete_rte(irq, i);
  966. if (err)
  967. goto out;
  968. }
  969. iounmap(iosapic_lists[index].addr);
  970. iosapic_free(index);
  971. out:
  972. spin_unlock_irqrestore(&iosapic_lock, flags);
  973. return err;
  974. }
  #ifdef CONFIG_NUMA
  /*
   * Record `node` as the NUMA node of the IOSAPIC that find_iosapic() returns
   * for gsi_base.  Logs a warning and changes nothing when there is none.
   */
  void map_iosapic_to_node(unsigned int gsi_base, int node)
  {
          int index = find_iosapic(gsi_base);

          if (index >= 0) {
                  iosapic_lists[index].node = node;
                  return;
          }

          printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n",
                 __func__, gsi_base);
  }
  #endif