x86, x2apic: fix lock ordering during IRQ migration
[linux-2.6/linux-2.6-openrd.git] / drivers / pci / intr_remapping.c
blob5ffa65fffb6aa7e0eabd8fa734db716234cec0ee
1 #include <linux/interrupt.h>
2 #include <linux/dmar.h>
3 #include <linux/spinlock.h>
4 #include <linux/jiffies.h>
5 #include <linux/pci.h>
6 #include <linux/irq.h>
7 #include <asm/io_apic.h>
8 #include <asm/smp.h>
9 #include <asm/cpu.h>
10 #include <linux/intel-iommu.h>
11 #include "intr_remapping.h"
13 static struct ioapic_scope ir_ioapic[MAX_IO_APICS];
14 static int ir_ioapic_num;
15 int intr_remapping_enabled;
17 struct irq_2_iommu {
18 struct intel_iommu *iommu;
19 u16 irte_index;
20 u16 sub_handle;
21 u8 irte_mask;
24 #ifdef CONFIG_SPARSE_IRQ
25 static struct irq_2_iommu *get_one_free_irq_2_iommu(int cpu)
27 struct irq_2_iommu *iommu;
28 int node;
30 node = cpu_to_node(cpu);
32 iommu = kzalloc_node(sizeof(*iommu), GFP_ATOMIC, node);
33 printk(KERN_DEBUG "alloc irq_2_iommu on cpu %d node %d\n", cpu, node);
35 return iommu;
38 static struct irq_2_iommu *irq_2_iommu(unsigned int irq)
40 struct irq_desc *desc;
42 desc = irq_to_desc(irq);
44 if (WARN_ON_ONCE(!desc))
45 return NULL;
47 return desc->irq_2_iommu;
50 static struct irq_2_iommu *irq_2_iommu_alloc_cpu(unsigned int irq, int cpu)
52 struct irq_desc *desc;
53 struct irq_2_iommu *irq_iommu;
56 * alloc irq desc if not allocated already.
58 desc = irq_to_desc_alloc_cpu(irq, cpu);
59 if (!desc) {
60 printk(KERN_INFO "can not get irq_desc for %d\n", irq);
61 return NULL;
64 irq_iommu = desc->irq_2_iommu;
66 if (!irq_iommu)
67 desc->irq_2_iommu = get_one_free_irq_2_iommu(cpu);
69 return desc->irq_2_iommu;
72 static struct irq_2_iommu *irq_2_iommu_alloc(unsigned int irq)
74 return irq_2_iommu_alloc_cpu(irq, boot_cpu_id);
77 #else /* !CONFIG_SPARSE_IRQ */
79 static struct irq_2_iommu irq_2_iommuX[NR_IRQS];
81 static struct irq_2_iommu *irq_2_iommu(unsigned int irq)
83 if (irq < nr_irqs)
84 return &irq_2_iommuX[irq];
86 return NULL;
88 static struct irq_2_iommu *irq_2_iommu_alloc(unsigned int irq)
90 return irq_2_iommu(irq);
92 #endif
94 static DEFINE_SPINLOCK(irq_2_ir_lock);
96 static struct irq_2_iommu *valid_irq_2_iommu(unsigned int irq)
98 struct irq_2_iommu *irq_iommu;
100 irq_iommu = irq_2_iommu(irq);
102 if (!irq_iommu)
103 return NULL;
105 if (!irq_iommu->iommu)
106 return NULL;
108 return irq_iommu;
111 int irq_remapped(int irq)
113 return valid_irq_2_iommu(irq) != NULL;
116 int get_irte(int irq, struct irte *entry)
118 int index;
119 struct irq_2_iommu *irq_iommu;
120 unsigned long flags;
122 if (!entry)
123 return -1;
125 spin_lock_irqsave(&irq_2_ir_lock, flags);
126 irq_iommu = valid_irq_2_iommu(irq);
127 if (!irq_iommu) {
128 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
129 return -1;
132 index = irq_iommu->irte_index + irq_iommu->sub_handle;
133 *entry = *(irq_iommu->iommu->ir_table->base + index);
135 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
136 return 0;
139 int alloc_irte(struct intel_iommu *iommu, int irq, u16 count)
141 struct ir_table *table = iommu->ir_table;
142 struct irq_2_iommu *irq_iommu;
143 u16 index, start_index;
144 unsigned int mask = 0;
145 unsigned long flags;
146 int i;
148 if (!count)
149 return -1;
151 #ifndef CONFIG_SPARSE_IRQ
152 /* protect irq_2_iommu_alloc later */
153 if (irq >= nr_irqs)
154 return -1;
155 #endif
158 * start the IRTE search from index 0.
160 index = start_index = 0;
162 if (count > 1) {
163 count = __roundup_pow_of_two(count);
164 mask = ilog2(count);
167 if (mask > ecap_max_handle_mask(iommu->ecap)) {
168 printk(KERN_ERR
169 "Requested mask %x exceeds the max invalidation handle"
170 " mask value %Lx\n", mask,
171 ecap_max_handle_mask(iommu->ecap));
172 return -1;
175 spin_lock_irqsave(&irq_2_ir_lock, flags);
176 do {
177 for (i = index; i < index + count; i++)
178 if (table->base[i].present)
179 break;
180 /* empty index found */
181 if (i == index + count)
182 break;
184 index = (index + count) % INTR_REMAP_TABLE_ENTRIES;
186 if (index == start_index) {
187 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
188 printk(KERN_ERR "can't allocate an IRTE\n");
189 return -1;
191 } while (1);
193 for (i = index; i < index + count; i++)
194 table->base[i].present = 1;
196 irq_iommu = irq_2_iommu_alloc(irq);
197 if (!irq_iommu) {
198 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
199 printk(KERN_ERR "can't allocate irq_2_iommu\n");
200 return -1;
203 irq_iommu->iommu = iommu;
204 irq_iommu->irte_index = index;
205 irq_iommu->sub_handle = 0;
206 irq_iommu->irte_mask = mask;
208 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
210 return index;
213 static int qi_flush_iec(struct intel_iommu *iommu, int index, int mask)
215 struct qi_desc desc;
217 desc.low = QI_IEC_IIDEX(index) | QI_IEC_TYPE | QI_IEC_IM(mask)
218 | QI_IEC_SELECTIVE;
219 desc.high = 0;
221 return qi_submit_sync(&desc, iommu);
224 int map_irq_to_irte_handle(int irq, u16 *sub_handle)
226 int index;
227 struct irq_2_iommu *irq_iommu;
228 unsigned long flags;
230 spin_lock_irqsave(&irq_2_ir_lock, flags);
231 irq_iommu = valid_irq_2_iommu(irq);
232 if (!irq_iommu) {
233 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
234 return -1;
237 *sub_handle = irq_iommu->sub_handle;
238 index = irq_iommu->irte_index;
239 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
240 return index;
243 int set_irte_irq(int irq, struct intel_iommu *iommu, u16 index, u16 subhandle)
245 struct irq_2_iommu *irq_iommu;
246 unsigned long flags;
248 spin_lock_irqsave(&irq_2_ir_lock, flags);
250 irq_iommu = irq_2_iommu_alloc(irq);
252 if (!irq_iommu) {
253 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
254 printk(KERN_ERR "can't allocate irq_2_iommu\n");
255 return -1;
258 irq_iommu->iommu = iommu;
259 irq_iommu->irte_index = index;
260 irq_iommu->sub_handle = subhandle;
261 irq_iommu->irte_mask = 0;
263 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
265 return 0;
268 int clear_irte_irq(int irq, struct intel_iommu *iommu, u16 index)
270 struct irq_2_iommu *irq_iommu;
271 unsigned long flags;
273 spin_lock_irqsave(&irq_2_ir_lock, flags);
274 irq_iommu = valid_irq_2_iommu(irq);
275 if (!irq_iommu) {
276 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
277 return -1;
280 irq_iommu->iommu = NULL;
281 irq_iommu->irte_index = 0;
282 irq_iommu->sub_handle = 0;
283 irq_2_iommu(irq)->irte_mask = 0;
285 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
287 return 0;
290 int modify_irte(int irq, struct irte *irte_modified)
292 int rc;
293 int index;
294 struct irte *irte;
295 struct intel_iommu *iommu;
296 struct irq_2_iommu *irq_iommu;
297 unsigned long flags;
299 spin_lock_irqsave(&irq_2_ir_lock, flags);
300 irq_iommu = valid_irq_2_iommu(irq);
301 if (!irq_iommu) {
302 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
303 return -1;
306 iommu = irq_iommu->iommu;
308 index = irq_iommu->irte_index + irq_iommu->sub_handle;
309 irte = &iommu->ir_table->base[index];
311 set_64bit((unsigned long *)irte, irte_modified->low | (1 << 1));
312 __iommu_flush_cache(iommu, irte, sizeof(*irte));
314 rc = qi_flush_iec(iommu, index, 0);
315 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
317 return rc;
320 int flush_irte(int irq)
322 int rc;
323 int index;
324 struct intel_iommu *iommu;
325 struct irq_2_iommu *irq_iommu;
326 unsigned long flags;
328 spin_lock_irqsave(&irq_2_ir_lock, flags);
329 irq_iommu = valid_irq_2_iommu(irq);
330 if (!irq_iommu) {
331 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
332 return -1;
335 iommu = irq_iommu->iommu;
337 index = irq_iommu->irte_index + irq_iommu->sub_handle;
339 rc = qi_flush_iec(iommu, index, irq_iommu->irte_mask);
340 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
342 return rc;
345 struct intel_iommu *map_ioapic_to_ir(int apic)
347 int i;
349 for (i = 0; i < MAX_IO_APICS; i++)
350 if (ir_ioapic[i].id == apic)
351 return ir_ioapic[i].iommu;
352 return NULL;
355 struct intel_iommu *map_dev_to_ir(struct pci_dev *dev)
357 struct dmar_drhd_unit *drhd;
359 drhd = dmar_find_matched_drhd_unit(dev);
360 if (!drhd)
361 return NULL;
363 return drhd->iommu;
366 int free_irte(int irq)
368 int rc = 0;
369 int index, i;
370 struct irte *irte;
371 struct intel_iommu *iommu;
372 struct irq_2_iommu *irq_iommu;
373 unsigned long flags;
375 spin_lock_irqsave(&irq_2_ir_lock, flags);
376 irq_iommu = valid_irq_2_iommu(irq);
377 if (!irq_iommu) {
378 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
379 return -1;
382 iommu = irq_iommu->iommu;
384 index = irq_iommu->irte_index + irq_iommu->sub_handle;
385 irte = &iommu->ir_table->base[index];
387 if (!irq_iommu->sub_handle) {
388 for (i = 0; i < (1 << irq_iommu->irte_mask); i++)
389 set_64bit((unsigned long *)irte, 0);
390 rc = qi_flush_iec(iommu, index, irq_iommu->irte_mask);
393 irq_iommu->iommu = NULL;
394 irq_iommu->irte_index = 0;
395 irq_iommu->sub_handle = 0;
396 irq_iommu->irte_mask = 0;
398 spin_unlock_irqrestore(&irq_2_ir_lock, flags);
400 return rc;
403 static void iommu_set_intr_remapping(struct intel_iommu *iommu, int mode)
405 u64 addr;
406 u32 cmd, sts;
407 unsigned long flags;
409 addr = virt_to_phys((void *)iommu->ir_table->base);
411 spin_lock_irqsave(&iommu->register_lock, flags);
413 dmar_writeq(iommu->reg + DMAR_IRTA_REG,
414 (addr) | IR_X2APIC_MODE(mode) | INTR_REMAP_TABLE_REG_SIZE);
416 /* Set interrupt-remapping table pointer */
417 cmd = iommu->gcmd | DMA_GCMD_SIRTP;
418 writel(cmd, iommu->reg + DMAR_GCMD_REG);
420 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
421 readl, (sts & DMA_GSTS_IRTPS), sts);
422 spin_unlock_irqrestore(&iommu->register_lock, flags);
425 * global invalidation of interrupt entry cache before enabling
426 * interrupt-remapping.
428 qi_global_iec(iommu);
430 spin_lock_irqsave(&iommu->register_lock, flags);
432 /* Enable interrupt-remapping */
433 cmd = iommu->gcmd | DMA_GCMD_IRE;
434 iommu->gcmd |= DMA_GCMD_IRE;
435 writel(cmd, iommu->reg + DMAR_GCMD_REG);
437 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
438 readl, (sts & DMA_GSTS_IRES), sts);
440 spin_unlock_irqrestore(&iommu->register_lock, flags);
444 static int setup_intr_remapping(struct intel_iommu *iommu, int mode)
446 struct ir_table *ir_table;
447 struct page *pages;
449 ir_table = iommu->ir_table = kzalloc(sizeof(struct ir_table),
450 GFP_KERNEL);
452 if (!iommu->ir_table)
453 return -ENOMEM;
455 pages = alloc_pages(GFP_KERNEL | __GFP_ZERO, INTR_REMAP_PAGE_ORDER);
457 if (!pages) {
458 printk(KERN_ERR "failed to allocate pages of order %d\n",
459 INTR_REMAP_PAGE_ORDER);
460 kfree(iommu->ir_table);
461 return -ENOMEM;
464 ir_table->base = page_address(pages);
466 iommu_set_intr_remapping(iommu, mode);
467 return 0;
470 int __init enable_intr_remapping(int eim)
472 struct dmar_drhd_unit *drhd;
473 int setup = 0;
476 * check for the Interrupt-remapping support
478 for_each_drhd_unit(drhd) {
479 struct intel_iommu *iommu = drhd->iommu;
481 if (!ecap_ir_support(iommu->ecap))
482 continue;
484 if (eim && !ecap_eim_support(iommu->ecap)) {
485 printk(KERN_INFO "DRHD %Lx: EIM not supported by DRHD, "
486 " ecap %Lx\n", drhd->reg_base_addr, iommu->ecap);
487 return -1;
492 * Enable queued invalidation for all the DRHD's.
494 for_each_drhd_unit(drhd) {
495 int ret;
496 struct intel_iommu *iommu = drhd->iommu;
497 ret = dmar_enable_qi(iommu);
499 if (ret) {
500 printk(KERN_ERR "DRHD %Lx: failed to enable queued, "
501 " invalidation, ecap %Lx, ret %d\n",
502 drhd->reg_base_addr, iommu->ecap, ret);
503 return -1;
508 * Setup Interrupt-remapping for all the DRHD's now.
510 for_each_drhd_unit(drhd) {
511 struct intel_iommu *iommu = drhd->iommu;
513 if (!ecap_ir_support(iommu->ecap))
514 continue;
516 if (setup_intr_remapping(iommu, eim))
517 goto error;
519 setup = 1;
522 if (!setup)
523 goto error;
525 intr_remapping_enabled = 1;
527 return 0;
529 error:
531 * handle error condition gracefully here!
533 return -1;
536 static int ir_parse_ioapic_scope(struct acpi_dmar_header *header,
537 struct intel_iommu *iommu)
539 struct acpi_dmar_hardware_unit *drhd;
540 struct acpi_dmar_device_scope *scope;
541 void *start, *end;
543 drhd = (struct acpi_dmar_hardware_unit *)header;
545 start = (void *)(drhd + 1);
546 end = ((void *)drhd) + header->length;
548 while (start < end) {
549 scope = start;
550 if (scope->entry_type == ACPI_DMAR_SCOPE_TYPE_IOAPIC) {
551 if (ir_ioapic_num == MAX_IO_APICS) {
552 printk(KERN_WARNING "Exceeded Max IO APICS\n");
553 return -1;
556 printk(KERN_INFO "IOAPIC id %d under DRHD base"
557 " 0x%Lx\n", scope->enumeration_id,
558 drhd->address);
560 ir_ioapic[ir_ioapic_num].iommu = iommu;
561 ir_ioapic[ir_ioapic_num].id = scope->enumeration_id;
562 ir_ioapic_num++;
564 start += scope->length;
567 return 0;
571 * Finds the assocaition between IOAPIC's and its Interrupt-remapping
572 * hardware unit.
574 int __init parse_ioapics_under_ir(void)
576 struct dmar_drhd_unit *drhd;
577 int ir_supported = 0;
579 for_each_drhd_unit(drhd) {
580 struct intel_iommu *iommu = drhd->iommu;
582 if (ecap_ir_support(iommu->ecap)) {
583 if (ir_parse_ioapic_scope(drhd->hdr, iommu))
584 return -1;
586 ir_supported = 1;
590 if (ir_supported && ir_ioapic_num != nr_ioapics) {
591 printk(KERN_WARNING
592 "Not all IO-APIC's listed under remapping hardware\n");
593 return -1;
596 return ir_supported;