KVM: Search the LAPIC's for one that will accept a PIC interrupt
[linux-2.6/btrfs-unstable.git] / arch / x86 / kvm / i8259.c
blob819b748a33f9ff84c7660425cb1d3b28bf6cd404
1 /*
2 * 8259 interrupt controller emulation
4 * Copyright (c) 2003-2004 Fabrice Bellard
5 * Copyright (c) 2007 Intel Corporation
6 * Copyright 2009 Red Hat, Inc. and/or its affilates.
8 * Permission is hereby granted, free of charge, to any person obtaining a copy
9 * of this software and associated documentation files (the "Software"), to deal
10 * in the Software without restriction, including without limitation the rights
11 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
12 * copies of the Software, and to permit persons to whom the Software is
13 * furnished to do so, subject to the following conditions:
15 * The above copyright notice and this permission notice shall be included in
16 * all copies or substantial portions of the Software.
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
21 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
23 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
24 * THE SOFTWARE.
25 * Authors:
26 * Yaozu (Eddie) Dong <Eddie.dong@intel.com>
27 * Port from Qemu.
29 #include <linux/mm.h>
30 #include <linux/slab.h>
31 #include <linux/bitops.h>
32 #include "irq.h"
34 #include <linux/kvm_host.h>
35 #include "trace.h"
37 static void pic_irq_request(struct kvm *kvm, int level);
39 static void pic_lock(struct kvm_pic *s)
40 __acquires(&s->lock)
42 raw_spin_lock(&s->lock);
45 static void pic_unlock(struct kvm_pic *s)
46 __releases(&s->lock)
48 bool wakeup = s->wakeup_needed;
49 struct kvm_vcpu *vcpu, *found = NULL;
50 int i;
52 s->wakeup_needed = false;
54 raw_spin_unlock(&s->lock);
56 if (wakeup) {
57 kvm_for_each_vcpu(i, vcpu, s->kvm) {
58 if (kvm_apic_accept_pic_intr(vcpu)) {
59 found = vcpu;
60 break;
64 if (!found)
65 found = s->kvm->bsp_vcpu;
67 kvm_vcpu_kick(found);
71 static void pic_clear_isr(struct kvm_kpic_state *s, int irq)
73 s->isr &= ~(1 << irq);
74 s->isr_ack |= (1 << irq);
75 if (s != &s->pics_state->pics[0])
76 irq += 8;
78 * We are dropping lock while calling ack notifiers since ack
79 * notifier callbacks for assigned devices call into PIC recursively.
80 * Other interrupt may be delivered to PIC while lock is dropped but
81 * it should be safe since PIC state is already updated at this stage.
83 pic_unlock(s->pics_state);
84 kvm_notify_acked_irq(s->pics_state->kvm, SELECT_PIC(irq), irq);
85 pic_lock(s->pics_state);
88 void kvm_pic_clear_isr_ack(struct kvm *kvm)
90 struct kvm_pic *s = pic_irqchip(kvm);
92 pic_lock(s);
93 s->pics[0].isr_ack = 0xff;
94 s->pics[1].isr_ack = 0xff;
95 pic_unlock(s);
99 * set irq level. If an edge is detected, then the IRR is set to 1
101 static inline int pic_set_irq1(struct kvm_kpic_state *s, int irq, int level)
103 int mask, ret = 1;
104 mask = 1 << irq;
105 if (s->elcr & mask) /* level triggered */
106 if (level) {
107 ret = !(s->irr & mask);
108 s->irr |= mask;
109 s->last_irr |= mask;
110 } else {
111 s->irr &= ~mask;
112 s->last_irr &= ~mask;
114 else /* edge triggered */
115 if (level) {
116 if ((s->last_irr & mask) == 0) {
117 ret = !(s->irr & mask);
118 s->irr |= mask;
120 s->last_irr |= mask;
121 } else
122 s->last_irr &= ~mask;
124 return (s->imr & mask) ? -1 : ret;
128 * return the highest priority found in mask (highest = smallest
129 * number). Return 8 if no irq
131 static inline int get_priority(struct kvm_kpic_state *s, int mask)
133 int priority;
134 if (mask == 0)
135 return 8;
136 priority = 0;
137 while ((mask & (1 << ((priority + s->priority_add) & 7))) == 0)
138 priority++;
139 return priority;
143 * return the pic wanted interrupt. return -1 if none
145 static int pic_get_irq(struct kvm_kpic_state *s)
147 int mask, cur_priority, priority;
149 mask = s->irr & ~s->imr;
150 priority = get_priority(s, mask);
151 if (priority == 8)
152 return -1;
154 * compute current priority. If special fully nested mode on the
155 * master, the IRQ coming from the slave is not taken into account
156 * for the priority computation.
158 mask = s->isr;
159 if (s->special_fully_nested_mode && s == &s->pics_state->pics[0])
160 mask &= ~(1 << 2);
161 cur_priority = get_priority(s, mask);
162 if (priority < cur_priority)
164 * higher priority found: an irq should be generated
166 return (priority + s->priority_add) & 7;
167 else
168 return -1;
172 * raise irq to CPU if necessary. must be called every time the active
173 * irq may change
175 static void pic_update_irq(struct kvm_pic *s)
177 int irq2, irq;
179 irq2 = pic_get_irq(&s->pics[1]);
180 if (irq2 >= 0) {
182 * if irq request by slave pic, signal master PIC
184 pic_set_irq1(&s->pics[0], 2, 1);
185 pic_set_irq1(&s->pics[0], 2, 0);
187 irq = pic_get_irq(&s->pics[0]);
188 pic_irq_request(s->kvm, irq >= 0);
191 void kvm_pic_update_irq(struct kvm_pic *s)
193 pic_lock(s);
194 pic_update_irq(s);
195 pic_unlock(s);
198 int kvm_pic_set_irq(void *opaque, int irq, int level)
200 struct kvm_pic *s = opaque;
201 int ret = -1;
203 pic_lock(s);
204 if (irq >= 0 && irq < PIC_NUM_PINS) {
205 ret = pic_set_irq1(&s->pics[irq >> 3], irq & 7, level);
206 pic_update_irq(s);
207 trace_kvm_pic_set_irq(irq >> 3, irq & 7, s->pics[irq >> 3].elcr,
208 s->pics[irq >> 3].imr, ret == 0);
210 pic_unlock(s);
212 return ret;
216 * acknowledge interrupt 'irq'
218 static inline void pic_intack(struct kvm_kpic_state *s, int irq)
220 s->isr |= 1 << irq;
222 * We don't clear a level sensitive interrupt here
224 if (!(s->elcr & (1 << irq)))
225 s->irr &= ~(1 << irq);
227 if (s->auto_eoi) {
228 if (s->rotate_on_auto_eoi)
229 s->priority_add = (irq + 1) & 7;
230 pic_clear_isr(s, irq);
235 int kvm_pic_read_irq(struct kvm *kvm)
237 int irq, irq2, intno;
238 struct kvm_pic *s = pic_irqchip(kvm);
240 pic_lock(s);
241 irq = pic_get_irq(&s->pics[0]);
242 if (irq >= 0) {
243 pic_intack(&s->pics[0], irq);
244 if (irq == 2) {
245 irq2 = pic_get_irq(&s->pics[1]);
246 if (irq2 >= 0)
247 pic_intack(&s->pics[1], irq2);
248 else
250 * spurious IRQ on slave controller
252 irq2 = 7;
253 intno = s->pics[1].irq_base + irq2;
254 irq = irq2 + 8;
255 } else
256 intno = s->pics[0].irq_base + irq;
257 } else {
259 * spurious IRQ on host controller
261 irq = 7;
262 intno = s->pics[0].irq_base + irq;
264 pic_update_irq(s);
265 pic_unlock(s);
267 return intno;
270 void kvm_pic_reset(struct kvm_kpic_state *s)
272 int irq;
273 struct kvm_vcpu *vcpu0 = s->pics_state->kvm->bsp_vcpu;
274 u8 irr = s->irr, isr = s->imr;
276 s->last_irr = 0;
277 s->irr = 0;
278 s->imr = 0;
279 s->isr = 0;
280 s->isr_ack = 0xff;
281 s->priority_add = 0;
282 s->irq_base = 0;
283 s->read_reg_select = 0;
284 s->poll = 0;
285 s->special_mask = 0;
286 s->init_state = 0;
287 s->auto_eoi = 0;
288 s->rotate_on_auto_eoi = 0;
289 s->special_fully_nested_mode = 0;
290 s->init4 = 0;
292 for (irq = 0; irq < PIC_NUM_PINS/2; irq++) {
293 if (vcpu0 && kvm_apic_accept_pic_intr(vcpu0))
294 if (irr & (1 << irq) || isr & (1 << irq)) {
295 pic_clear_isr(s, irq);
300 static void pic_ioport_write(void *opaque, u32 addr, u32 val)
302 struct kvm_kpic_state *s = opaque;
303 int priority, cmd, irq;
305 addr &= 1;
306 if (addr == 0) {
307 if (val & 0x10) {
308 kvm_pic_reset(s); /* init */
310 * deassert a pending interrupt
312 pic_irq_request(s->pics_state->kvm, 0);
313 s->init_state = 1;
314 s->init4 = val & 1;
315 if (val & 0x02)
316 printk(KERN_ERR "single mode not supported");
317 if (val & 0x08)
318 printk(KERN_ERR
319 "level sensitive irq not supported");
320 } else if (val & 0x08) {
321 if (val & 0x04)
322 s->poll = 1;
323 if (val & 0x02)
324 s->read_reg_select = val & 1;
325 if (val & 0x40)
326 s->special_mask = (val >> 5) & 1;
327 } else {
328 cmd = val >> 5;
329 switch (cmd) {
330 case 0:
331 case 4:
332 s->rotate_on_auto_eoi = cmd >> 2;
333 break;
334 case 1: /* end of interrupt */
335 case 5:
336 priority = get_priority(s, s->isr);
337 if (priority != 8) {
338 irq = (priority + s->priority_add) & 7;
339 if (cmd == 5)
340 s->priority_add = (irq + 1) & 7;
341 pic_clear_isr(s, irq);
342 pic_update_irq(s->pics_state);
344 break;
345 case 3:
346 irq = val & 7;
347 pic_clear_isr(s, irq);
348 pic_update_irq(s->pics_state);
349 break;
350 case 6:
351 s->priority_add = (val + 1) & 7;
352 pic_update_irq(s->pics_state);
353 break;
354 case 7:
355 irq = val & 7;
356 s->priority_add = (irq + 1) & 7;
357 pic_clear_isr(s, irq);
358 pic_update_irq(s->pics_state);
359 break;
360 default:
361 break; /* no operation */
364 } else
365 switch (s->init_state) {
366 case 0: /* normal mode */
367 s->imr = val;
368 pic_update_irq(s->pics_state);
369 break;
370 case 1:
371 s->irq_base = val & 0xf8;
372 s->init_state = 2;
373 break;
374 case 2:
375 if (s->init4)
376 s->init_state = 3;
377 else
378 s->init_state = 0;
379 break;
380 case 3:
381 s->special_fully_nested_mode = (val >> 4) & 1;
382 s->auto_eoi = (val >> 1) & 1;
383 s->init_state = 0;
384 break;
388 static u32 pic_poll_read(struct kvm_kpic_state *s, u32 addr1)
390 int ret;
392 ret = pic_get_irq(s);
393 if (ret >= 0) {
394 if (addr1 >> 7) {
395 s->pics_state->pics[0].isr &= ~(1 << 2);
396 s->pics_state->pics[0].irr &= ~(1 << 2);
398 s->irr &= ~(1 << ret);
399 pic_clear_isr(s, ret);
400 if (addr1 >> 7 || ret != 2)
401 pic_update_irq(s->pics_state);
402 } else {
403 ret = 0x07;
404 pic_update_irq(s->pics_state);
407 return ret;
410 static u32 pic_ioport_read(void *opaque, u32 addr1)
412 struct kvm_kpic_state *s = opaque;
413 unsigned int addr;
414 int ret;
416 addr = addr1;
417 addr &= 1;
418 if (s->poll) {
419 ret = pic_poll_read(s, addr1);
420 s->poll = 0;
421 } else
422 if (addr == 0)
423 if (s->read_reg_select)
424 ret = s->isr;
425 else
426 ret = s->irr;
427 else
428 ret = s->imr;
429 return ret;
432 static void elcr_ioport_write(void *opaque, u32 addr, u32 val)
434 struct kvm_kpic_state *s = opaque;
435 s->elcr = val & s->elcr_mask;
438 static u32 elcr_ioport_read(void *opaque, u32 addr1)
440 struct kvm_kpic_state *s = opaque;
441 return s->elcr;
444 static int picdev_in_range(gpa_t addr)
446 switch (addr) {
447 case 0x20:
448 case 0x21:
449 case 0xa0:
450 case 0xa1:
451 case 0x4d0:
452 case 0x4d1:
453 return 1;
454 default:
455 return 0;
459 static inline struct kvm_pic *to_pic(struct kvm_io_device *dev)
461 return container_of(dev, struct kvm_pic, dev);
464 static int picdev_write(struct kvm_io_device *this,
465 gpa_t addr, int len, const void *val)
467 struct kvm_pic *s = to_pic(this);
468 unsigned char data = *(unsigned char *)val;
469 if (!picdev_in_range(addr))
470 return -EOPNOTSUPP;
472 if (len != 1) {
473 if (printk_ratelimit())
474 printk(KERN_ERR "PIC: non byte write\n");
475 return 0;
477 pic_lock(s);
478 switch (addr) {
479 case 0x20:
480 case 0x21:
481 case 0xa0:
482 case 0xa1:
483 pic_ioport_write(&s->pics[addr >> 7], addr, data);
484 break;
485 case 0x4d0:
486 case 0x4d1:
487 elcr_ioport_write(&s->pics[addr & 1], addr, data);
488 break;
490 pic_unlock(s);
491 return 0;
494 static int picdev_read(struct kvm_io_device *this,
495 gpa_t addr, int len, void *val)
497 struct kvm_pic *s = to_pic(this);
498 unsigned char data = 0;
499 if (!picdev_in_range(addr))
500 return -EOPNOTSUPP;
502 if (len != 1) {
503 if (printk_ratelimit())
504 printk(KERN_ERR "PIC: non byte read\n");
505 return 0;
507 pic_lock(s);
508 switch (addr) {
509 case 0x20:
510 case 0x21:
511 case 0xa0:
512 case 0xa1:
513 data = pic_ioport_read(&s->pics[addr >> 7], addr);
514 break;
515 case 0x4d0:
516 case 0x4d1:
517 data = elcr_ioport_read(&s->pics[addr & 1], addr);
518 break;
520 *(unsigned char *)val = data;
521 pic_unlock(s);
522 return 0;
526 * callback when PIC0 irq status changed
528 static void pic_irq_request(struct kvm *kvm, int level)
530 struct kvm_vcpu *vcpu = kvm->bsp_vcpu;
531 struct kvm_pic *s = pic_irqchip(kvm);
532 int irq = pic_get_irq(&s->pics[0]);
534 s->output = level;
535 if (vcpu && level && (s->pics[0].isr_ack & (1 << irq))) {
536 s->pics[0].isr_ack &= ~(1 << irq);
537 s->wakeup_needed = true;
541 static const struct kvm_io_device_ops picdev_ops = {
542 .read = picdev_read,
543 .write = picdev_write,
546 struct kvm_pic *kvm_create_pic(struct kvm *kvm)
548 struct kvm_pic *s;
549 int ret;
551 s = kzalloc(sizeof(struct kvm_pic), GFP_KERNEL);
552 if (!s)
553 return NULL;
554 raw_spin_lock_init(&s->lock);
555 s->kvm = kvm;
556 s->pics[0].elcr_mask = 0xf8;
557 s->pics[1].elcr_mask = 0xde;
558 s->pics[0].pics_state = s;
559 s->pics[1].pics_state = s;
562 * Initialize PIO device
564 kvm_iodevice_init(&s->dev, &picdev_ops);
565 mutex_lock(&kvm->slots_lock);
566 ret = kvm_io_bus_register_dev(kvm, KVM_PIO_BUS, &s->dev);
567 mutex_unlock(&kvm->slots_lock);
568 if (ret < 0) {
569 kfree(s);
570 return NULL;
573 return s;
576 void kvm_destroy_pic(struct kvm *kvm)
578 struct kvm_pic *vpic = kvm->arch.vpic;
580 if (vpic) {
581 kvm_io_bus_unregister_dev(kvm, KVM_PIO_BUS, &vpic->dev);
582 kvm->arch.vpic = NULL;
583 kfree(vpic);