KVM: enable PCI multiple-segments for pass-through device
[linux-2.6.git] / arch / powerpc / kvm / powerpc.c
blob51aedd7f16bcb14d5d2f073da2fc55a53ec18575
1 /*
2 * This program is free software; you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License, version 2, as
4 * published by the Free Software Foundation.
6 * This program is distributed in the hope that it will be useful,
7 * but WITHOUT ANY WARRANTY; without even the implied warranty of
8 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
9 * GNU General Public License for more details.
11 * You should have received a copy of the GNU General Public License
12 * along with this program; if not, write to the Free Software
13 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
15 * Copyright IBM Corp. 2007
17 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
18 * Christian Ehrhardt <ehrhardt@linux.vnet.ibm.com>
21 #include <linux/errno.h>
22 #include <linux/err.h>
23 #include <linux/kvm_host.h>
24 #include <linux/module.h>
25 #include <linux/vmalloc.h>
26 #include <linux/hrtimer.h>
27 #include <linux/fs.h>
28 #include <asm/cputable.h>
29 #include <asm/uaccess.h>
30 #include <asm/kvm_ppc.h>
31 #include <asm/tlbflush.h>
32 #include "timing.h"
33 #include "../mm/mmu_decl.h"
35 #define CREATE_TRACE_POINTS
36 #include "trace.h"
38 gfn_t unalias_gfn(struct kvm *kvm, gfn_t gfn)
40 return gfn;
43 int kvm_arch_vcpu_runnable(struct kvm_vcpu *v)
45 return !(v->arch.msr & MSR_WE) || !!(v->arch.pending_exceptions);
49 int kvmppc_emulate_mmio(struct kvm_run *run, struct kvm_vcpu *vcpu)
51 enum emulation_result er;
52 int r;
54 er = kvmppc_emulate_instruction(run, vcpu);
55 switch (er) {
56 case EMULATE_DONE:
57 /* Future optimization: only reload non-volatiles if they were
58 * actually modified. */
59 r = RESUME_GUEST_NV;
60 break;
61 case EMULATE_DO_MMIO:
62 run->exit_reason = KVM_EXIT_MMIO;
63 /* We must reload nonvolatiles because "update" load/store
64 * instructions modify register state. */
65 /* Future optimization: only reload non-volatiles if they were
66 * actually modified. */
67 r = RESUME_HOST_NV;
68 break;
69 case EMULATE_FAIL:
70 /* XXX Deliver Program interrupt to guest. */
71 printk(KERN_EMERG "%s: emulation failed (%08x)\n", __func__,
72 vcpu->arch.last_inst);
73 r = RESUME_HOST;
74 break;
75 default:
76 BUG();
79 return r;
/*
 * Arch hook with nothing to do here: @garbage is ignored and success (0)
 * is always reported.
 */
int kvm_arch_hardware_enable(void *garbage)
{
	(void)garbage;

	return 0;
}
/*
 * Arch hook with nothing to do here: @garbage is ignored.
 */
void kvm_arch_hardware_disable(void *garbage)
{
	(void)garbage;
}
/*
 * Arch hook with nothing to do here; always reports success (0).
 */
int kvm_arch_hardware_setup(void)
{
	const int status = 0;

	return status;
}
/*
 * Arch hook with nothing to do here.
 */
void kvm_arch_hardware_unsetup(void)
{
	/* intentionally empty */
}
/*
 * Store the result of kvmppc_core_check_processor_compat() into the int
 * that @rtn points to.
 */
void kvm_arch_check_processor_compat(void *rtn)
{
	int *result = rtn;

	*result = kvmppc_core_check_processor_compat();
}
105 struct kvm *kvm_arch_create_vm(void)
107 struct kvm *kvm;
109 kvm = kzalloc(sizeof(struct kvm), GFP_KERNEL);
110 if (!kvm)
111 return ERR_PTR(-ENOMEM);
113 return kvm;
116 static void kvmppc_free_vcpus(struct kvm *kvm)
118 unsigned int i;
119 struct kvm_vcpu *vcpu;
121 kvm_for_each_vcpu(i, vcpu, kvm)
122 kvm_arch_vcpu_free(vcpu);
124 mutex_lock(&kvm->lock);
125 for (i = 0; i < atomic_read(&kvm->online_vcpus); i++)
126 kvm->vcpus[i] = NULL;
128 atomic_set(&kvm->online_vcpus, 0);
129 mutex_unlock(&kvm->lock);
/*
 * Arch hook with nothing to do here: @kvm is ignored.
 */
void kvm_arch_sync_events(struct kvm *kvm)
{
	/* intentionally empty */
}
136 void kvm_arch_destroy_vm(struct kvm *kvm)
138 kvmppc_free_vcpus(kvm);
139 kvm_free_physmem(kvm);
140 cleanup_srcu_struct(&kvm->srcu);
141 kfree(kvm);
144 int kvm_dev_ioctl_check_extension(long ext)
146 int r;
148 switch (ext) {
149 case KVM_CAP_PPC_SEGSTATE:
150 r = 1;
151 break;
152 case KVM_CAP_COALESCED_MMIO:
153 r = KVM_COALESCED_MMIO_PAGE_OFFSET;
154 break;
155 default:
156 r = 0;
157 break;
159 return r;
/*
 * No arch-specific device ioctls are implemented: every request is
 * rejected with -EINVAL and none of the arguments are examined.
 */
long kvm_arch_dev_ioctl(struct file *filp,
			unsigned int ioctl, unsigned long arg)
{
	const long unsupported = -EINVAL;

	return unsupported;
}
169 int kvm_arch_prepare_memory_region(struct kvm *kvm,
170 struct kvm_memory_slot *memslot,
171 struct kvm_memory_slot old,
172 struct kvm_userspace_memory_region *mem,
173 int user_alloc)
175 return 0;
178 void kvm_arch_commit_memory_region(struct kvm *kvm,
179 struct kvm_userspace_memory_region *mem,
180 struct kvm_memory_slot old,
181 int user_alloc)
183 return;
/*
 * Arch hook with nothing to do here: @kvm is ignored.
 */
void kvm_arch_flush_shadow(struct kvm *kvm)
{
	/* intentionally empty */
}
/*
 * Create vcpu number @id for @kvm through the core backend and, on
 * success, register its debugfs entry.
 *
 * Returns whatever kvmppc_core_vcpu_create() returned. That value is
 * presumably an ERR_PTR() on failure (the convention kvm_arch_create_vm()
 * in this file follows), so it is checked with IS_ERR() before being
 * handed to the debugfs helper; an error pointer must never be
 * dereferenced as a vcpu.
 */
struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm, unsigned int id)
{
	struct kvm_vcpu *vcpu;

	vcpu = kvmppc_core_vcpu_create(kvm, id);
	if (!IS_ERR(vcpu))
		kvmppc_create_vcpu_debugfs(vcpu, id);

	return vcpu;
}
199 void kvm_arch_vcpu_free(struct kvm_vcpu *vcpu)
201 kvmppc_remove_vcpu_debugfs(vcpu);
202 kvmppc_core_vcpu_free(vcpu);
/*
 * Destroying a vcpu is the same operation as freeing it; this simply
 * forwards to kvm_arch_vcpu_free().
 */
void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu)
{
	kvm_arch_vcpu_free(vcpu);
}
/*
 * Pass through the answer of kvmppc_core_pending_dec() for @vcpu.
 */
int kvm_cpu_has_pending_timer(struct kvm_vcpu *vcpu)
{
	return kvmppc_core_pending_dec(vcpu);
}
215 static void kvmppc_decrementer_func(unsigned long data)
217 struct kvm_vcpu *vcpu = (struct kvm_vcpu *)data;
219 kvmppc_core_queue_dec(vcpu);
221 if (waitqueue_active(&vcpu->wq)) {
222 wake_up_interruptible(&vcpu->wq);
223 vcpu->stat.halt_wakeup++;
228 * low level hrtimer wake routine. Because this runs in hardirq context
229 * we schedule a tasklet to do the real work.
231 enum hrtimer_restart kvmppc_decrementer_wakeup(struct hrtimer *timer)
233 struct kvm_vcpu *vcpu;
235 vcpu = container_of(timer, struct kvm_vcpu, arch.dec_timer);
236 tasklet_schedule(&vcpu->arch.tasklet);
238 return HRTIMER_NORESTART;
241 int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu)
243 hrtimer_init(&vcpu->arch.dec_timer, CLOCK_REALTIME, HRTIMER_MODE_ABS);
244 tasklet_init(&vcpu->arch.tasklet, kvmppc_decrementer_func, (ulong)vcpu);
245 vcpu->arch.dec_timer.function = kvmppc_decrementer_wakeup;
247 return 0;
/*
 * Undo per-vcpu arch setup; the only step here is kvmppc_mmu_destroy().
 */
void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu)
{
	kvmppc_mmu_destroy(vcpu);
}
/*
 * Forward the load of @vcpu on @cpu to the core backend.
 */
void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu)
{
	kvmppc_core_vcpu_load(vcpu, cpu);
}
/*
 * Forward the put of @vcpu to the core backend.
 */
void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu)
{
	kvmppc_core_vcpu_put(vcpu);
}
/*
 * Guest debug configuration is not implemented here: the request is
 * rejected with -EINVAL and neither argument is examined.
 */
int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
					struct kvm_guest_debug *dbg)
{
	const int unsupported = -EINVAL;

	return unsupported;
}
271 static void kvmppc_complete_dcr_load(struct kvm_vcpu *vcpu,
272 struct kvm_run *run)
274 kvmppc_set_gpr(vcpu, vcpu->arch.io_gpr, run->dcr.data);
277 static void kvmppc_complete_mmio_load(struct kvm_vcpu *vcpu,
278 struct kvm_run *run)
280 ulong gpr;
282 if (run->mmio.len > sizeof(gpr)) {
283 printk(KERN_ERR "bad MMIO length: %d\n", run->mmio.len);
284 return;
287 if (vcpu->arch.mmio_is_bigendian) {
288 switch (run->mmio.len) {
289 case 4: gpr = *(u32 *)run->mmio.data; break;
290 case 2: gpr = *(u16 *)run->mmio.data; break;
291 case 1: gpr = *(u8 *)run->mmio.data; break;
293 } else {
294 /* Convert BE data from userland back to LE. */
295 switch (run->mmio.len) {
296 case 4: gpr = ld_le32((u32 *)run->mmio.data); break;
297 case 2: gpr = ld_le16((u16 *)run->mmio.data); break;
298 case 1: gpr = *(u8 *)run->mmio.data; break;
302 kvmppc_set_gpr(vcpu, vcpu->arch.io_gpr, gpr);
305 int kvmppc_handle_load(struct kvm_run *run, struct kvm_vcpu *vcpu,
306 unsigned int rt, unsigned int bytes, int is_bigendian)
308 if (bytes > sizeof(run->mmio.data)) {
309 printk(KERN_ERR "%s: bad MMIO length: %d\n", __func__,
310 run->mmio.len);
313 run->mmio.phys_addr = vcpu->arch.paddr_accessed;
314 run->mmio.len = bytes;
315 run->mmio.is_write = 0;
317 vcpu->arch.io_gpr = rt;
318 vcpu->arch.mmio_is_bigendian = is_bigendian;
319 vcpu->mmio_needed = 1;
320 vcpu->mmio_is_write = 0;
322 return EMULATE_DO_MMIO;
325 int kvmppc_handle_store(struct kvm_run *run, struct kvm_vcpu *vcpu,
326 u32 val, unsigned int bytes, int is_bigendian)
328 void *data = run->mmio.data;
330 if (bytes > sizeof(run->mmio.data)) {
331 printk(KERN_ERR "%s: bad MMIO length: %d\n", __func__,
332 run->mmio.len);
335 run->mmio.phys_addr = vcpu->arch.paddr_accessed;
336 run->mmio.len = bytes;
337 run->mmio.is_write = 1;
338 vcpu->mmio_needed = 1;
339 vcpu->mmio_is_write = 1;
341 /* Store the value at the lowest bytes in 'data'. */
342 if (is_bigendian) {
343 switch (bytes) {
344 case 4: *(u32 *)data = val; break;
345 case 2: *(u16 *)data = val; break;
346 case 1: *(u8 *)data = val; break;
348 } else {
349 /* Store LE value into 'data'. */
350 switch (bytes) {
351 case 4: st_le32(data, val); break;
352 case 2: st_le16(data, val); break;
353 case 1: *(u8 *)data = val; break;
357 return EMULATE_DO_MMIO;
360 int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *run)
362 int r;
363 sigset_t sigsaved;
365 vcpu_load(vcpu);
367 if (vcpu->sigset_active)
368 sigprocmask(SIG_SETMASK, &vcpu->sigset, &sigsaved);
370 if (vcpu->mmio_needed) {
371 if (!vcpu->mmio_is_write)
372 kvmppc_complete_mmio_load(vcpu, run);
373 vcpu->mmio_needed = 0;
374 } else if (vcpu->arch.dcr_needed) {
375 if (!vcpu->arch.dcr_is_write)
376 kvmppc_complete_dcr_load(vcpu, run);
377 vcpu->arch.dcr_needed = 0;
380 kvmppc_core_deliver_interrupts(vcpu);
382 local_irq_disable();
383 kvm_guest_enter();
384 r = __kvmppc_vcpu_run(run, vcpu);
385 kvm_guest_exit();
386 local_irq_enable();
388 if (vcpu->sigset_active)
389 sigprocmask(SIG_SETMASK, &sigsaved, NULL);
391 vcpu_put(vcpu);
393 return r;
396 int kvm_vcpu_ioctl_interrupt(struct kvm_vcpu *vcpu, struct kvm_interrupt *irq)
398 kvmppc_core_queue_external(vcpu, irq);
400 if (waitqueue_active(&vcpu->wq)) {
401 wake_up_interruptible(&vcpu->wq);
402 vcpu->stat.halt_wakeup++;
405 return 0;
/*
 * Reading the MP state is not implemented here: the request is rejected
 * with -EINVAL and @mp_state is not written.
 */
int kvm_arch_vcpu_ioctl_get_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state)
{
	const int unsupported = -EINVAL;

	return unsupported;
}
/*
 * Setting the MP state is not implemented here: the request is rejected
 * with -EINVAL and @mp_state is not read.
 */
int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state)
{
	const int unsupported = -EINVAL;

	return unsupported;
}
420 long kvm_arch_vcpu_ioctl(struct file *filp,
421 unsigned int ioctl, unsigned long arg)
423 struct kvm_vcpu *vcpu = filp->private_data;
424 void __user *argp = (void __user *)arg;
425 long r;
427 switch (ioctl) {
428 case KVM_INTERRUPT: {
429 struct kvm_interrupt irq;
430 r = -EFAULT;
431 if (copy_from_user(&irq, argp, sizeof(irq)))
432 goto out;
433 r = kvm_vcpu_ioctl_interrupt(vcpu, &irq);
434 break;
436 default:
437 r = -EINVAL;
440 out:
441 return r;
/*
 * No arch-specific VM ioctls are implemented: every request yields
 * -ENOTTY and none of the arguments are examined.
 */
long kvm_arch_vm_ioctl(struct file *filp,
		       unsigned int ioctl, unsigned long arg)
{
	return -ENOTTY;
}
/*
 * Arch init hook with nothing to do here: @opaque is ignored and
 * success (0) is always reported.
 */
int kvm_arch_init(void *opaque)
{
	(void)opaque;

	return 0;
}
462 void kvm_arch_exit(void)