4 * Copyright IBM, Corp. 2008
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU GPL, version 2 or later.
10 * See the COPYING file in the top-level directory.
14 #include <sys/types.h>
15 #include <sys/ioctl.h>
19 #include <linux/kvm.h>
21 #include "qemu-common.h"
/*
 * Debug tracing and file-scope declarations.
 *
 * dprintf: the first definition forwards its arguments to
 * fprintf(stderr, ...) wrapped in do/while(0) so it behaves as a single
 * statement.  A second definition of dprintf follows; its body and the
 * preprocessor conditional that presumably selects between the two are
 * not visible here -- TODO confirm against the full file.
 *
 * KVMSlot: shorthand for struct kvm_userspace_memory_region.
 */
28 #define dprintf(fmt, ...) \
29 do { fprintf(stderr, fmt, ## __VA_ARGS__); } while (0)
31 #define dprintf(fmt, ...) \
35 typedef struct kvm_userspace_memory_region KVMSlot
;
/* File-scope KVMState pointer; read by kvm_init_vcpu() and kvm_set_phys_mem(). */
46 static KVMState
*kvm_state
;
/*
 * kvm_alloc_slot: walk every entry of s->slots and test whether its
 * memory_size is 0.
 *
 * NOTE(review): the statements guarded by the "KVM private memory slots"
 * comment and the return statements are not visible here.  Presumably a
 * pointer to the first slot with memory_size == 0 is returned, and some
 * fallback value when none is found -- confirm against the full file.
 */
48 static KVMSlot
*kvm_alloc_slot(KVMState
*s
)
52 for (i
= 0; i
< ARRAY_SIZE(s
->slots
); i
++) {
53 /* KVM private memory slots */
56 if (s
->slots
[i
].memory_size
== 0)
/*
 * kvm_lookup_slot: walk every entry of s->slots and test whether
 * start_addr falls inside that slot's guest-physical range, i.e.
 *   guest_phys_addr <= start_addr < guest_phys_addr + memory_size.
 *
 * NOTE(review): the return statements are not visible here.  Presumably
 * the matching slot is returned, and some "not found" value otherwise --
 * confirm against the full file.
 */
63 static KVMSlot
*kvm_lookup_slot(KVMState
*s
, target_phys_addr_t start_addr
)
67 for (i
= 0; i
< ARRAY_SIZE(s
->slots
); i
++) {
68 KVMSlot
*mem
= &s
->slots
[i
];
/* Half-open interval test: the upper bound is exclusive. */
70 if (start_addr
>= mem
->guest_phys_addr
&&
71 start_addr
< (mem
->guest_phys_addr
+ mem
->memory_size
))
/*
 * kvm_init_vcpu: set up the KVM side of one virtual CPU.
 *
 * Visible steps, in order:
 *   1. KVM_CREATE_VCPU on the VM descriptor, passing env->cpu_index.
 *   2. KVM_GET_VCPU_MMAP_SIZE on the /dev/kvm descriptor.
 *   3. mmap() of mmap_size bytes, read/write and MAP_SHARED, stored in
 *      env->kvm_run; the result is compared against MAP_FAILED.
 *   4. kvm_arch_init_vcpu(env) for the architecture-specific part.
 *
 * NOTE(review): the conditions guarding the failure messages, the
 * remaining mmap() arguments and the return statement are not visible
 * here -- confirm against the full file.
 */
78 int kvm_init_vcpu(CPUState
*env
)
80 KVMState
*s
= kvm_state
;
84 dprintf("kvm_init_vcpu\n");
86 ret
= kvm_vm_ioctl(s
, KVM_CREATE_VCPU
, env
->cpu_index
);
88 dprintf("kvm_create_vcpu failed\n");
/* The mapping size is queried through kvm_ioctl(), i.e. on s->fd. */
95 mmap_size
= kvm_ioctl(s
, KVM_GET_VCPU_MMAP_SIZE
, 0);
97 dprintf("KVM_GET_VCPU_MMAP_SIZE failed\n");
101 env
->kvm_run
= mmap(NULL
, mmap_size
, PROT_READ
| PROT_WRITE
, MAP_SHARED
,
103 if (env
->kvm_run
== MAP_FAILED
) {
105 dprintf("mmap'ing vcpu state failed\n");
109 ret
= kvm_arch_init_vcpu(env
);
/*
 * kvm_init: open the KVM device and create the VM.
 *
 * Visible steps, in order:
 *   1. Allocate a KVMState with qemu_mallocz().
 *   2. Give every entry of s->slots its own index in the .slot field.
 *   3. open("/dev/kvm", O_RDWR) into s->fd.
 *   4. KVM_GET_API_VERSION; both an older and a newer value than
 *      KVM_API_VERSION are reported as errors.
 *   5. KVM_CREATE_VM into s->vmfd.
 *   6. KVM_CHECK_EXTENSION for KVM_CAP_USER_MEMORY.
 *   7. kvm_arch_init(s, smp_cpus).
 *
 * NOTE(review): the conditions on open()/KVM_CREATE_VM/extension
 * failures, any cleanup path, the assignment of the file-scope
 * kvm_state pointer and the return statement are not visible here --
 * confirm against the full file.
 */
115 int kvm_init(int smp_cpus
)
124 s
= qemu_mallocz(sizeof(KVMState
));
/* Each slot records its own position in the array. */
128 for (i
= 0; i
< ARRAY_SIZE(s
->slots
); i
++)
129 s
->slots
[i
].slot
= i
;
132 s
->fd
= open("/dev/kvm", O_RDWR
);
/* "%m" is a glibc printf extension that prints strerror(errno). */
134 fprintf(stderr
, "Could not access KVM kernel module: %m\n");
/* The reported API version must equal KVM_API_VERSION exactly. */
139 ret
= kvm_ioctl(s
, KVM_GET_API_VERSION
, 0);
140 if (ret
< KVM_API_VERSION
) {
143 fprintf(stderr
, "kvm version too old\n");
147 if (ret
> KVM_API_VERSION
) {
149 fprintf(stderr
, "kvm version not supported\n");
153 s
->vmfd
= kvm_ioctl(s
, KVM_CREATE_VM
, 0);
157 /* initially, KVM allocated its own memory and we had to jump through
158 * hooks to make phys_ram_base point to this. Modern versions of KVM
159 * just use a user allocated buffer so we can use phys_ram_base
160 * unmodified. Make sure we have a sufficiently modern version of KVM.
162 ret
= kvm_ioctl(s
, KVM_CHECK_EXTENSION
, KVM_CAP_USER_MEMORY
);
166 fprintf(stderr
, "kvm does not support KVM_CAP_USER_MEMORY\n");
170 ret
= kvm_arch_init(s
, smp_cpus
);
/*
 * kvm_handle_io: perform a port I/O access on behalf of the guest.
 *
 * The loop runs `count` times.  When direction == KVM_EXIT_IO_IN the
 * value read from `port` with cpu_inb/cpu_inw/cpu_inl is stored through
 * `ptr` with stb_p/stw_p/stl_p; otherwise the value loaded from `ptr`
 * with ldub_p/lduw_p/ldl_p is written to `port` with
 * cpu_outb/cpu_outw/cpu_outl.
 *
 * NOTE(review): the dispatch that picks the byte/word/long variant
 * (presumably keyed on `size`), the initialisation and advancing of
 * `ptr`, and the return value are not visible here -- confirm against
 * the full file.
 */
190 static int kvm_handle_io(CPUState
*env
, uint16_t port
, void *data
,
191 int direction
, int size
, uint32_t count
)
196 for (i
= 0; i
< count
; i
++) {
/* IN: device -> guest buffer. */
197 if (direction
== KVM_EXIT_IO_IN
) {
200 stb_p(ptr
, cpu_inb(env
, port
));
203 stw_p(ptr
, cpu_inw(env
, port
));
206 stl_p(ptr
, cpu_inl(env
, port
));
/* Otherwise: guest buffer -> device. */
212 cpu_outb(env
, port
, ldub_p(ptr
));
215 cpu_outw(env
, port
, lduw_p(ptr
));
218 cpu_outl(env
, port
, ldl_p(ptr
));
/*
 * kvm_cpu_exec: run the guest vCPU and dispatch on why it stopped.
 *
 * Visible flow:
 *   - kvm_arch_pre_run(), then a check of CPU_INTERRUPT_EXIT in
 *     env->interrupt_request before entering the guest.
 *   - KVM_RUN through kvm_vcpu_ioctl(), followed by kvm_arch_post_run().
 *   - -EINTR / -EAGAIN from KVM_RUN are handled separately from other
 *     failures, which are reported with strerror(-ret).
 *   - ret is reset to 0 and run->exit_reason is switched on: port I/O
 *     goes to kvm_handle_io(), MMIO to cpu_physical_memory_rw(),
 *     shutdown to qemu_system_reset_request(), and the fall-back to
 *     kvm_arch_handle_exit().
 *   - Afterwards a pending CPU_INTERRUPT_EXIT is cleared and
 *     env->exception_index is set to EXCP_INTERRUPT.
 *
 * NOTE(review): the "exit loop" comment implies an enclosing loop driven
 * by ret, but the loop construct, several case labels, the remaining
 * call arguments and the return statement are not visible here --
 * confirm against the full file.
 */
229 int kvm_cpu_exec(CPUState
*env
)
231 struct kvm_run
*run
= env
->kvm_run
;
234 dprintf("kvm_cpu_exec()\n");
237 kvm_arch_pre_run(env
, run
);
/* An exit request that is already pending is checked before KVM_RUN. */
239 if ((env
->interrupt_request
& CPU_INTERRUPT_EXIT
)) {
240 dprintf("interrupt exit requested\n");
245 ret
= kvm_vcpu_ioctl(env
, KVM_RUN
, 0);
246 kvm_arch_post_run(env
, run
);
/* Negative errno values: kvm_vcpu_ioctl() evidently reports -errno. */
248 if (ret
== -EINTR
|| ret
== -EAGAIN
) {
249 dprintf("io window exit\n");
255 dprintf("kvm run failed %s\n", strerror(-ret
));
259 ret
= 0; /* exit loop */
260 switch (run
->exit_reason
) {
262 dprintf("handle_io\n");
/* The I/O data lives inside the shared kvm_run mapping at io.data_offset. */
263 ret
= kvm_handle_io(env
, run
->io
.port
,
264 (uint8_t *)run
+ run
->io
.data_offset
,
270 dprintf("handle_mmio\n");
271 cpu_physical_memory_rw(run
->mmio
.phys_addr
,
277 case KVM_EXIT_IRQ_WINDOW_OPEN
:
278 dprintf("irq_window_open\n");
280 case KVM_EXIT_SHUTDOWN
:
281 dprintf("shutdown\n");
282 qemu_system_reset_request();
285 case KVM_EXIT_UNKNOWN
:
286 dprintf("kvm_exit_unknown\n");
288 case KVM_EXIT_FAIL_ENTRY
:
289 dprintf("kvm_exit_fail_entry\n");
291 case KVM_EXIT_EXCEPTION
:
292 dprintf("kvm_exit_exception\n");
295 dprintf("kvm_exit_debug\n");
298 dprintf("kvm_arch_handle_exit\n");
299 ret
= kvm_arch_handle_exit(env
, run
);
/* Consume the exit request and hand it to the caller as EXCP_INTERRUPT. */
304 if ((env
->interrupt_request
& CPU_INTERRUPT_EXIT
)) {
305 env
->interrupt_request
&= ~CPU_INTERRUPT_EXIT
;
306 env
->exception_index
= EXCP_INTERRUPT
;
/*
 * kvm_set_phys_mem: tell KVM about a change to the guest-physical memory
 * map starting at start_addr.
 *
 * phys_offset carries flag bits in its sub-page part: they are extracted
 * into `flags` with ~TARGET_PAGE_MASK, and IO_MEM_ROM is then cleared
 * from phys_offset because KVM has no read-only slots.
 *
 * Visible cases once the slot containing start_addr has been looked up:
 *   - flags mark the range as unassigned or MMIO: the slot is zeroed
 *     (memory_size = 0) and pushed to KVM.
 *   - the new range lies inside the existing slot: unless the existing
 *     mapping already matches, the whole slot is unregistered and the
 *     function calls itself to register a prefix, the new range and a
 *     suffix.
 *   - otherwise "Registering overlapping slot" is printed.
 * After that, a slot from kvm_alloc_slot() is filled in with size,
 * start_addr and phys_ram_base + phys_offset and registered.
 *
 * The results of the KVM_SET_USER_MEMORY_REGION calls are not stored
 * (see the FIXME at the end).
 *
 * NOTE(review): the line declaring the `size` parameter, the test on the
 * result of kvm_lookup_slot(), the bodies that follow the "already
 * matches" test and the `flags >= IO_MEM_UNASSIGNED` test, and any NULL
 * check on kvm_alloc_slot() are not visible here -- confirm against the
 * full file.
 */
312 void kvm_set_phys_mem(target_phys_addr_t start_addr
,
314 ram_addr_t phys_offset
)
316 KVMState
*s
= kvm_state
;
317 ram_addr_t flags
= phys_offset
& ~TARGET_PAGE_MASK
;
320 /* KVM does not support read-only slots */
321 phys_offset
&= ~IO_MEM_ROM
;
/* Find the slot, if any, that already covers start_addr. */
323 mem
= kvm_lookup_slot(s
, start_addr
);
/* Unassigned or MMIO: drop the slot by registering it with size 0. */
325 if ((flags
== IO_MEM_UNASSIGNED
) || (flags
>= TLB_MMIO
)) {
326 mem
->memory_size
= 0;
327 mem
->guest_phys_addr
= start_addr
;
328 mem
->userspace_addr
= 0;
331 kvm_vm_ioctl(s
, KVM_SET_USER_MEMORY_REGION
, mem
);
332 } else if (start_addr
>= mem
->guest_phys_addr
&&
333 (start_addr
+ size
) <= (mem
->guest_phys_addr
+
336 target_phys_addr_t mem_start
;
337 ram_addr_t mem_size
, mem_offset
;
/*
 * Compares the RAM offset the existing slot would give this address
 * with the requested phys_offset, i.e. "is it already mapped this way?".
 */
340 if ((phys_offset
- (start_addr
- mem
->guest_phys_addr
)) ==
341 ((uint8_t *)mem
->userspace_addr
- phys_ram_base
))
344 /* unregister whole slot */
345 memcpy(&slot
, mem
, sizeof(slot
));
346 mem
->memory_size
= 0;
347 kvm_vm_ioctl(s
, KVM_SET_USER_MEMORY_REGION
, mem
);
349 /* register prefix slot */
350 mem_start
= slot
.guest_phys_addr
;
351 mem_size
= start_addr
- slot
.guest_phys_addr
;
352 mem_offset
= (uint8_t *)slot
.userspace_addr
- phys_ram_base
;
354 kvm_set_phys_mem(mem_start
, mem_size
, mem_offset
);
356 /* register new slot */
357 kvm_set_phys_mem(start_addr
, size
, phys_offset
);
359 /* register suffix slot */
360 mem_start
= start_addr
+ size
;
361 mem_offset
+= mem_size
+ size
;
362 mem_size
= slot
.memory_size
- mem_size
- size
;
364 kvm_set_phys_mem(mem_start
, mem_size
, mem_offset
);
368 printf("Registering overlapping slot\n");
372 /* KVM does not need to know about this memory */
373 if (flags
>= IO_MEM_UNASSIGNED
)
/* Plain RAM: take a slot and point it at the host buffer. */
376 mem
= kvm_alloc_slot(s
);
377 mem
->memory_size
= size
;
378 mem
->guest_phys_addr
= start_addr
;
379 mem
->userspace_addr
= (unsigned long)(phys_ram_base
+ phys_offset
);
382 kvm_vm_ioctl(s
, KVM_SET_USER_MEMORY_REGION
, mem
);
383 /* FIXME deal with errors */
/*
 * kvm_ioctl: issue an ioctl on s->fd, the descriptor that kvm_init()
 * obtains by opening /dev/kvm.
 *
 * Exactly one variadic argument is fetched, as a void *, and passed
 * through to ioctl() unchanged.
 *
 * NOTE(review): va_start/va_end and the translation of the ioctl()
 * result into the return value are not visible here; callers compare
 * the result of the sibling kvm_vcpu_ioctl() with -EINTR, so a -errno
 * convention is presumably used -- confirm against the full file.
 */
386 int kvm_ioctl(KVMState
*s
, int type
, ...)
393 arg
= va_arg(ap
, void *);
396 ret
= ioctl(s
->fd
, type
, arg
);
/*
 * kvm_vm_ioctl: issue an ioctl on s->vmfd, the descriptor that
 * kvm_init() obtains from KVM_CREATE_VM.
 *
 * Exactly one variadic argument is fetched, as a void *, and passed
 * through to ioctl() unchanged.
 *
 * NOTE(review): va_start/va_end and the translation of the ioctl()
 * result into the return value are not visible here -- confirm against
 * the full file.
 */
403 int kvm_vm_ioctl(KVMState
*s
, int type
, ...)
410 arg
= va_arg(ap
, void *);
413 ret
= ioctl(s
->vmfd
, type
, arg
);
/*
 * kvm_vcpu_ioctl: issue an ioctl on env->kvm_fd, the per-vCPU
 * descriptor.
 *
 * Exactly one variadic argument is fetched, as a void *, and passed
 * through to ioctl() unchanged.
 *
 * NOTE(review): va_start/va_end and the translation of the ioctl()
 * result into the return value are not visible here.  kvm_cpu_exec()
 * compares this function's result with -EINTR and -EAGAIN, so a -errno
 * convention is presumably used -- confirm against the full file.
 */
420 int kvm_vcpu_ioctl(CPUState
*env
, int type
, ...)
427 arg
= va_arg(ap
, void *);
430 ret
= ioctl(env
->kvm_fd
, type
, arg
);