4 * Copyright (c) 2003-2008 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
25 /* Needed early for CONFIG_BSD etc. */
26 #include "config-host.h"
33 #include "qmp-commands.h"
35 #include "qemu-thread.h"
38 #include "main-loop.h"
47 #include <sys/prctl.h>
50 #define PR_MCE_KILL 33
53 #ifndef PR_MCE_KILL_SET
54 #define PR_MCE_KILL_SET 1
57 #ifndef PR_MCE_KILL_EARLY
58 #define PR_MCE_KILL_EARLY 1
61 #endif /* CONFIG_LINUX */
63 static CPUArchState
*next_cpu
;
65 static bool cpu_thread_is_idle(CPUArchState
*env
)
67 if (env
->stop
|| env
->queued_work_first
) {
70 if (env
->stopped
|| !runstate_is_running()) {
73 if (!env
->halted
|| qemu_cpu_has_work(env
) || kvm_irqchip_in_kernel()) {
79 static bool all_cpu_threads_idle(void)
83 for (env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
84 if (!cpu_thread_is_idle(env
)) {
91 /***********************************************************/
92 /* guest cycle counter */
94 /* Conversion factor from emulated instructions to virtual clock ticks. */
95 static int icount_time_shift
;
96 /* Arbitrarily pick 1MIPS as the minimum allowable speed. */
97 #define MAX_ICOUNT_SHIFT 10
98 /* Compensate for varying guest execution speed. */
99 static int64_t qemu_icount_bias
;
100 static QEMUTimer
*icount_rt_timer
;
101 static QEMUTimer
*icount_vm_timer
;
102 static QEMUTimer
*icount_warp_timer
;
103 static int64_t vm_clock_warp_start
;
104 static int64_t qemu_icount
;
106 typedef struct TimersState
{
107 int64_t cpu_ticks_prev
;
108 int64_t cpu_ticks_offset
;
109 int64_t cpu_clock_offset
;
110 int32_t cpu_ticks_enabled
;
114 TimersState timers_state
;
116 /* Return the virtual CPU time, based on the instruction counter. */
117 int64_t cpu_get_icount(void)
120 CPUArchState
*env
= cpu_single_env
;
122 icount
= qemu_icount
;
124 if (!can_do_io(env
)) {
125 fprintf(stderr
, "Bad clock read\n");
127 icount
-= (env
->icount_decr
.u16
.low
+ env
->icount_extra
);
129 return qemu_icount_bias
+ (icount
<< icount_time_shift
);
132 /* return the host CPU cycle counter and handle stop/restart */
133 int64_t cpu_get_ticks(void)
136 return cpu_get_icount();
138 if (!timers_state
.cpu_ticks_enabled
) {
139 return timers_state
.cpu_ticks_offset
;
142 ticks
= cpu_get_real_ticks();
143 if (timers_state
.cpu_ticks_prev
> ticks
) {
144 /* Note: non increasing ticks may happen if the host uses
146 timers_state
.cpu_ticks_offset
+= timers_state
.cpu_ticks_prev
- ticks
;
148 timers_state
.cpu_ticks_prev
= ticks
;
149 return ticks
+ timers_state
.cpu_ticks_offset
;
153 /* return the host CPU monotonic timer and handle stop/restart */
154 int64_t cpu_get_clock(void)
157 if (!timers_state
.cpu_ticks_enabled
) {
158 return timers_state
.cpu_clock_offset
;
161 return ti
+ timers_state
.cpu_clock_offset
;
165 /* enable cpu_get_ticks() */
166 void cpu_enable_ticks(void)
168 if (!timers_state
.cpu_ticks_enabled
) {
169 timers_state
.cpu_ticks_offset
-= cpu_get_real_ticks();
170 timers_state
.cpu_clock_offset
-= get_clock();
171 timers_state
.cpu_ticks_enabled
= 1;
175 /* disable cpu_get_ticks() : the clock is stopped. You must not call
176 cpu_get_ticks() after that. */
177 void cpu_disable_ticks(void)
179 if (timers_state
.cpu_ticks_enabled
) {
180 timers_state
.cpu_ticks_offset
= cpu_get_ticks();
181 timers_state
.cpu_clock_offset
= cpu_get_clock();
182 timers_state
.cpu_ticks_enabled
= 0;
186 /* Correlation between real and virtual time is always going to be
187 fairly approximate, so ignore small variation.
188 When the guest is idle real and virtual time will be aligned in
190 #define ICOUNT_WOBBLE (get_ticks_per_sec() / 10)
192 static void icount_adjust(void)
197 static int64_t last_delta
;
198 /* If the VM is not running, then do nothing. */
199 if (!runstate_is_running()) {
202 cur_time
= cpu_get_clock();
203 cur_icount
= qemu_get_clock_ns(vm_clock
);
204 delta
= cur_icount
- cur_time
;
205 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
207 && last_delta
+ ICOUNT_WOBBLE
< delta
* 2
208 && icount_time_shift
> 0) {
209 /* The guest is getting too far ahead. Slow time down. */
213 && last_delta
- ICOUNT_WOBBLE
> delta
* 2
214 && icount_time_shift
< MAX_ICOUNT_SHIFT
) {
215 /* The guest is getting too far behind. Speed time up. */
219 qemu_icount_bias
= cur_icount
- (qemu_icount
<< icount_time_shift
);
222 static void icount_adjust_rt(void *opaque
)
224 qemu_mod_timer(icount_rt_timer
,
225 qemu_get_clock_ms(rt_clock
) + 1000);
229 static void icount_adjust_vm(void *opaque
)
231 qemu_mod_timer(icount_vm_timer
,
232 qemu_get_clock_ns(vm_clock
) + get_ticks_per_sec() / 10);
236 static int64_t qemu_icount_round(int64_t count
)
238 return (count
+ (1 << icount_time_shift
) - 1) >> icount_time_shift
;
241 static void icount_warp_rt(void *opaque
)
243 if (vm_clock_warp_start
== -1) {
247 if (runstate_is_running()) {
248 int64_t clock
= qemu_get_clock_ns(rt_clock
);
249 int64_t warp_delta
= clock
- vm_clock_warp_start
;
250 if (use_icount
== 1) {
251 qemu_icount_bias
+= warp_delta
;
254 * In adaptive mode, do not let the vm_clock run too
255 * far ahead of real time.
257 int64_t cur_time
= cpu_get_clock();
258 int64_t cur_icount
= qemu_get_clock_ns(vm_clock
);
259 int64_t delta
= cur_time
- cur_icount
;
260 qemu_icount_bias
+= MIN(warp_delta
, delta
);
262 if (qemu_clock_expired(vm_clock
)) {
266 vm_clock_warp_start
= -1;
269 void qtest_clock_warp(int64_t dest
)
271 int64_t clock
= qemu_get_clock_ns(vm_clock
);
272 assert(qtest_enabled());
273 while (clock
< dest
) {
274 int64_t deadline
= qemu_clock_deadline(vm_clock
);
275 int64_t warp
= MIN(dest
- clock
, deadline
);
276 qemu_icount_bias
+= warp
;
277 qemu_run_timers(vm_clock
);
278 clock
= qemu_get_clock_ns(vm_clock
);
283 void qemu_clock_warp(QEMUClock
*clock
)
288 * There are too many global variables to make the "warp" behavior
289 * applicable to other clocks. But a clock argument removes the
290 * need for if statements all over the place.
292 if (clock
!= vm_clock
|| !use_icount
) {
297 * If the CPUs have been sleeping, advance the vm_clock timer now. This
298 * ensures that the deadline for the timer is computed correctly below.
299 * This also makes sure that the insn counter is synchronized before the
300 * CPU starts running, in case the CPU is woken by an event other than
301 * the earliest vm_clock timer.
303 icount_warp_rt(NULL
);
304 if (!all_cpu_threads_idle() || !qemu_clock_has_timers(vm_clock
)) {
305 qemu_del_timer(icount_warp_timer
);
309 if (qtest_enabled()) {
310 /* When testing, qtest commands advance icount. */
314 vm_clock_warp_start
= qemu_get_clock_ns(rt_clock
);
315 deadline
= qemu_clock_deadline(vm_clock
);
318 * Ensure the vm_clock proceeds even when the virtual CPU goes to
319 * sleep. Otherwise, the CPU might be waiting for a future timer
320 * interrupt to wake it up, but the interrupt never comes because
321 * the vCPU isn't running any insns and thus doesn't advance the
324 * An extreme solution for this problem would be to never let VCPUs
325 * sleep in icount mode if there is a pending vm_clock timer; rather
326 * time could just advance to the next vm_clock event. Instead, we
327 * do stop VCPUs and only advance vm_clock after some "real" time,
328 * (related to the time left until the next event) has passed. This
329 * rt_clock timer will do this. This avoids that the warps are too
330 * visible externally---for example, you will not be sending network
331 * packets continuously instead of every 100ms.
333 qemu_mod_timer(icount_warp_timer
, vm_clock_warp_start
+ deadline
);
339 static const VMStateDescription vmstate_timers
= {
342 .minimum_version_id
= 1,
343 .minimum_version_id_old
= 1,
344 .fields
= (VMStateField
[]) {
345 VMSTATE_INT64(cpu_ticks_offset
, TimersState
),
346 VMSTATE_INT64(dummy
, TimersState
),
347 VMSTATE_INT64_V(cpu_clock_offset
, TimersState
, 2),
348 VMSTATE_END_OF_LIST()
352 void configure_icount(const char *option
)
354 vmstate_register(NULL
, 0, &vmstate_timers
, &timers_state
);
359 icount_warp_timer
= qemu_new_timer_ns(rt_clock
, icount_warp_rt
, NULL
);
360 if (strcmp(option
, "auto") != 0) {
361 icount_time_shift
= strtol(option
, NULL
, 0);
368 /* 125MIPS seems a reasonable initial guess at the guest speed.
369 It will be corrected fairly quickly anyway. */
370 icount_time_shift
= 3;
372 /* Have both realtime and virtual time triggers for speed adjustment.
373 The realtime trigger catches emulated time passing too slowly,
374 the virtual time trigger catches emulated time passing too fast.
375 Realtime triggers occur even when idle, so use them less frequently
377 icount_rt_timer
= qemu_new_timer_ms(rt_clock
, icount_adjust_rt
, NULL
);
378 qemu_mod_timer(icount_rt_timer
,
379 qemu_get_clock_ms(rt_clock
) + 1000);
380 icount_vm_timer
= qemu_new_timer_ns(vm_clock
, icount_adjust_vm
, NULL
);
381 qemu_mod_timer(icount_vm_timer
,
382 qemu_get_clock_ns(vm_clock
) + get_ticks_per_sec() / 10);
385 /***********************************************************/
386 void hw_error(const char *fmt
, ...)
392 fprintf(stderr
, "qemu: hardware error: ");
393 vfprintf(stderr
, fmt
, ap
);
394 fprintf(stderr
, "\n");
395 for(env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
396 fprintf(stderr
, "CPU #%d:\n", env
->cpu_index
);
398 cpu_dump_state(env
, stderr
, fprintf
, X86_DUMP_FPU
);
400 cpu_dump_state(env
, stderr
, fprintf
, 0);
407 void cpu_synchronize_all_states(void)
411 for (cpu
= first_cpu
; cpu
; cpu
= cpu
->next_cpu
) {
412 cpu_synchronize_state(cpu
);
416 void cpu_synchronize_all_post_reset(void)
420 for (cpu
= first_cpu
; cpu
; cpu
= cpu
->next_cpu
) {
421 cpu_synchronize_post_reset(cpu
);
425 void cpu_synchronize_all_post_init(void)
429 for (cpu
= first_cpu
; cpu
; cpu
= cpu
->next_cpu
) {
430 cpu_synchronize_post_init(cpu
);
434 int cpu_is_stopped(CPUArchState
*env
)
436 return !runstate_is_running() || env
->stopped
;
439 static void do_vm_stop(RunState state
)
441 if (runstate_is_running()) {
445 vm_state_notify(0, state
);
448 monitor_protocol_event(QEVENT_STOP
, NULL
);
452 static int cpu_can_run(CPUArchState
*env
)
457 if (env
->stopped
|| !runstate_is_running()) {
463 static void cpu_handle_guest_debug(CPUArchState
*env
)
465 gdb_set_stop_cpu(env
);
466 qemu_system_debug_request();
470 static void cpu_signal(int sig
)
472 if (cpu_single_env
) {
473 cpu_exit(cpu_single_env
);
479 static void sigbus_reraise(void)
482 struct sigaction action
;
484 memset(&action
, 0, sizeof(action
));
485 action
.sa_handler
= SIG_DFL
;
486 if (!sigaction(SIGBUS
, &action
, NULL
)) {
489 sigaddset(&set
, SIGBUS
);
490 sigprocmask(SIG_UNBLOCK
, &set
, NULL
);
492 perror("Failed to re-raise SIGBUS!\n");
496 static void sigbus_handler(int n
, struct qemu_signalfd_siginfo
*siginfo
,
499 if (kvm_on_sigbus(siginfo
->ssi_code
,
500 (void *)(intptr_t)siginfo
->ssi_addr
)) {
505 static void qemu_init_sigbus(void)
507 struct sigaction action
;
509 memset(&action
, 0, sizeof(action
));
510 action
.sa_flags
= SA_SIGINFO
;
511 action
.sa_sigaction
= (void (*)(int, siginfo_t
*, void*))sigbus_handler
;
512 sigaction(SIGBUS
, &action
, NULL
);
514 prctl(PR_MCE_KILL
, PR_MCE_KILL_SET
, PR_MCE_KILL_EARLY
, 0, 0);
517 static void qemu_kvm_eat_signals(CPUArchState
*env
)
519 struct timespec ts
= { 0, 0 };
525 sigemptyset(&waitset
);
526 sigaddset(&waitset
, SIG_IPI
);
527 sigaddset(&waitset
, SIGBUS
);
530 r
= sigtimedwait(&waitset
, &siginfo
, &ts
);
531 if (r
== -1 && !(errno
== EAGAIN
|| errno
== EINTR
)) {
532 perror("sigtimedwait");
538 if (kvm_on_sigbus_vcpu(env
, siginfo
.si_code
, siginfo
.si_addr
)) {
546 r
= sigpending(&chkset
);
548 perror("sigpending");
551 } while (sigismember(&chkset
, SIG_IPI
) || sigismember(&chkset
, SIGBUS
));
554 #else /* !CONFIG_LINUX */
556 static void qemu_init_sigbus(void)
560 static void qemu_kvm_eat_signals(CPUArchState
*env
)
563 #endif /* !CONFIG_LINUX */
566 static void dummy_signal(int sig
)
570 static void qemu_kvm_init_cpu_signals(CPUArchState
*env
)
574 struct sigaction sigact
;
576 memset(&sigact
, 0, sizeof(sigact
));
577 sigact
.sa_handler
= dummy_signal
;
578 sigaction(SIG_IPI
, &sigact
, NULL
);
580 pthread_sigmask(SIG_BLOCK
, NULL
, &set
);
581 sigdelset(&set
, SIG_IPI
);
582 sigdelset(&set
, SIGBUS
);
583 r
= kvm_set_signal_mask(env
, &set
);
585 fprintf(stderr
, "kvm_set_signal_mask: %s\n", strerror(-r
));
590 static void qemu_tcg_init_cpu_signals(void)
593 struct sigaction sigact
;
595 memset(&sigact
, 0, sizeof(sigact
));
596 sigact
.sa_handler
= cpu_signal
;
597 sigaction(SIG_IPI
, &sigact
, NULL
);
600 sigaddset(&set
, SIG_IPI
);
601 pthread_sigmask(SIG_UNBLOCK
, &set
, NULL
);
605 static void qemu_kvm_init_cpu_signals(CPUArchState
*env
)
610 static void qemu_tcg_init_cpu_signals(void)
615 QemuMutex qemu_global_mutex
;
616 static QemuCond qemu_io_proceeded_cond
;
617 static bool iothread_requesting_mutex
;
619 static QemuThread io_thread
;
621 static QemuThread
*tcg_cpu_thread
;
622 static QemuCond
*tcg_halt_cond
;
625 static QemuCond qemu_cpu_cond
;
627 static QemuCond qemu_pause_cond
;
628 static QemuCond qemu_work_cond
;
630 void qemu_init_cpu_loop(void)
633 qemu_cond_init(&qemu_cpu_cond
);
634 qemu_cond_init(&qemu_pause_cond
);
635 qemu_cond_init(&qemu_work_cond
);
636 qemu_cond_init(&qemu_io_proceeded_cond
);
637 qemu_mutex_init(&qemu_global_mutex
);
639 qemu_thread_get_self(&io_thread
);
642 void run_on_cpu(CPUArchState
*env
, void (*func
)(void *data
), void *data
)
644 struct qemu_work_item wi
;
646 if (qemu_cpu_is_self(env
)) {
653 if (!env
->queued_work_first
) {
654 env
->queued_work_first
= &wi
;
656 env
->queued_work_last
->next
= &wi
;
658 env
->queued_work_last
= &wi
;
664 CPUArchState
*self_env
= cpu_single_env
;
666 qemu_cond_wait(&qemu_work_cond
, &qemu_global_mutex
);
667 cpu_single_env
= self_env
;
671 static void flush_queued_work(CPUArchState
*env
)
673 struct qemu_work_item
*wi
;
675 if (!env
->queued_work_first
) {
679 while ((wi
= env
->queued_work_first
)) {
680 env
->queued_work_first
= wi
->next
;
684 env
->queued_work_last
= NULL
;
685 qemu_cond_broadcast(&qemu_work_cond
);
688 static void qemu_wait_io_event_common(CPUArchState
*env
)
690 CPUState
*cpu
= ENV_GET_CPU(env
);
695 qemu_cond_signal(&qemu_pause_cond
);
697 flush_queued_work(env
);
698 cpu
->thread_kicked
= false;
701 static void qemu_tcg_wait_io_event(void)
705 while (all_cpu_threads_idle()) {
706 /* Start accounting real time to the virtual clock if the CPUs
708 qemu_clock_warp(vm_clock
);
709 qemu_cond_wait(tcg_halt_cond
, &qemu_global_mutex
);
712 while (iothread_requesting_mutex
) {
713 qemu_cond_wait(&qemu_io_proceeded_cond
, &qemu_global_mutex
);
716 for (env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
717 qemu_wait_io_event_common(env
);
721 static void qemu_kvm_wait_io_event(CPUArchState
*env
)
723 while (cpu_thread_is_idle(env
)) {
724 qemu_cond_wait(env
->halt_cond
, &qemu_global_mutex
);
727 qemu_kvm_eat_signals(env
);
728 qemu_wait_io_event_common(env
);
731 static void *qemu_kvm_cpu_thread_fn(void *arg
)
733 CPUArchState
*env
= arg
;
734 CPUState
*cpu
= ENV_GET_CPU(env
);
737 qemu_mutex_lock(&qemu_global_mutex
);
738 qemu_thread_get_self(cpu
->thread
);
739 env
->thread_id
= qemu_get_thread_id();
740 cpu_single_env
= env
;
742 r
= kvm_init_vcpu(env
);
744 fprintf(stderr
, "kvm_init_vcpu failed: %s\n", strerror(-r
));
748 qemu_kvm_init_cpu_signals(env
);
750 /* signal CPU creation */
752 qemu_cond_signal(&qemu_cpu_cond
);
755 if (cpu_can_run(env
)) {
756 r
= kvm_cpu_exec(env
);
757 if (r
== EXCP_DEBUG
) {
758 cpu_handle_guest_debug(env
);
761 qemu_kvm_wait_io_event(env
);
767 static void *qemu_dummy_cpu_thread_fn(void *arg
)
770 fprintf(stderr
, "qtest is not supported under Windows\n");
773 CPUArchState
*env
= arg
;
774 CPUState
*cpu
= ENV_GET_CPU(env
);
778 qemu_mutex_lock_iothread();
779 qemu_thread_get_self(cpu
->thread
);
780 env
->thread_id
= qemu_get_thread_id();
782 sigemptyset(&waitset
);
783 sigaddset(&waitset
, SIG_IPI
);
785 /* signal CPU creation */
787 qemu_cond_signal(&qemu_cpu_cond
);
789 cpu_single_env
= env
;
791 cpu_single_env
= NULL
;
792 qemu_mutex_unlock_iothread();
795 r
= sigwait(&waitset
, &sig
);
796 } while (r
== -1 && (errno
== EAGAIN
|| errno
== EINTR
));
801 qemu_mutex_lock_iothread();
802 cpu_single_env
= env
;
803 qemu_wait_io_event_common(env
);
810 static void tcg_exec_all(void);
812 static void *qemu_tcg_cpu_thread_fn(void *arg
)
814 CPUArchState
*env
= arg
;
815 CPUState
*cpu
= ENV_GET_CPU(env
);
817 qemu_tcg_init_cpu_signals();
818 qemu_thread_get_self(cpu
->thread
);
820 /* signal CPU creation */
821 qemu_mutex_lock(&qemu_global_mutex
);
822 for (env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
823 env
->thread_id
= qemu_get_thread_id();
826 qemu_cond_signal(&qemu_cpu_cond
);
828 /* wait for initial kick-off after machine start */
829 while (first_cpu
->stopped
) {
830 qemu_cond_wait(tcg_halt_cond
, &qemu_global_mutex
);
832 /* process any pending work */
833 for (env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
834 qemu_wait_io_event_common(env
);
840 if (use_icount
&& qemu_clock_deadline(vm_clock
) <= 0) {
843 qemu_tcg_wait_io_event();
849 static void qemu_cpu_kick_thread(CPUArchState
*env
)
851 CPUState
*cpu
= ENV_GET_CPU(env
);
855 err
= pthread_kill(cpu
->thread
->thread
, SIG_IPI
);
857 fprintf(stderr
, "qemu:%s: %s", __func__
, strerror(err
));
861 if (!qemu_cpu_is_self(env
)) {
862 SuspendThread(cpu
->hThread
);
864 ResumeThread(cpu
->hThread
);
869 void qemu_cpu_kick(void *_env
)
871 CPUArchState
*env
= _env
;
872 CPUState
*cpu
= ENV_GET_CPU(env
);
874 qemu_cond_broadcast(env
->halt_cond
);
875 if (!tcg_enabled() && !cpu
->thread_kicked
) {
876 qemu_cpu_kick_thread(env
);
877 cpu
->thread_kicked
= true;
881 void qemu_cpu_kick_self(void)
884 assert(cpu_single_env
);
885 CPUState
*cpu_single_cpu
= ENV_GET_CPU(cpu_single_env
);
887 if (!cpu_single_cpu
->thread_kicked
) {
888 qemu_cpu_kick_thread(cpu_single_env
);
889 cpu_single_cpu
->thread_kicked
= true;
896 int qemu_cpu_is_self(void *_env
)
898 CPUArchState
*env
= _env
;
899 CPUState
*cpu
= ENV_GET_CPU(env
);
901 return qemu_thread_is_self(cpu
->thread
);
904 void qemu_mutex_lock_iothread(void)
906 if (!tcg_enabled()) {
907 qemu_mutex_lock(&qemu_global_mutex
);
909 iothread_requesting_mutex
= true;
910 if (qemu_mutex_trylock(&qemu_global_mutex
)) {
911 qemu_cpu_kick_thread(first_cpu
);
912 qemu_mutex_lock(&qemu_global_mutex
);
914 iothread_requesting_mutex
= false;
915 qemu_cond_broadcast(&qemu_io_proceeded_cond
);
919 void qemu_mutex_unlock_iothread(void)
921 qemu_mutex_unlock(&qemu_global_mutex
);
924 static int all_vcpus_paused(void)
926 CPUArchState
*penv
= first_cpu
;
929 if (!penv
->stopped
) {
932 penv
= penv
->next_cpu
;
938 void pause_all_vcpus(void)
940 CPUArchState
*penv
= first_cpu
;
942 qemu_clock_enable(vm_clock
, false);
946 penv
= penv
->next_cpu
;
949 if (!qemu_thread_is_self(&io_thread
)) {
951 if (!kvm_enabled()) {
955 penv
= penv
->next_cpu
;
961 while (!all_vcpus_paused()) {
962 qemu_cond_wait(&qemu_pause_cond
, &qemu_global_mutex
);
966 penv
= penv
->next_cpu
;
971 void resume_all_vcpus(void)
973 CPUArchState
*penv
= first_cpu
;
975 qemu_clock_enable(vm_clock
, true);
980 penv
= penv
->next_cpu
;
984 static void qemu_tcg_init_vcpu(void *_env
)
986 CPUArchState
*env
= _env
;
987 CPUState
*cpu
= ENV_GET_CPU(env
);
989 /* share a single thread for all cpus with TCG */
990 if (!tcg_cpu_thread
) {
991 cpu
->thread
= g_malloc0(sizeof(QemuThread
));
992 env
->halt_cond
= g_malloc0(sizeof(QemuCond
));
993 qemu_cond_init(env
->halt_cond
);
994 tcg_halt_cond
= env
->halt_cond
;
995 qemu_thread_create(cpu
->thread
, qemu_tcg_cpu_thread_fn
, env
,
996 QEMU_THREAD_JOINABLE
);
998 cpu
->hThread
= qemu_thread_get_handle(cpu
->thread
);
1000 while (env
->created
== 0) {
1001 qemu_cond_wait(&qemu_cpu_cond
, &qemu_global_mutex
);
1003 tcg_cpu_thread
= cpu
->thread
;
1005 cpu
->thread
= tcg_cpu_thread
;
1006 env
->halt_cond
= tcg_halt_cond
;
1010 static void qemu_kvm_start_vcpu(CPUArchState
*env
)
1012 CPUState
*cpu
= ENV_GET_CPU(env
);
1014 cpu
->thread
= g_malloc0(sizeof(QemuThread
));
1015 env
->halt_cond
= g_malloc0(sizeof(QemuCond
));
1016 qemu_cond_init(env
->halt_cond
);
1017 qemu_thread_create(cpu
->thread
, qemu_kvm_cpu_thread_fn
, env
,
1018 QEMU_THREAD_JOINABLE
);
1019 while (env
->created
== 0) {
1020 qemu_cond_wait(&qemu_cpu_cond
, &qemu_global_mutex
);
1024 static void qemu_dummy_start_vcpu(CPUArchState
*env
)
1026 CPUState
*cpu
= ENV_GET_CPU(env
);
1028 cpu
->thread
= g_malloc0(sizeof(QemuThread
));
1029 env
->halt_cond
= g_malloc0(sizeof(QemuCond
));
1030 qemu_cond_init(env
->halt_cond
);
1031 qemu_thread_create(cpu
->thread
, qemu_dummy_cpu_thread_fn
, env
,
1032 QEMU_THREAD_JOINABLE
);
1033 while (env
->created
== 0) {
1034 qemu_cond_wait(&qemu_cpu_cond
, &qemu_global_mutex
);
1038 void qemu_init_vcpu(void *_env
)
1040 CPUArchState
*env
= _env
;
1042 env
->nr_cores
= smp_cores
;
1043 env
->nr_threads
= smp_threads
;
1045 if (kvm_enabled()) {
1046 qemu_kvm_start_vcpu(env
);
1047 } else if (tcg_enabled()) {
1048 qemu_tcg_init_vcpu(env
);
1050 qemu_dummy_start_vcpu(env
);
1054 void cpu_stop_current(void)
1056 if (cpu_single_env
) {
1057 cpu_single_env
->stop
= 0;
1058 cpu_single_env
->stopped
= 1;
1059 cpu_exit(cpu_single_env
);
1060 qemu_cond_signal(&qemu_pause_cond
);
1064 void vm_stop(RunState state
)
1066 if (!qemu_thread_is_self(&io_thread
)) {
1067 qemu_system_vmstop_request(state
);
1069 * FIXME: should not return to device code in case
1070 * vm_stop() has been requested.
1078 /* does a state transition even if the VM is already stopped,
1079 current state is forgotten forever */
1080 void vm_stop_force_state(RunState state
)
1082 if (runstate_is_running()) {
1085 runstate_set(state
);
1089 static int tcg_cpu_exec(CPUArchState
*env
)
1092 #ifdef CONFIG_PROFILER
1096 #ifdef CONFIG_PROFILER
1097 ti
= profile_getclock();
1102 qemu_icount
-= (env
->icount_decr
.u16
.low
+ env
->icount_extra
);
1103 env
->icount_decr
.u16
.low
= 0;
1104 env
->icount_extra
= 0;
1105 count
= qemu_icount_round(qemu_clock_deadline(vm_clock
));
1106 qemu_icount
+= count
;
1107 decr
= (count
> 0xffff) ? 0xffff : count
;
1109 env
->icount_decr
.u16
.low
= decr
;
1110 env
->icount_extra
= count
;
1112 ret
= cpu_exec(env
);
1113 #ifdef CONFIG_PROFILER
1114 qemu_time
+= profile_getclock() - ti
;
1117 /* Fold pending instructions back into the
1118 instruction counter, and clear the interrupt flag. */
1119 qemu_icount
-= (env
->icount_decr
.u16
.low
1120 + env
->icount_extra
);
1121 env
->icount_decr
.u32
= 0;
1122 env
->icount_extra
= 0;
1127 static void tcg_exec_all(void)
1131 /* Account partial waits to the vm_clock. */
1132 qemu_clock_warp(vm_clock
);
1134 if (next_cpu
== NULL
) {
1135 next_cpu
= first_cpu
;
1137 for (; next_cpu
!= NULL
&& !exit_request
; next_cpu
= next_cpu
->next_cpu
) {
1138 CPUArchState
*env
= next_cpu
;
1140 qemu_clock_enable(vm_clock
,
1141 (env
->singlestep_enabled
& SSTEP_NOTIMER
) == 0);
1143 if (cpu_can_run(env
)) {
1144 r
= tcg_cpu_exec(env
);
1145 if (r
== EXCP_DEBUG
) {
1146 cpu_handle_guest_debug(env
);
1149 } else if (env
->stop
|| env
->stopped
) {
1156 void set_numa_modes(void)
1161 for (env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
1162 for (i
= 0; i
< nb_numa_nodes
; i
++) {
1163 if (test_bit(env
->cpu_index
, node_cpumask
[i
])) {
1170 void set_cpu_log(const char *optarg
)
1173 const CPULogItem
*item
;
1175 mask
= cpu_str_to_log_mask(optarg
);
1177 printf("Log items (comma separated):\n");
1178 for (item
= cpu_log_items
; item
->mask
!= 0; item
++) {
1179 printf("%-10s %s\n", item
->name
, item
->help
);
1186 void set_cpu_log_filename(const char *optarg
)
1188 cpu_set_log_filename(optarg
);
1191 void list_cpus(FILE *f
, fprintf_function cpu_fprintf
, const char *optarg
)
1193 /* XXX: implement xxx_cpu_list for targets that still miss it */
1194 #if defined(cpu_list_id)
1195 cpu_list_id(f
, cpu_fprintf
, optarg
);
1196 #elif defined(cpu_list)
1197 cpu_list(f
, cpu_fprintf
); /* deprecated */
1201 CpuInfoList
*qmp_query_cpus(Error
**errp
)
1203 CpuInfoList
*head
= NULL
, *cur_item
= NULL
;
1206 for(env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
1209 cpu_synchronize_state(env
);
1211 info
= g_malloc0(sizeof(*info
));
1212 info
->value
= g_malloc0(sizeof(*info
->value
));
1213 info
->value
->CPU
= env
->cpu_index
;
1214 info
->value
->current
= (env
== first_cpu
);
1215 info
->value
->halted
= env
->halted
;
1216 info
->value
->thread_id
= env
->thread_id
;
1217 #if defined(TARGET_I386)
1218 info
->value
->has_pc
= true;
1219 info
->value
->pc
= env
->eip
+ env
->segs
[R_CS
].base
;
1220 #elif defined(TARGET_PPC)
1221 info
->value
->has_nip
= true;
1222 info
->value
->nip
= env
->nip
;
1223 #elif defined(TARGET_SPARC)
1224 info
->value
->has_pc
= true;
1225 info
->value
->pc
= env
->pc
;
1226 info
->value
->has_npc
= true;
1227 info
->value
->npc
= env
->npc
;
1228 #elif defined(TARGET_MIPS)
1229 info
->value
->has_PC
= true;
1230 info
->value
->PC
= env
->active_tc
.PC
;
1233 /* XXX: waiting for the qapi to support GSList */
1235 head
= cur_item
= info
;
1237 cur_item
->next
= info
;
1245 void qmp_memsave(int64_t addr
, int64_t size
, const char *filename
,
1246 bool has_cpu
, int64_t cpu_index
, Error
**errp
)
1257 for (env
= first_cpu
; env
; env
= env
->next_cpu
) {
1258 if (cpu_index
== env
->cpu_index
) {
1264 error_set(errp
, QERR_INVALID_PARAMETER_VALUE
, "cpu-index",
1269 f
= fopen(filename
, "wb");
1271 error_set(errp
, QERR_OPEN_FILE_FAILED
, filename
);
1279 cpu_memory_rw_debug(env
, addr
, buf
, l
, 0);
1280 if (fwrite(buf
, 1, l
, f
) != l
) {
1281 error_set(errp
, QERR_IO_ERROR
);
1292 void qmp_pmemsave(int64_t addr
, int64_t size
, const char *filename
,
1299 f
= fopen(filename
, "wb");
1301 error_set(errp
, QERR_OPEN_FILE_FAILED
, filename
);
1309 cpu_physical_memory_rw(addr
, buf
, l
, 0);
1310 if (fwrite(buf
, 1, l
, f
) != l
) {
1311 error_set(errp
, QERR_IO_ERROR
);
1322 void qmp_inject_nmi(Error
**errp
)
1324 #if defined(TARGET_I386)
1327 for (env
= first_cpu
; env
!= NULL
; env
= env
->next_cpu
) {
1328 if (!env
->apic_state
) {
1329 cpu_interrupt(env
, CPU_INTERRUPT_NMI
);
1331 apic_deliver_nmi(env
->apic_state
);
1335 error_set(errp
, QERR_UNSUPPORTED
);