/* qemu/ar7.git: translate-all.c
 * blob 75b951bd41bd31bdace67ef2a61ba05b428aa2ca
 * (merge of remote-tracking branch 'qemu/master')
 */
/*
 *  Host code generation
 *
 *  Copyright (c) 2003 Fabrice Bellard
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
#ifdef _WIN32
#include <windows.h>
#else
#include <sys/types.h>
#include <sys/mman.h>
#endif

#include "config.h"

#include "qemu-common.h"
#define NO_CPU_IO_DEFS
#include "cpu.h"
#include "disas/disas.h"
#include "tcg.h"
#if defined(CONFIG_USER_ONLY)
#include "qemu.h"
#if defined(TARGET_X86_64)
#include "vsyscall.h"
#endif
#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
#include <sys/param.h>
#if __FreeBSD_version >= 700104
#define HAVE_KINFO_GETVMMAP
#define sigqueue sigqueue_freebsd  /* avoid redefinition */
#include <sys/time.h>
#include <sys/proc.h>
#include <machine/profile.h>
#define _KERNEL
#include <sys/user.h>
#undef _KERNEL
#undef sigqueue
#include <libutil.h>
#endif
#endif
#else
#include "exec/address-spaces.h"
#endif

#include "exec/cputlb.h"
#include "translate-all.h"
#include "qemu/timer.h"
//#define DEBUG_TB_INVALIDATE
//#define DEBUG_FLUSH
/* make various TB consistency checks */
//#define DEBUG_TB_CHECK

#if !defined(CONFIG_USER_ONLY)
/* TB consistency checks only implemented for usermode emulation.  */
#undef DEBUG_TB_CHECK
#endif

#define SMC_BITMAP_USE_THRESHOLD 10
typedef struct PageDesc {
    /* list of TBs intersecting this ram page */
    TranslationBlock *first_tb;
    /* in order to optimize self modifying code, we count the number
       of lookups we do to a given page to use a bitmap */
    unsigned int code_write_count;
    uint8_t *code_bitmap;
#if defined(CONFIG_USER_ONLY)
    unsigned long flags;
#endif
} PageDesc;
/* In system mode we want L1_MAP to be based on ram offsets,
   while in user mode we want it to be based on virtual addresses.  */
#if !defined(CONFIG_USER_ONLY)
#if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
# define L1_MAP_ADDR_SPACE_BITS  HOST_LONG_BITS
#else
# define L1_MAP_ADDR_SPACE_BITS  TARGET_PHYS_ADDR_SPACE_BITS
#endif
#else
# define L1_MAP_ADDR_SPACE_BITS  TARGET_VIRT_ADDR_SPACE_BITS
#endif

/* Size of the L2 (and L3, etc) page tables.  */
#define V_L2_BITS 10
#define V_L2_SIZE (1 << V_L2_BITS)

/* The bits remaining after N lower levels of page tables.  */
#define V_L1_BITS_REM \
    ((L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % V_L2_BITS)

#if V_L1_BITS_REM < 4
#define V_L1_BITS  (V_L1_BITS_REM + V_L2_BITS)
#else
#define V_L1_BITS  V_L1_BITS_REM
#endif

#define V_L1_SIZE  ((target_ulong)1 << V_L1_BITS)

#define V_L1_SHIFT (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - V_L1_BITS)
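/* Worked example (illustrative only): assuming a user-mode build with
 * TARGET_VIRT_ADDR_SPACE_BITS = 47 and TARGET_PAGE_BITS = 12, there are
 * 35 index bits left for the map.  35 % 10 leaves a 5-bit remainder, so
 * V_L1_BITS = 5, V_L1_SIZE = 32 and V_L1_SHIFT = 30: l1_map is a 32-entry
 * root, followed by two 1024-entry pointer levels and a 1024-entry
 * PageDesc array at the leaves.  */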
uintptr_t qemu_real_host_page_size;
uintptr_t qemu_host_page_size;
uintptr_t qemu_host_page_mask;

/* This is a multi-level map on the virtual address space.
   The bottom level has pointers to PageDesc.  */
static void *l1_map[V_L1_SIZE];

/* code generation context */
TCGContext tcg_ctx;

static void tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
                         tb_page_addr_t phys_page2);
static TranslationBlock *tb_find_pc(uintptr_t tc_ptr);
void cpu_gen_init(void)
{
    tcg_context_init(&tcg_ctx);
}
/* return non zero if the very first instruction is invalid so that
   the virtual CPU can trigger an exception.

   '*gen_code_size_ptr' contains the size of the generated code (host
   code).
*/
int cpu_gen_code(CPUArchState *env, TranslationBlock *tb, int *gen_code_size_ptr)
{
    TCGContext *s = &tcg_ctx;
    uint8_t *gen_code_buf;
    int gen_code_size;
#ifdef CONFIG_PROFILER
    int64_t ti;
#endif

#ifdef CONFIG_PROFILER
    s->tb_count1++; /* includes aborted translations because of
                       exceptions */
    ti = profile_getclock();
#endif
    tcg_func_start(s);

    gen_intermediate_code(env, tb);

    /* generate machine code */
    gen_code_buf = tb->tc_ptr;
    tb->tb_next_offset[0] = 0xffff;
    tb->tb_next_offset[1] = 0xffff;
    s->tb_next_offset = tb->tb_next_offset;
#ifdef USE_DIRECT_JUMP
    s->tb_jmp_offset = tb->tb_jmp_offset;
    s->tb_next = NULL;
#else
    s->tb_jmp_offset = NULL;
    s->tb_next = tb->tb_next;
#endif

#ifdef CONFIG_PROFILER
    s->tb_count++;
    s->interm_time += profile_getclock() - ti;
    s->code_time -= profile_getclock();
#endif
    gen_code_size = tcg_gen_code(s, gen_code_buf);
    *gen_code_size_ptr = gen_code_size;
#ifdef CONFIG_PROFILER
    s->code_time += profile_getclock();
    s->code_in_len += tb->size;
    s->code_out_len += gen_code_size;
#endif

#ifdef DEBUG_DISAS
    if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) {
        qemu_log("OUT: [size=%d]\n", *gen_code_size_ptr);
        log_disas(tb->tc_ptr, *gen_code_size_ptr);
        qemu_log("\n");
        qemu_log_flush();
    }
#endif
    return 0;
}
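/* State restoration works by retranslating the TB containing 'searched_pc':
 * gen_intermediate_code_pc() regenerates the intermediate ops along with
 * per-op guest PC and icount information, tcg_gen_code_search_pc() replays
 * host code generation until the offset of 'searched_pc' is reached, and
 * restore_state_to_opc() copies the guest state recorded for that op index
 * back into the CPU.  This is why translation must be deterministic: the
 * second pass has to produce exactly the same code layout as the first.  */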
/* The cpu state corresponding to 'searched_pc' is restored.
 */
static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
                                     uintptr_t searched_pc)
{
    CPUArchState *env = cpu->env_ptr;
    TCGContext *s = &tcg_ctx;
    int j;
    uintptr_t tc_ptr;
#ifdef CONFIG_PROFILER
    int64_t ti;
#endif

#ifdef CONFIG_PROFILER
    ti = profile_getclock();
#endif
    tcg_func_start(s);

    gen_intermediate_code_pc(env, tb);

    if (use_icount) {
        /* Reset the cycle counter to the start of the block.  */
        cpu->icount_decr.u16.low += tb->icount;
        /* Clear the IO flag.  */
        cpu->can_do_io = 0;
    }

    /* find opc index corresponding to search_pc */
    tc_ptr = (uintptr_t)tb->tc_ptr;
    if (searched_pc < tc_ptr) {
        return -1;
    }

    s->tb_next_offset = tb->tb_next_offset;
#ifdef USE_DIRECT_JUMP
    s->tb_jmp_offset = tb->tb_jmp_offset;
    s->tb_next = NULL;
#else
    s->tb_jmp_offset = NULL;
    s->tb_next = tb->tb_next;
#endif
    j = tcg_gen_code_search_pc(s, (uint8_t *)tc_ptr, searched_pc - tc_ptr);
    if (j < 0) {
        return -1;
    }
    /* now find start of instruction before */
    while (s->gen_opc_instr_start[j] == 0) {
        j--;
    }
    cpu->icount_decr.u16.low -= s->gen_opc_icount[j];

    restore_state_to_opc(env, tb, j);

#ifdef CONFIG_PROFILER
    s->restore_time += profile_getclock() - ti;
    s->restore_count++;
#endif
    return 0;
}
bool cpu_restore_state(CPUState *cpu, uintptr_t retaddr)
{
    TranslationBlock *tb;

    tb = tb_find_pc(retaddr);
    if (tb) {
        cpu_restore_state_from_tb(cpu, tb, retaddr);
        return true;
    }
    return false;
}
#ifdef _WIN32
static inline void map_exec(void *addr, long size)
{
    DWORD old_protect;
    VirtualProtect(addr, size,
                   PAGE_EXECUTE_READWRITE, &old_protect);
}
#else
static inline void map_exec(void *addr, long size)
{
    unsigned long start, end, page_size;

    page_size = getpagesize();
    start = (unsigned long)addr;
    start &= ~(page_size - 1);

    end = (unsigned long)addr + size;
    end += page_size - 1;
    end &= ~(page_size - 1);

    mprotect((void *)start, end - start,
             PROT_READ | PROT_WRITE | PROT_EXEC);
}
#endif
void page_size_init(void)
{
    /* NOTE: we can always suppose that qemu_host_page_size >=
       TARGET_PAGE_SIZE */
#ifdef _WIN32
    SYSTEM_INFO system_info;

    GetSystemInfo(&system_info);
    qemu_real_host_page_size = system_info.dwPageSize;
#else
    qemu_real_host_page_size = getpagesize();
#endif
    if (qemu_host_page_size == 0) {
        qemu_host_page_size = qemu_real_host_page_size;
    }
    if (qemu_host_page_size < TARGET_PAGE_SIZE) {
        qemu_host_page_size = TARGET_PAGE_SIZE;
    }
    qemu_host_page_mask = ~(qemu_host_page_size - 1);
}
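/* In user-mode emulation on BSD hosts, page_init() also records the address
 * ranges already occupied by the host process (via kinfo_getvmmap() or the
 * Linux-compat /proc/self/maps) and marks them PAGE_RESERVED so the guest
 * cannot map over them.  In all other configurations it only initializes the
 * host page size globals above.  */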
static void page_init(void)
{
    page_size_init();
#if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
    {
#ifdef HAVE_KINFO_GETVMMAP
        struct kinfo_vmentry *freep;
        int i, cnt;

        freep = kinfo_getvmmap(getpid(), &cnt);
        if (freep) {
            mmap_lock();
            for (i = 0; i < cnt; i++) {
                unsigned long startaddr, endaddr;

                startaddr = freep[i].kve_start;
                endaddr = freep[i].kve_end;
                if (h2g_valid(startaddr)) {
                    startaddr = h2g(startaddr) & TARGET_PAGE_MASK;

                    if (h2g_valid(endaddr)) {
                        endaddr = h2g(endaddr);
                        page_set_flags(startaddr, endaddr, PAGE_RESERVED);
                    } else {
#if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
                        endaddr = ~0ul;
                        page_set_flags(startaddr, endaddr, PAGE_RESERVED);
#endif
                    }
                }
            }
            free(freep);
            mmap_unlock();
        }
#else
        FILE *f;

        last_brk = (unsigned long)sbrk(0);

        f = fopen("/compat/linux/proc/self/maps", "r");
        if (f) {
            mmap_lock();

            do {
                unsigned long startaddr, endaddr;
                int n;

                n = fscanf(f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);

                if (n == 2 && h2g_valid(startaddr)) {
                    startaddr = h2g(startaddr) & TARGET_PAGE_MASK;

                    if (h2g_valid(endaddr)) {
                        endaddr = h2g(endaddr);
                    } else {
                        endaddr = ~0ul;
                    }
                    page_set_flags(startaddr, endaddr, PAGE_RESERVED);
                }
            } while (!feof(f));

            fclose(f);
            mmap_unlock();
        }
#endif
    }
#endif
}
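/* page_find_alloc() walks the l1_map radix tree for the page numbered
 * 'index' (i.e. address >> TARGET_PAGE_BITS).  The root is indexed with
 * V_L1_BITS, each intermediate level with V_L2_BITS, and the leaf is an
 * array of V_L2_SIZE PageDesc entries.  With 'alloc' set, missing
 * intermediate tables and the leaf array are created on demand; otherwise
 * NULL is returned as soon as a hole is found.  */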
static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
{
    PageDesc *pd;
    void **lp;
    int i;

#if defined(CONFIG_USER_ONLY)
    /* We can't use g_malloc because it may recurse into a locked mutex. */
# define ALLOC(P, SIZE)                                 \
    do {                                                \
        P = mmap(NULL, SIZE, PROT_READ | PROT_WRITE,    \
                 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);   \
    } while (0)
#else
# define ALLOC(P, SIZE) \
    do { P = g_malloc0(SIZE); } while (0)
#endif

    /* Level 1.  Always allocated.  */
    lp = l1_map + ((index >> V_L1_SHIFT) & (V_L1_SIZE - 1));

    /* Level 2..N-1.  */
    for (i = V_L1_SHIFT / V_L2_BITS - 1; i > 0; i--) {
        void **p = *lp;

        if (p == NULL) {
            if (!alloc) {
                return NULL;
            }
            ALLOC(p, sizeof(void *) * V_L2_SIZE);
            *lp = p;
        }

        lp = p + ((index >> (i * V_L2_BITS)) & (V_L2_SIZE - 1));
    }

    pd = *lp;
    if (pd == NULL) {
        if (!alloc) {
            return NULL;
        }
        ALLOC(pd, sizeof(PageDesc) * V_L2_SIZE);
        *lp = pd;
    }

#undef ALLOC

    return pd + (index & (V_L2_SIZE - 1));
}

static inline PageDesc *page_find(tb_page_addr_t index)
{
    return page_find_alloc(index, 0);
}

#if !defined(CONFIG_USER_ONLY)
#define mmap_lock() do { } while (0)
#define mmap_unlock() do { } while (0)
#endif
443 #if defined(CONFIG_USER_ONLY)
444 /* Currently it is not recommended to allocate big chunks of data in
445    user mode. It will change when a dedicated libc is used. */
446 /* ??? 64-bit hosts ought to have no problem mmaping data outside the
447 region in which the guest needs to run. Revisit this. */
448 #define USE_STATIC_CODE_GEN_BUFFER
449 #endif
451 /* ??? Should configure for this, not list operating systems here. */
452 #if (defined(__linux__) \
453 || defined(__FreeBSD__) || defined(__FreeBSD_kernel__) \
454 || defined(__DragonFly__) || defined(__OpenBSD__) \
455 || defined(__NetBSD__))
456 # define USE_MMAP
457 #endif
459 /* Minimum size of the code gen buffer. This number is randomly chosen,
460 but not so small that we can't have a fair number of TB's live. */
461 #define MIN_CODE_GEN_BUFFER_SIZE (1024u * 1024)
463 /* Maximum size of the code gen buffer we'd like to use. Unless otherwise
464 indicated, this is constrained by the range of direct branches on the
465 host cpu, as used by the TCG implementation of goto_tb. */
466 #if defined(__x86_64__)
467 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
468 #elif defined(__sparc__)
469 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
470 #elif defined(__aarch64__)
471 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
472 #elif defined(__arm__)
473 # define MAX_CODE_GEN_BUFFER_SIZE (16u * 1024 * 1024)
474 #elif defined(__s390x__)
475 /* We have a +- 4GB range on the branches; leave some slop. */
476 # define MAX_CODE_GEN_BUFFER_SIZE (3ul * 1024 * 1024 * 1024)
477 #else
478 # define MAX_CODE_GEN_BUFFER_SIZE ((size_t)-1)
479 #endif
481 #define DEFAULT_CODE_GEN_BUFFER_SIZE_1 (32u * 1024 * 1024)
483 #define DEFAULT_CODE_GEN_BUFFER_SIZE \
484 (DEFAULT_CODE_GEN_BUFFER_SIZE_1 < MAX_CODE_GEN_BUFFER_SIZE \
485 ? DEFAULT_CODE_GEN_BUFFER_SIZE_1 : MAX_CODE_GEN_BUFFER_SIZE)
487 static inline size_t size_code_gen_buffer(size_t tb_size)
489 /* Size the buffer. */
490 if (tb_size == 0) {
491 #ifdef USE_STATIC_CODE_GEN_BUFFER
492 tb_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
493 #else
494 /* ??? Needs adjustments. */
495 /* ??? If we relax the requirement that CONFIG_USER_ONLY use the
496 static buffer, we could size this on RESERVED_VA, on the text
497 segment size of the executable, or continue to use the default. */
498 tb_size = (unsigned long)(ram_size / 4);
499 #endif
501 if (tb_size < MIN_CODE_GEN_BUFFER_SIZE) {
502 tb_size = MIN_CODE_GEN_BUFFER_SIZE;
504 if (tb_size > MAX_CODE_GEN_BUFFER_SIZE) {
505 tb_size = MAX_CODE_GEN_BUFFER_SIZE;
507 tcg_ctx.code_gen_buffer_size = tb_size;
508 return tb_size;
511 #ifdef USE_STATIC_CODE_GEN_BUFFER
512 static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
513 __attribute__((aligned(CODE_GEN_ALIGN)));
515 static inline void *alloc_code_gen_buffer(void)
517 map_exec(static_code_gen_buffer, tcg_ctx.code_gen_buffer_size);
518 return static_code_gen_buffer;
520 #elif defined(USE_MMAP)
521 static inline void *alloc_code_gen_buffer(void)
523 int flags = MAP_PRIVATE | MAP_ANONYMOUS;
524 uintptr_t start = 0;
525 void *buf;
527 /* Constrain the position of the buffer based on the host cpu.
528 Note that these addresses are chosen in concert with the
529 addresses assigned in the relevant linker script file. */
530 # if defined(__PIE__) || defined(__PIC__)
531 /* Don't bother setting a preferred location if we're building
532 a position-independent executable. We're more likely to get
533 an address near the main executable if we let the kernel
534 choose the address. */
535 # elif defined(__x86_64__) && defined(MAP_32BIT)
536 /* Force the memory down into low memory with the executable.
537 Leave the choice of exact location with the kernel. */
538 flags |= MAP_32BIT;
539 /* Cannot expect to map more than 800MB in low memory. */
540 if (tcg_ctx.code_gen_buffer_size > 800u * 1024 * 1024) {
541 tcg_ctx.code_gen_buffer_size = 800u * 1024 * 1024;
543 # elif defined(__sparc__)
544 start = 0x40000000ul;
545 # elif defined(__s390x__)
546 start = 0x90000000ul;
547 # endif
549 buf = mmap((void *)start, tcg_ctx.code_gen_buffer_size,
550 PROT_WRITE | PROT_READ | PROT_EXEC, flags, -1, 0);
551 return buf == MAP_FAILED ? NULL : buf;
553 #else
554 static inline void *alloc_code_gen_buffer(void)
556 void *buf = g_malloc(tcg_ctx.code_gen_buffer_size);
558 if (buf) {
559 map_exec(buf, tcg_ctx.code_gen_buffer_size);
561 return buf;
563 #endif /* USE_STATIC_CODE_GEN_BUFFER, USE_MMAP */
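/* code_gen_alloc() sizes and maps the translation buffer, reserves 1 KiB at
 * its end for the prologue/epilogue generated by tcg_prologue_init(), keeps
 * TCG_MAX_OP_SIZE * OPC_BUF_SIZE bytes of headroom (code_gen_buffer_max_size)
 * so a block being translated can never overrun the buffer, and allocates the
 * TranslationBlock descriptor array sized for code_gen_max_blocks entries.  */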
565 static inline void code_gen_alloc(size_t tb_size)
567 tcg_ctx.code_gen_buffer_size = size_code_gen_buffer(tb_size);
568 tcg_ctx.code_gen_buffer = alloc_code_gen_buffer();
569 if (tcg_ctx.code_gen_buffer == NULL) {
570 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
571 exit(1);
574 qemu_madvise(tcg_ctx.code_gen_buffer, tcg_ctx.code_gen_buffer_size,
575 QEMU_MADV_HUGEPAGE);
577 /* Steal room for the prologue at the end of the buffer. This ensures
578 (via the MAX_CODE_GEN_BUFFER_SIZE limits above) that direct branches
579 from TB's to the prologue are going to be in range. It also means
580 that we don't need to mark (additional) portions of the data segment
581 as executable. */
582 tcg_ctx.code_gen_prologue = tcg_ctx.code_gen_buffer +
583 tcg_ctx.code_gen_buffer_size - 1024;
584 tcg_ctx.code_gen_buffer_size -= 1024;
586 tcg_ctx.code_gen_buffer_max_size = tcg_ctx.code_gen_buffer_size -
587 (TCG_MAX_OP_SIZE * OPC_BUF_SIZE);
588 tcg_ctx.code_gen_max_blocks = tcg_ctx.code_gen_buffer_size /
589 CODE_GEN_AVG_BLOCK_SIZE;
590 tcg_ctx.tb_ctx.tbs =
591 g_malloc(tcg_ctx.code_gen_max_blocks * sizeof(TranslationBlock));
594 /* Must be called before using the QEMU cpus. 'tb_size' is the size
595 (in bytes) allocated to the translation buffer. Zero means default
596 size. */
597 void tcg_exec_init(uintptr_t tb_size)
599 cpu_gen_init();
600 code_gen_alloc(tb_size);
601 tcg_ctx.code_gen_ptr = tcg_ctx.code_gen_buffer;
602 tcg_register_jit(tcg_ctx.code_gen_buffer, tcg_ctx.code_gen_buffer_size);
603 page_init();
604 #if !defined(CONFIG_USER_ONLY) || !defined(CONFIG_USE_GUEST_BASE)
605 /* There's no guest base to take into account, so go ahead and
606 initialize the prologue now. */
607 tcg_prologue_init(&tcg_ctx);
608 #endif
611 bool tcg_enabled(void)
613 return tcg_ctx.code_gen_buffer != NULL;
616 /* Allocate a new translation block. Flush the translation buffer if
617 too many translation blocks or too much generated code. */
618 static TranslationBlock *tb_alloc(target_ulong pc)
620 TranslationBlock *tb;
622 if (tcg_ctx.tb_ctx.nb_tbs >= tcg_ctx.code_gen_max_blocks ||
623 (tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer) >=
624 tcg_ctx.code_gen_buffer_max_size) {
625 return NULL;
627 tb = &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs++];
628 tb->pc = pc;
629 tb->cflags = 0;
630 return tb;
633 void tb_free(TranslationBlock *tb)
635     /* In practice this is mostly used for single use temporary TBs.
636 Ignore the hard cases and just back up if this TB happens to
637 be the last one generated. */
638 if (tcg_ctx.tb_ctx.nb_tbs > 0 &&
639 tb == &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs - 1]) {
640 tcg_ctx.code_gen_ptr = tb->tc_ptr;
641 tcg_ctx.tb_ctx.nb_tbs--;
645 static inline void invalidate_page_bitmap(PageDesc *p)
647 if (p->code_bitmap) {
648 g_free(p->code_bitmap);
649 p->code_bitmap = NULL;
651 p->code_write_count = 0;
654 /* Set to NULL all the 'first_tb' fields in all PageDescs. */
655 static void page_flush_tb_1(int level, void **lp)
657 int i;
659 if (*lp == NULL) {
660 return;
662 if (level == 0) {
663 PageDesc *pd = *lp;
665 for (i = 0; i < V_L2_SIZE; ++i) {
666 pd[i].first_tb = NULL;
667 invalidate_page_bitmap(pd + i);
669 } else {
670 void **pp = *lp;
672 for (i = 0; i < V_L2_SIZE; ++i) {
673 page_flush_tb_1(level - 1, pp + i);
678 static void page_flush_tb(void)
680 int i;
682 for (i = 0; i < V_L1_SIZE; i++) {
683 page_flush_tb_1(V_L1_SHIFT / V_L2_BITS - 1, l1_map + i);
687 /* flush all the translation blocks */
688 /* XXX: tb_flush is currently not thread safe */
689 void tb_flush(CPUArchState *env1)
691 CPUState *cpu = ENV_GET_CPU(env1);
693 #if defined(DEBUG_FLUSH)
694 printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
695 (unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer),
696 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.tb_ctx.nb_tbs > 0 ?
697 ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)) /
698 tcg_ctx.tb_ctx.nb_tbs : 0);
699 #endif
700 if ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)
701 > tcg_ctx.code_gen_buffer_size) {
702 cpu_abort(cpu, "Internal error: code buffer overflow\n");
704 tcg_ctx.tb_ctx.nb_tbs = 0;
706 CPU_FOREACH(cpu) {
707 memset(cpu->tb_jmp_cache, 0, sizeof(cpu->tb_jmp_cache));
710 memset(tcg_ctx.tb_ctx.tb_phys_hash, 0, sizeof(tcg_ctx.tb_ctx.tb_phys_hash));
711 page_flush_tb();
713 tcg_ctx.code_gen_ptr = tcg_ctx.code_gen_buffer;
714 /* XXX: flush processor icache at this point if cache flush is
715 expensive */
716 tcg_ctx.tb_ctx.tb_flush_count++;
719 #ifdef DEBUG_TB_CHECK
721 static void tb_invalidate_check(target_ulong address)
723 TranslationBlock *tb;
724 int i;
726 address &= TARGET_PAGE_MASK;
727 for (i = 0; i < CODE_GEN_PHYS_HASH_SIZE; i++) {
728 for (tb = tb_ctx.tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
729 if (!(address + TARGET_PAGE_SIZE <= tb->pc ||
730 address >= tb->pc + tb->size)) {
731 printf("ERROR invalidate: address=" TARGET_FMT_lx
732 " PC=%08lx size=%04x\n",
733 address, (long)tb->pc, tb->size);
739 /* verify that all the pages have correct rights for code */
740 static void tb_page_check(void)
742 TranslationBlock *tb;
743 int i, flags1, flags2;
745 for (i = 0; i < CODE_GEN_PHYS_HASH_SIZE; i++) {
746 for (tb = tcg_ctx.tb_ctx.tb_phys_hash[i]; tb != NULL;
747 tb = tb->phys_hash_next) {
748 flags1 = page_get_flags(tb->pc);
749 flags2 = page_get_flags(tb->pc + tb->size - 1);
750 if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
751 printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
752 (long)tb->pc, tb->size, flags1, flags2);
758 #endif
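/* The helpers below unlink a TB from the lists it sits on.  Entries in a
 * page's TB list and in the jump lists are tagged pointers: the low two bits
 * hold the slot index (0 or 1) through which the next TB is linked, and a
 * tag of 2 marks the jmp_first pointer that closes the circular jump list.  */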
760 static inline void tb_hash_remove(TranslationBlock **ptb, TranslationBlock *tb)
762 TranslationBlock *tb1;
764 for (;;) {
765 tb1 = *ptb;
766 if (tb1 == tb) {
767 *ptb = tb1->phys_hash_next;
768 break;
770 ptb = &tb1->phys_hash_next;
774 static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
776 TranslationBlock *tb1;
777 unsigned int n1;
779 for (;;) {
780 tb1 = *ptb;
781 n1 = (uintptr_t)tb1 & 3;
782 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
783 if (tb1 == tb) {
784 *ptb = tb1->page_next[n1];
785 break;
787 ptb = &tb1->page_next[n1];
791 static inline void tb_jmp_remove(TranslationBlock *tb, int n)
793 TranslationBlock *tb1, **ptb;
794 unsigned int n1;
796 ptb = &tb->jmp_next[n];
797 tb1 = *ptb;
798 if (tb1) {
799 /* find tb(n) in circular list */
800 for (;;) {
801 tb1 = *ptb;
802 n1 = (uintptr_t)tb1 & 3;
803 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
804 if (n1 == n && tb1 == tb) {
805 break;
807 if (n1 == 2) {
808 ptb = &tb1->jmp_first;
809 } else {
810 ptb = &tb1->jmp_next[n1];
813 /* now we can suppress tb(n) from the list */
814 *ptb = tb->jmp_next[n];
816 tb->jmp_next[n] = NULL;
820 /* reset the jump entry 'n' of a TB so that it is not chained to
821 another TB */
822 static inline void tb_reset_jump(TranslationBlock *tb, int n)
824 tb_set_jmp_target(tb, n, (uintptr_t)(tb->tc_ptr + tb->tb_next_offset[n]));
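/* Removing a TB means unlinking it from three places: the physical-PC hash
 * table, the per-page TB lists, and the jump lists of every TB that chained
 * to it (those jumps are reset so they fall back to the TB-exit path).  Any
 * per-CPU tb_jmp_cache entries pointing at the TB are cleared as well.  */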
827 /* invalidate one TB */
828 void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
830 CPUState *cpu;
831 PageDesc *p;
832 unsigned int h, n1;
833 tb_page_addr_t phys_pc;
834 TranslationBlock *tb1, *tb2;
836 /* remove the TB from the hash list */
837 phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
838 h = tb_phys_hash_func(phys_pc);
839 tb_hash_remove(&tcg_ctx.tb_ctx.tb_phys_hash[h], tb);
841 /* remove the TB from the page list */
842 if (tb->page_addr[0] != page_addr) {
843 p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
844 tb_page_remove(&p->first_tb, tb);
845 invalidate_page_bitmap(p);
847 if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
848 p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
849 tb_page_remove(&p->first_tb, tb);
850 invalidate_page_bitmap(p);
853 tcg_ctx.tb_ctx.tb_invalidated_flag = 1;
855 /* remove the TB from the hash list */
856 h = tb_jmp_cache_hash_func(tb->pc);
857 CPU_FOREACH(cpu) {
858 if (cpu->tb_jmp_cache[h] == tb) {
859 cpu->tb_jmp_cache[h] = NULL;
863 /* suppress this TB from the two jump lists */
864 tb_jmp_remove(tb, 0);
865 tb_jmp_remove(tb, 1);
867 /* suppress any remaining jumps to this TB */
868 tb1 = tb->jmp_first;
869 for (;;) {
870 n1 = (uintptr_t)tb1 & 3;
871 if (n1 == 2) {
872 break;
874 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
875 tb2 = tb1->jmp_next[n1];
876 tb_reset_jump(tb1, n1);
877 tb1->jmp_next[n1] = NULL;
878 tb1 = tb2;
880 tb->jmp_first = (TranslationBlock *)((uintptr_t)tb | 2); /* fail safe */
882 tcg_ctx.tb_ctx.tb_phys_invalidate_count++;
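/* set_bits() marks bits [start, start + len) in the bitmap 'tab', one bit per
 * guest byte.  build_page_bitmap() uses it to record which bytes of a page
 * are covered by translated code, so that tb_invalidate_phys_page_fast() can
 * skip writes that do not touch any TB.  */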
885 static inline void set_bits(uint8_t *tab, int start, int len)
887 int end, mask, end1;
889 end = start + len;
890 tab += start >> 3;
891 mask = 0xff << (start & 7);
892 if ((start & ~7) == (end & ~7)) {
893 if (start < end) {
894 mask &= ~(0xff << (end & 7));
895 *tab |= mask;
897 } else {
898 *tab++ |= mask;
899 start = (start + 8) & ~7;
900 end1 = end & ~7;
901 while (start < end1) {
902 *tab++ = 0xff;
903 start += 8;
905 if (start < end) {
906 mask = ~(0xff << (end & 7));
907 *tab |= mask;
912 static void build_page_bitmap(PageDesc *p)
914 int n, tb_start, tb_end;
915 TranslationBlock *tb;
917 p->code_bitmap = g_malloc0(TARGET_PAGE_SIZE / 8);
919 tb = p->first_tb;
920 while (tb != NULL) {
921 n = (uintptr_t)tb & 3;
922 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
923 /* NOTE: this is subtle as a TB may span two physical pages */
924 if (n == 0) {
925 /* NOTE: tb_end may be after the end of the page, but
926 it is not a problem */
927 tb_start = tb->pc & ~TARGET_PAGE_MASK;
928 tb_end = tb_start + tb->size;
929 if (tb_end > TARGET_PAGE_SIZE) {
930 tb_end = TARGET_PAGE_SIZE;
932 } else {
933 tb_start = 0;
934 tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
936 set_bits(p->code_bitmap, tb_start, tb_end - tb_start);
937 tb = tb->page_next[n];
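/* tb_gen_code() allocates a TranslationBlock for (pc, cs_base, flags),
 * translates it into the code generation buffer, and links it into the
 * physical page lists (both pages, if the block crosses a page boundary).
 * If the TB cache is full, the whole cache is flushed first and
 * tb_invalidated_flag tells callers that previously returned TB pointers
 * may be stale.  */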
941 TranslationBlock *tb_gen_code(CPUState *cpu,
942 target_ulong pc, target_ulong cs_base,
943 int flags, int cflags)
945 CPUArchState *env = cpu->env_ptr;
946 TranslationBlock *tb;
947 uint8_t *tc_ptr;
948 tb_page_addr_t phys_pc, phys_page2;
949 target_ulong virt_page2;
950 int code_gen_size;
952 phys_pc = get_page_addr_code(env, pc);
953 tb = tb_alloc(pc);
954 if (!tb) {
955 /* flush must be done */
956 tb_flush(env);
957 /* cannot fail at this point */
958 tb = tb_alloc(pc);
959 /* Don't forget to invalidate previous TB info. */
960 tcg_ctx.tb_ctx.tb_invalidated_flag = 1;
962 tc_ptr = tcg_ctx.code_gen_ptr;
963 tb->tc_ptr = tc_ptr;
964 tb->cs_base = cs_base;
965 tb->flags = flags;
966 tb->cflags = cflags;
967 cpu_gen_code(env, tb, &code_gen_size);
968 tcg_ctx.code_gen_ptr = (void *)(((uintptr_t)tcg_ctx.code_gen_ptr +
969 code_gen_size + CODE_GEN_ALIGN - 1) & ~(CODE_GEN_ALIGN - 1));
971 #if defined(CONFIG_USER_ONLY) && defined(TARGET_X86_64)
972 /* if we are doing vsyscall don't link the page as it lies in high memory
973 and tb_alloc_page will abort due to page_l1_map returning NULL */
974 if (unlikely(phys_pc >= TARGET_VSYSCALL_START
975 && phys_pc < TARGET_VSYSCALL_END))
976 return tb;
977 #endif
979 /* check next page if needed */
980 virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
981 phys_page2 = -1;
982 if ((pc & TARGET_PAGE_MASK) != virt_page2) {
983 phys_page2 = get_page_addr_code(env, virt_page2);
985 tb_link_page(tb, phys_pc, phys_page2);
986 return tb;
990 * Invalidate all TBs which intersect with the target physical address range
991  * [start, end).  NOTE: start and end may refer to *different* physical pages.
992 * 'is_cpu_write_access' should be true if called from a real cpu write
993 * access: the virtual CPU will exit the current TB if code is modified inside
994 * this TB.
996 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end,
997 int is_cpu_write_access)
999 while (start < end) {
1000 tb_invalidate_phys_page_range(start, end, is_cpu_write_access);
1001 start &= TARGET_PAGE_MASK;
1002 start += TARGET_PAGE_SIZE;
1007 * Invalidate all TBs which intersect with the target physical address range
1008  * [start, end).  NOTE: start and end must refer to the *same* physical page.
1009 * 'is_cpu_write_access' should be true if called from a real cpu write
1010 * access: the virtual CPU will exit the current TB if code is modified inside
1011 * this TB.
1013 void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
1014 int is_cpu_write_access)
1016 TranslationBlock *tb, *tb_next, *saved_tb;
1017 CPUState *cpu = current_cpu;
1018 #if defined(TARGET_HAS_PRECISE_SMC)
1019 CPUArchState *env = NULL;
1020 #endif
1021 tb_page_addr_t tb_start, tb_end;
1022 PageDesc *p;
1023 int n;
1024 #ifdef TARGET_HAS_PRECISE_SMC
1025 int current_tb_not_found = is_cpu_write_access;
1026 TranslationBlock *current_tb = NULL;
1027 int current_tb_modified = 0;
1028 target_ulong current_pc = 0;
1029 target_ulong current_cs_base = 0;
1030 int current_flags = 0;
1031 #endif /* TARGET_HAS_PRECISE_SMC */
1033 p = page_find(start >> TARGET_PAGE_BITS);
1034 if (!p) {
1035 return;
1037 if (!p->code_bitmap &&
1038 ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD &&
1039 is_cpu_write_access) {
1040 /* build code bitmap */
1041 build_page_bitmap(p);
1043 #if defined(TARGET_HAS_PRECISE_SMC)
1044 if (cpu != NULL) {
1045 env = cpu->env_ptr;
1047 #endif
1049 /* we remove all the TBs in the range [start, end[ */
1050 /* XXX: see if in some cases it could be faster to invalidate all
1051 the code */
1052 tb = p->first_tb;
1053 while (tb != NULL) {
1054 n = (uintptr_t)tb & 3;
1055 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1056 tb_next = tb->page_next[n];
1057 /* NOTE: this is subtle as a TB may span two physical pages */
1058 if (n == 0) {
1059 /* NOTE: tb_end may be after the end of the page, but
1060 it is not a problem */
1061 tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1062 tb_end = tb_start + tb->size;
1063 } else {
1064 tb_start = tb->page_addr[1];
1065 tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1067 if (!(tb_end <= start || tb_start >= end)) {
1068 #ifdef TARGET_HAS_PRECISE_SMC
1069 if (current_tb_not_found) {
1070 current_tb_not_found = 0;
1071 current_tb = NULL;
1072 if (cpu->mem_io_pc) {
1073 /* now we have a real cpu fault */
1074 current_tb = tb_find_pc(cpu->mem_io_pc);
1077 if (current_tb == tb &&
1078 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1079 /* If we are modifying the current TB, we must stop
1080 its execution. We could be more precise by checking
1081 that the modification is after the current PC, but it
1082 would require a specialized function to partially
1083 restore the CPU state */
1085 current_tb_modified = 1;
1086 cpu_restore_state_from_tb(cpu, current_tb, cpu->mem_io_pc);
1087 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1088 &current_flags);
1090 #endif /* TARGET_HAS_PRECISE_SMC */
1091 /* we need to do that to handle the case where a signal
1092 occurs while doing tb_phys_invalidate() */
1093 saved_tb = NULL;
1094 if (cpu != NULL) {
1095 saved_tb = cpu->current_tb;
1096 cpu->current_tb = NULL;
1098 tb_phys_invalidate(tb, -1);
1099 if (cpu != NULL) {
1100 cpu->current_tb = saved_tb;
1101 if (cpu->interrupt_request && cpu->current_tb) {
1102 cpu_interrupt(cpu, cpu->interrupt_request);
1106 tb = tb_next;
1108 #if !defined(CONFIG_USER_ONLY)
1109 /* if no code remaining, no need to continue to use slow writes */
1110 if (!p->first_tb) {
1111 invalidate_page_bitmap(p);
1112 if (is_cpu_write_access) {
1113 tlb_unprotect_code_phys(cpu, start, cpu->mem_io_vaddr);
1116 #endif
1117 #ifdef TARGET_HAS_PRECISE_SMC
1118 if (current_tb_modified) {
1119 /* we generate a block containing just the instruction
1120 modifying the memory. It will ensure that it cannot modify
1121 itself */
1122 cpu->current_tb = NULL;
1123 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1124 cpu_resume_from_signal(cpu, NULL);
1126 #endif
1129 /* len must be <= 8 and start must be a multiple of len */
1130 void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
1132 PageDesc *p;
1133 int offset, b;
1135 #if 0
1136 if (1) {
1137 qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
1138 cpu_single_env->mem_io_vaddr, len,
1139 cpu_single_env->eip,
1140 cpu_single_env->eip +
1141 (intptr_t)cpu_single_env->segs[R_CS].base);
1143 #endif
1144 p = page_find(start >> TARGET_PAGE_BITS);
1145 if (!p) {
1146 return;
1148 if (p->code_bitmap) {
1149 offset = start & ~TARGET_PAGE_MASK;
1150 b = p->code_bitmap[offset >> 3] >> (offset & 7);
1151 if (b & ((1 << len) - 1)) {
1152 goto do_invalidate;
1154 } else {
1155 do_invalidate:
1156 tb_invalidate_phys_page_range(start, start + len, 1);
1160 #if !defined(CONFIG_SOFTMMU)
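/* user-mode only: invalidate every TB that intersects the single guest page
 * containing 'addr'.  Called when a write-protected code page is being made
 * writable again (page_unprotect() / page_set_flags()); if the faulting write
 * came from the TB currently executing, that TB is regenerated with a count
 * of one instruction and execution restarts via cpu_resume_from_signal().  */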
1161 static void tb_invalidate_phys_page(tb_page_addr_t addr,
1162 uintptr_t pc, void *puc,
1163 bool locked)
1165 TranslationBlock *tb;
1166 PageDesc *p;
1167 int n;
1168 #ifdef TARGET_HAS_PRECISE_SMC
1169 TranslationBlock *current_tb = NULL;
1170 CPUState *cpu = current_cpu;
1171 CPUArchState *env = NULL;
1172 int current_tb_modified = 0;
1173 target_ulong current_pc = 0;
1174 target_ulong current_cs_base = 0;
1175 int current_flags = 0;
1176 #endif
1178 addr &= TARGET_PAGE_MASK;
1179 p = page_find(addr >> TARGET_PAGE_BITS);
1180 if (!p) {
1181 return;
1183 tb = p->first_tb;
1184 #ifdef TARGET_HAS_PRECISE_SMC
1185 if (tb && pc != 0) {
1186 current_tb = tb_find_pc(pc);
1188 if (cpu != NULL) {
1189 env = cpu->env_ptr;
1191 #endif
1192 while (tb != NULL) {
1193 n = (uintptr_t)tb & 3;
1194 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1195 #ifdef TARGET_HAS_PRECISE_SMC
1196 if (current_tb == tb &&
1197 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1198 /* If we are modifying the current TB, we must stop
1199 its execution. We could be more precise by checking
1200 that the modification is after the current PC, but it
1201 would require a specialized function to partially
1202 restore the CPU state */
1204 current_tb_modified = 1;
1205 cpu_restore_state_from_tb(cpu, current_tb, pc);
1206 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1207 &current_flags);
1209 #endif /* TARGET_HAS_PRECISE_SMC */
1210 tb_phys_invalidate(tb, addr);
1211 tb = tb->page_next[n];
1213 p->first_tb = NULL;
1214 #ifdef TARGET_HAS_PRECISE_SMC
1215 if (current_tb_modified) {
1216 /* we generate a block containing just the instruction
1217 modifying the memory. It will ensure that it cannot modify
1218 itself */
1219 cpu->current_tb = NULL;
1220 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1221 if (locked) {
1222 mmap_unlock();
1224 cpu_resume_from_signal(cpu, puc);
1226 #endif
1228 #endif
1230 /* add the tb in the target page and protect it if necessary */
1231 static inline void tb_alloc_page(TranslationBlock *tb,
1232 unsigned int n, tb_page_addr_t page_addr)
1234 PageDesc *p;
1235 #ifndef CONFIG_USER_ONLY
1236 bool page_already_protected;
1237 #endif
1239 tb->page_addr[n] = page_addr;
1240 p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
1241 tb->page_next[n] = p->first_tb;
1242 #ifndef CONFIG_USER_ONLY
1243 page_already_protected = p->first_tb != NULL;
1244 #endif
1245 p->first_tb = (TranslationBlock *)((uintptr_t)tb | n);
1246 invalidate_page_bitmap(p);
1248 #if defined(TARGET_HAS_SMC) || 1
1250 #if defined(CONFIG_USER_ONLY)
1251 if (p->flags & PAGE_WRITE) {
1252 target_ulong addr;
1253 PageDesc *p2;
1254 int prot;
1256 /* force the host page as non writable (writes will have a
1257 page fault + mprotect overhead) */
1258 page_addr &= qemu_host_page_mask;
1259 prot = 0;
1260 for (addr = page_addr; addr < page_addr + qemu_host_page_size;
1261 addr += TARGET_PAGE_SIZE) {
1263 p2 = page_find(addr >> TARGET_PAGE_BITS);
1264 if (!p2) {
1265 continue;
1267 prot |= p2->flags;
1268 p2->flags &= ~PAGE_WRITE;
1270 mprotect(g2h(page_addr), qemu_host_page_size,
1271 (prot & PAGE_BITS) & ~PAGE_WRITE);
1272 #ifdef DEBUG_TB_INVALIDATE
1273 printf("protecting code page: 0x" TARGET_FMT_lx "\n",
1274 page_addr);
1275 #endif
1277 #else
1278 /* if some code is already present, then the pages are already
1279 protected. So we handle the case where only the first TB is
1280 allocated in a physical page */
1281 if (!page_already_protected) {
1282 tlb_protect_code(page_addr);
1284 #endif
1286 #endif /* TARGET_HAS_SMC */
1289 /* add a new TB and link it to the physical page tables. phys_page2 is
1290 (-1) to indicate that only one page contains the TB. */
1291 static void tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
1292 tb_page_addr_t phys_page2)
1294 unsigned int h;
1295 TranslationBlock **ptb;
1297 /* Grab the mmap lock to stop another thread invalidating this TB
1298 before we are done. */
1299 mmap_lock();
1300 /* add in the physical hash table */
1301 h = tb_phys_hash_func(phys_pc);
1302 ptb = &tcg_ctx.tb_ctx.tb_phys_hash[h];
1303 tb->phys_hash_next = *ptb;
1304 *ptb = tb;
1306 /* add in the page list */
1307 tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
1308 if (phys_page2 != -1) {
1309 tb_alloc_page(tb, 1, phys_page2);
1310 } else {
1311 tb->page_addr[1] = -1;
1314 tb->jmp_first = (TranslationBlock *)((uintptr_t)tb | 2);
1315 tb->jmp_next[0] = NULL;
1316 tb->jmp_next[1] = NULL;
1318 /* init original jump addresses */
1319 if (tb->tb_next_offset[0] != 0xffff) {
1320 tb_reset_jump(tb, 0);
1322 if (tb->tb_next_offset[1] != 0xffff) {
1323 tb_reset_jump(tb, 1);
1326 #ifdef DEBUG_TB_CHECK
1327 tb_page_check();
1328 #endif
1329 mmap_unlock();
1332 /* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
1333 tb[1].tc_ptr. Return NULL if not found */
1334 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr)
1336 int m_min, m_max, m;
1337 uintptr_t v;
1338 TranslationBlock *tb;
1340 if (tcg_ctx.tb_ctx.nb_tbs <= 0) {
1341 return NULL;
1343 if (tc_ptr < (uintptr_t)tcg_ctx.code_gen_buffer ||
1344 tc_ptr >= (uintptr_t)tcg_ctx.code_gen_ptr) {
1345 return NULL;
1347 /* binary search (cf Knuth) */
1348 m_min = 0;
1349 m_max = tcg_ctx.tb_ctx.nb_tbs - 1;
1350 while (m_min <= m_max) {
1351 m = (m_min + m_max) >> 1;
1352 tb = &tcg_ctx.tb_ctx.tbs[m];
1353 v = (uintptr_t)tb->tc_ptr;
1354 if (v == tc_ptr) {
1355 return tb;
1356 } else if (tc_ptr < v) {
1357 m_max = m - 1;
1358 } else {
1359 m_min = m + 1;
1362 return &tcg_ctx.tb_ctx.tbs[m_max];
1365 #if defined(TARGET_HAS_ICE) && !defined(CONFIG_USER_ONLY)
1366 void tb_invalidate_phys_addr(AddressSpace *as, hwaddr addr)
1368 ram_addr_t ram_addr;
1369 MemoryRegion *mr;
1370 hwaddr l = 1;
1372 mr = address_space_translate(as, addr, &addr, &l, false);
1373 if (!(memory_region_is_ram(mr)
1374 || memory_region_is_romd(mr))) {
1375 return;
1377 ram_addr = (memory_region_get_ram_addr(mr) & TARGET_PAGE_MASK)
1378 + addr;
1379 tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
1381 #endif /* TARGET_HAS_ICE && !defined(CONFIG_USER_ONLY) */
1383 void tb_check_watchpoint(CPUState *cpu)
1385 TranslationBlock *tb;
1387 tb = tb_find_pc(cpu->mem_io_pc);
1388 if (!tb) {
1389 cpu_abort(cpu, "check_watchpoint: could not find TB for pc=%p",
1390 (void *)cpu->mem_io_pc);
1392 cpu_restore_state_from_tb(cpu, tb, cpu->mem_io_pc);
1393 tb_phys_invalidate(tb, -1);
1396 #ifndef CONFIG_USER_ONLY
1397 /* mask must never be zero, except for A20 change call */
1398 static void tcg_handle_interrupt(CPUState *cpu, int mask)
1400 int old_mask;
1402 old_mask = cpu->interrupt_request;
1403 cpu->interrupt_request |= mask;
1406 * If called from iothread context, wake the target cpu in
1407      * case it's halted.
1409 if (!qemu_cpu_is_self(cpu)) {
1410 qemu_cpu_kick(cpu);
1411 return;
1414 if (use_icount) {
1415 cpu->icount_decr.u16.high = 0xffff;
1416 if (!cpu_can_do_io(cpu)
1417 && (mask & ~old_mask) != 0) {
1418 cpu_abort(cpu, "Raised interrupt while not in I/O function");
1420 } else {
1421 cpu->tcg_exit_req = 1;
1425 CPUInterruptHandler cpu_interrupt_handler = tcg_handle_interrupt;
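/* cpu_io_recompile() handles the icount case where an I/O instruction is
 * reached in the middle of a TB: it works out how many instructions of the
 * TB have already executed, invalidates the TB, regenerates it with
 * CF_LAST_IO and an instruction count that makes the I/O insn the final one,
 * and then restarts execution.  MIPS and SH4 need special treatment because
 * a delay-slot instruction cannot be restarted on its own.  */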
1427 /* in deterministic execution mode, instructions doing device I/Os
1428 must be at the end of the TB */
1429 void cpu_io_recompile(CPUState *cpu, uintptr_t retaddr)
1431 #if defined(TARGET_MIPS) || defined(TARGET_SH4)
1432 CPUArchState *env = cpu->env_ptr;
1433 #endif
1434 TranslationBlock *tb;
1435 uint32_t n, cflags;
1436 target_ulong pc, cs_base;
1437 uint64_t flags;
1439 tb = tb_find_pc(retaddr);
1440 if (!tb) {
1441 cpu_abort(cpu, "cpu_io_recompile: could not find TB for pc=%p",
1442 (void *)retaddr);
1444 n = cpu->icount_decr.u16.low + tb->icount;
1445 cpu_restore_state_from_tb(cpu, tb, retaddr);
1446 /* Calculate how many instructions had been executed before the fault
1447 occurred. */
1448 n = n - cpu->icount_decr.u16.low;
1449 /* Generate a new TB ending on the I/O insn. */
1450 n++;
1451 /* On MIPS and SH, delay slot instructions can only be restarted if
1452 they were already the first instruction in the TB. If this is not
1453 the first instruction in a TB then re-execute the preceding
1454 branch. */
1455 #if defined(TARGET_MIPS)
1456 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
1457 env->active_tc.PC -= 4;
1458 cpu->icount_decr.u16.low++;
1459 env->hflags &= ~MIPS_HFLAG_BMASK;
1461 #elif defined(TARGET_SH4)
1462 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
1463 && n > 1) {
1464 env->pc -= 2;
1465 cpu->icount_decr.u16.low++;
1466 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
1468 #endif
1469 /* This should never happen. */
1470 if (n > CF_COUNT_MASK) {
1471 cpu_abort(cpu, "TB too big during recompile");
1474 cflags = n | CF_LAST_IO;
1475 pc = tb->pc;
1476 cs_base = tb->cs_base;
1477 flags = tb->flags;
1478 tb_phys_invalidate(tb, -1);
1479 /* FIXME: In theory this could raise an exception. In practice
1480 we have already translated the block once so it's probably ok. */
1481 tb_gen_code(cpu, pc, cs_base, flags, cflags);
1482 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
1483 the first in the TB) then we end up generating a whole new TB and
1484 repeating the fault, which is horribly inefficient.
1485 Better would be to execute just this insn uncached, or generate a
1486 second new TB. */
1487 cpu_resume_from_signal(cpu, NULL);
1490 void tb_flush_jmp_cache(CPUState *cpu, target_ulong addr)
1492 unsigned int i;
1494 /* Discard jump cache entries for any tb which might potentially
1495 overlap the flushed page. */
1496 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1497 memset(&cpu->tb_jmp_cache[i], 0,
1498 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1500 i = tb_jmp_cache_hash_page(addr);
1501 memset(&cpu->tb_jmp_cache[i], 0,
1502 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
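/* dump_exec_info() prints translation-buffer statistics (generated code size,
 * TB counts, average sizes, cross-page and direct-jump ratios, flush counts)
 * to the given stream; it backs the 'info jit' monitor command.  */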
1505 void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
1507 int i, target_code_size, max_target_code_size;
1508 int direct_jmp_count, direct_jmp2_count, cross_page;
1509 TranslationBlock *tb;
1511 target_code_size = 0;
1512 max_target_code_size = 0;
1513 cross_page = 0;
1514 direct_jmp_count = 0;
1515 direct_jmp2_count = 0;
1516 for (i = 0; i < tcg_ctx.tb_ctx.nb_tbs; i++) {
1517 tb = &tcg_ctx.tb_ctx.tbs[i];
1518 target_code_size += tb->size;
1519 if (tb->size > max_target_code_size) {
1520 max_target_code_size = tb->size;
1522 if (tb->page_addr[1] != -1) {
1523 cross_page++;
1525 if (tb->tb_next_offset[0] != 0xffff) {
1526 direct_jmp_count++;
1527 if (tb->tb_next_offset[1] != 0xffff) {
1528 direct_jmp2_count++;
1532 /* XXX: avoid using doubles ? */
1533 cpu_fprintf(f, "Translation buffer state:\n");
1534 cpu_fprintf(f, "gen code size %td/%zd\n",
1535 tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer,
1536 tcg_ctx.code_gen_buffer_max_size);
1537 cpu_fprintf(f, "TB count %d/%d\n",
1538 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.code_gen_max_blocks);
1539 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
1540 tcg_ctx.tb_ctx.nb_tbs ? target_code_size /
1541 tcg_ctx.tb_ctx.nb_tbs : 0,
1542 max_target_code_size);
1543 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
1544 tcg_ctx.tb_ctx.nb_tbs ? (tcg_ctx.code_gen_ptr -
1545 tcg_ctx.code_gen_buffer) /
1546 tcg_ctx.tb_ctx.nb_tbs : 0,
1547 target_code_size ? (double) (tcg_ctx.code_gen_ptr -
1548 tcg_ctx.code_gen_buffer) /
1549 target_code_size : 0);
1550 cpu_fprintf(f, "cross page TB count %d (%d%%)\n", cross_page,
1551 tcg_ctx.tb_ctx.nb_tbs ? (cross_page * 100) /
1552 tcg_ctx.tb_ctx.nb_tbs : 0);
1553 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
1554 direct_jmp_count,
1555 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp_count * 100) /
1556 tcg_ctx.tb_ctx.nb_tbs : 0,
1557 direct_jmp2_count,
1558 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp2_count * 100) /
1559 tcg_ctx.tb_ctx.nb_tbs : 0);
1560 cpu_fprintf(f, "\nStatistics:\n");
1561 cpu_fprintf(f, "TB flush count %d\n", tcg_ctx.tb_ctx.tb_flush_count);
1562 cpu_fprintf(f, "TB invalidate count %d\n",
1563 tcg_ctx.tb_ctx.tb_phys_invalidate_count);
1564 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
1565 tcg_dump_info(f, cpu_fprintf);
1568 #else /* CONFIG_USER_ONLY */
1570 void cpu_interrupt(CPUState *cpu, int mask)
1572 cpu->interrupt_request |= mask;
1573 cpu->tcg_exit_req = 1;
1577 * Walks guest process memory "regions" one by one
1578 * and calls callback function 'fn' for each region.
1580 struct walk_memory_regions_data {
1581 walk_memory_regions_fn fn;
1582 void *priv;
1583 uintptr_t start;
1584 int prot;
1587 static int walk_memory_regions_end(struct walk_memory_regions_data *data,
1588 abi_ulong end, int new_prot)
1590 if (data->start != -1ul) {
1591 int rc = data->fn(data->priv, data->start, end, data->prot);
1592 if (rc != 0) {
1593 return rc;
1597 data->start = (new_prot ? end : -1ul);
1598 data->prot = new_prot;
1600 return 0;
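/* walk_memory_regions_1() recursively descends one level of the l1_map radix
 * tree, coalescing runs of pages with identical protection flags into single
 * [start, end) regions that are reported through walk_memory_regions_end().  */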
1603 static int walk_memory_regions_1(struct walk_memory_regions_data *data,
1604 abi_ulong base, int level, void **lp)
1606 abi_ulong pa;
1607 int i, rc;
1609 if (*lp == NULL) {
1610 return walk_memory_regions_end(data, base, 0);
1613 if (level == 0) {
1614 PageDesc *pd = *lp;
1616 for (i = 0; i < V_L2_SIZE; ++i) {
1617 int prot = pd[i].flags;
1619 pa = base | (i << TARGET_PAGE_BITS);
1620 if (prot != data->prot) {
1621 rc = walk_memory_regions_end(data, pa, prot);
1622 if (rc != 0) {
1623 return rc;
1627 } else {
1628 void **pp = *lp;
1630 for (i = 0; i < V_L2_SIZE; ++i) {
1631 pa = base | ((abi_ulong)i <<
1632 (TARGET_PAGE_BITS + V_L2_BITS * level));
1633 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
1634 if (rc != 0) {
1635 return rc;
1640 return 0;
1643 int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
1645 struct walk_memory_regions_data data;
1646 uintptr_t i;
1648 data.fn = fn;
1649 data.priv = priv;
1650 data.start = -1ul;
1651 data.prot = 0;
1653 for (i = 0; i < V_L1_SIZE; i++) {
1654 int rc = walk_memory_regions_1(&data, (abi_ulong)i << V_L1_SHIFT,
1655 V_L1_SHIFT / V_L2_BITS - 1, l1_map + i);
1657 if (rc != 0) {
1658 return rc;
1662 return walk_memory_regions_end(&data, 0, 0);
1665 static int dump_region(void *priv, abi_ulong start,
1666 abi_ulong end, abi_ulong prot)
1668 FILE *f = (FILE *)priv;
1670 (void) fprintf(f, TARGET_ABI_FMT_lx"-"TARGET_ABI_FMT_lx
1671 " "TARGET_ABI_FMT_lx" %c%c%c\n",
1672 start, end, end - start,
1673 ((prot & PAGE_READ) ? 'r' : '-'),
1674 ((prot & PAGE_WRITE) ? 'w' : '-'),
1675 ((prot & PAGE_EXEC) ? 'x' : '-'));
1677 return 0;
1680 /* dump memory mappings */
1681 void page_dump(FILE *f)
1683 const int length = sizeof(abi_ulong) * 2;
1684 (void) fprintf(f, "%-*s %-*s %-*s %s\n",
1685 length, "start", length, "end", length, "size", "prot");
1686 walk_memory_regions(f, dump_region);
1689 int page_get_flags(target_ulong address)
1691 PageDesc *p;
1693 p = page_find(address >> TARGET_PAGE_BITS);
1694 if (!p) {
1695 return 0;
1697 return p->flags;
1700 /* Modify the flags of a page and invalidate the code if necessary.
1701 The flag PAGE_WRITE_ORG is positioned automatically depending
1702 on PAGE_WRITE. The mmap_lock should already be held. */
1703 void page_set_flags(target_ulong start, target_ulong end, int flags)
1705 target_ulong addr, len;
1707 /* This function should never be called with addresses outside the
1708 guest address space. If this assert fires, it probably indicates
1709 a missing call to h2g_valid. */
1710 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
1711 assert(end < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
1712 #endif
1713 assert(start < end);
1715 start = start & TARGET_PAGE_MASK;
1716 end = TARGET_PAGE_ALIGN(end);
1718 if (flags & PAGE_WRITE) {
1719 flags |= PAGE_WRITE_ORG;
1722 for (addr = start, len = end - start;
1723 len != 0;
1724 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
1725 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
1727 /* If the write protection bit is set, then we invalidate
1728 the code inside. */
1729 if (!(p->flags & PAGE_WRITE) &&
1730 (flags & PAGE_WRITE) &&
1731 p->first_tb) {
1732 tb_invalidate_phys_page(addr, 0, NULL, false);
1734 p->flags = flags;
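/* page_check_range() verifies that every page in [start, start + len) is
 * mapped with at least the access rights in 'flags'; for PAGE_WRITE it also
 * transparently unprotects pages that were made read-only because they
 * contain translated code.  Returns 0 on success, -1 otherwise.  */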
1738 int page_check_range(target_ulong start, target_ulong len, int flags)
1740 PageDesc *p;
1741 target_ulong end;
1742 target_ulong addr;
1744 /* This function should never be called with addresses outside the
1745 guest address space. If this assert fires, it probably indicates
1746 a missing call to h2g_valid. */
1747 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
1748 assert(start < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
1749 #endif
1751 if (len == 0) {
1752 return 0;
1754 if (start + len - 1 < start) {
1755 /* We've wrapped around. */
1756 return -1;
1759     /* must do before we lose bits in the next step */
1760 end = TARGET_PAGE_ALIGN(start + len);
1761 start = start & TARGET_PAGE_MASK;
1763 for (addr = start, len = end - start;
1764 len != 0;
1765 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
1766 p = page_find(addr >> TARGET_PAGE_BITS);
1767 if (!p) {
1768 return -1;
1770 if (!(p->flags & PAGE_VALID)) {
1771 return -1;
1774 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ)) {
1775 return -1;
1777 if (flags & PAGE_WRITE) {
1778 if (!(p->flags & PAGE_WRITE_ORG)) {
1779 return -1;
1781 /* unprotect the page if it was put read-only because it
1782 contains translated code */
1783 if (!(p->flags & PAGE_WRITE)) {
1784 if (!page_unprotect(addr, 0, NULL)) {
1785 return -1;
1788 return 0;
1791 return 0;
1794 /* called from signal handler: invalidate the code and unprotect the
1795 page. Return TRUE if the fault was successfully handled. */
1796 int page_unprotect(target_ulong address, uintptr_t pc, void *puc)
1798 unsigned int prot;
1799 PageDesc *p;
1800 target_ulong host_start, host_end, addr;
1802 /* Technically this isn't safe inside a signal handler. However we
1803 know this only ever happens in a synchronous SEGV handler, so in
1804 practice it seems to be ok. */
1805 mmap_lock();
1807 p = page_find(address >> TARGET_PAGE_BITS);
1808 if (!p) {
1809 mmap_unlock();
1810 return 0;
1813 /* if the page was really writable, then we change its
1814 protection back to writable */
1815 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
1816 host_start = address & qemu_host_page_mask;
1817 host_end = host_start + qemu_host_page_size;
1819 prot = 0;
1820 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
1821 p = page_find(addr >> TARGET_PAGE_BITS);
1822 p->flags |= PAGE_WRITE;
1823 prot |= p->flags;
1825 /* and since the content will be modified, we must invalidate
1826 the corresponding translated code. */
1827 tb_invalidate_phys_page(addr, pc, puc, true);
1828 #ifdef DEBUG_TB_CHECK
1829 tb_invalidate_check(addr);
1830 #endif
1832 mprotect((void *)g2h(host_start), qemu_host_page_size,
1833 prot & PAGE_BITS);
1835 mmap_unlock();
1836 return 1;
1838 mmap_unlock();
1839 return 0;
1841 #endif /* CONFIG_USER_ONLY */