Add qtest for vhost-user
[qemu.git] / translate-all.c
blob6b7b46e76176b0d68a7c758c480648450624c029
1 /*
2 * Host code generation
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
19 #ifdef _WIN32
20 #include <windows.h>
21 #else
22 #include <sys/types.h>
23 #include <sys/mman.h>
24 #endif
25 #include <stdarg.h>
26 #include <stdlib.h>
27 #include <stdio.h>
28 #include <string.h>
29 #include <inttypes.h>
31 #include "config.h"
33 #include "qemu-common.h"
34 #define NO_CPU_IO_DEFS
35 #include "cpu.h"
36 #include "disas/disas.h"
37 #include "tcg.h"
38 #if defined(CONFIG_USER_ONLY)
39 #include "qemu.h"
40 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
41 #include <sys/param.h>
42 #if __FreeBSD_version >= 700104
43 #define HAVE_KINFO_GETVMMAP
44 #define sigqueue sigqueue_freebsd /* avoid redefinition */
45 #include <sys/time.h>
46 #include <sys/proc.h>
47 #include <machine/profile.h>
48 #define _KERNEL
49 #include <sys/user.h>
50 #undef _KERNEL
51 #undef sigqueue
52 #include <libutil.h>
53 #endif
54 #endif
55 #else
56 #include "exec/address-spaces.h"
57 #endif
59 #include "exec/cputlb.h"
60 #include "translate-all.h"
61 #include "qemu/timer.h"
63 //#define DEBUG_TB_INVALIDATE
64 //#define DEBUG_FLUSH
65 /* make various TB consistency checks */
66 //#define DEBUG_TB_CHECK
68 #if !defined(CONFIG_USER_ONLY)
69 /* TB consistency checks only implemented for usermode emulation. */
70 #undef DEBUG_TB_CHECK
71 #endif
73 #define SMC_BITMAP_USE_THRESHOLD 10
75 typedef struct PageDesc {
76 /* list of TBs intersecting this ram page */
77 TranslationBlock *first_tb;
78 /* in order to optimize self modifying code, we count the number
79 of lookups we do to a given page to use a bitmap */
80 unsigned int code_write_count;
81 uint8_t *code_bitmap;
82 #if defined(CONFIG_USER_ONLY)
83 unsigned long flags;
84 #endif
85 } PageDesc;
87 /* In system mode we want L1_MAP to be based on ram offsets,
88 while in user mode we want it to be based on virtual addresses. */
89 #if !defined(CONFIG_USER_ONLY)
90 #if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
91 # define L1_MAP_ADDR_SPACE_BITS HOST_LONG_BITS
92 #else
93 # define L1_MAP_ADDR_SPACE_BITS TARGET_PHYS_ADDR_SPACE_BITS
94 #endif
95 #else
96 # define L1_MAP_ADDR_SPACE_BITS TARGET_VIRT_ADDR_SPACE_BITS
97 #endif
99 /* Size of the L2 (and L3, etc) page tables. */
100 #define V_L2_BITS 10
101 #define V_L2_SIZE (1 << V_L2_BITS)
103 /* The bits remaining after N lower levels of page tables. */
104 #define V_L1_BITS_REM \
105 ((L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % V_L2_BITS)
107 #if V_L1_BITS_REM < 4
108 #define V_L1_BITS (V_L1_BITS_REM + V_L2_BITS)
109 #else
110 #define V_L1_BITS V_L1_BITS_REM
111 #endif
113 #define V_L1_SIZE ((target_ulong)1 << V_L1_BITS)
115 #define V_L1_SHIFT (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - V_L1_BITS)
117 uintptr_t qemu_real_host_page_size;
118 uintptr_t qemu_host_page_size;
119 uintptr_t qemu_host_page_mask;
121 /* This is a multi-level map on the virtual address space.
122 The bottom level has pointers to PageDesc. */
123 static void *l1_map[V_L1_SIZE];
125 /* code generation context */
126 TCGContext tcg_ctx;
128 static void tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
129 tb_page_addr_t phys_page2);
130 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr);
132 void cpu_gen_init(void)
134 tcg_context_init(&tcg_ctx);
137 /* return non zero if the very first instruction is invalid so that
138 the virtual CPU can trigger an exception.
140 '*gen_code_size_ptr' contains the size of the generated code (host
141 code).
143 int cpu_gen_code(CPUArchState *env, TranslationBlock *tb, int *gen_code_size_ptr)
145 TCGContext *s = &tcg_ctx;
146 tcg_insn_unit *gen_code_buf;
147 int gen_code_size;
148 #ifdef CONFIG_PROFILER
149 int64_t ti;
150 #endif
152 #ifdef CONFIG_PROFILER
153 s->tb_count1++; /* includes aborted translations because of
154 exceptions */
155 ti = profile_getclock();
156 #endif
157 tcg_func_start(s);
159 gen_intermediate_code(env, tb);
161 /* generate machine code */
162 gen_code_buf = tb->tc_ptr;
163 tb->tb_next_offset[0] = 0xffff;
164 tb->tb_next_offset[1] = 0xffff;
165 s->tb_next_offset = tb->tb_next_offset;
166 #ifdef USE_DIRECT_JUMP
167 s->tb_jmp_offset = tb->tb_jmp_offset;
168 s->tb_next = NULL;
169 #else
170 s->tb_jmp_offset = NULL;
171 s->tb_next = tb->tb_next;
172 #endif
174 #ifdef CONFIG_PROFILER
175 s->tb_count++;
176 s->interm_time += profile_getclock() - ti;
177 s->code_time -= profile_getclock();
178 #endif
179 gen_code_size = tcg_gen_code(s, gen_code_buf);
180 *gen_code_size_ptr = gen_code_size;
181 #ifdef CONFIG_PROFILER
182 s->code_time += profile_getclock();
183 s->code_in_len += tb->size;
184 s->code_out_len += gen_code_size;
185 #endif
187 #ifdef DEBUG_DISAS
188 if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) {
189 qemu_log("OUT: [size=%d]\n", gen_code_size);
190 log_disas(tb->tc_ptr, gen_code_size);
191 qemu_log("\n");
192 qemu_log_flush();
194 #endif
195 return 0;
198 /* The cpu state corresponding to 'searched_pc' is restored.
200 static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
201 uintptr_t searched_pc)
203 CPUArchState *env = cpu->env_ptr;
204 TCGContext *s = &tcg_ctx;
205 int j;
206 uintptr_t tc_ptr;
207 #ifdef CONFIG_PROFILER
208 int64_t ti;
209 #endif
211 #ifdef CONFIG_PROFILER
212 ti = profile_getclock();
213 #endif
214 tcg_func_start(s);
216 gen_intermediate_code_pc(env, tb);
218 if (use_icount) {
219 /* Reset the cycle counter to the start of the block. */
220 cpu->icount_decr.u16.low += tb->icount;
221 /* Clear the IO flag. */
222 cpu->can_do_io = 0;
225 /* find opc index corresponding to search_pc */
226 tc_ptr = (uintptr_t)tb->tc_ptr;
227 if (searched_pc < tc_ptr)
228 return -1;
230 s->tb_next_offset = tb->tb_next_offset;
231 #ifdef USE_DIRECT_JUMP
232 s->tb_jmp_offset = tb->tb_jmp_offset;
233 s->tb_next = NULL;
234 #else
235 s->tb_jmp_offset = NULL;
236 s->tb_next = tb->tb_next;
237 #endif
238 j = tcg_gen_code_search_pc(s, (tcg_insn_unit *)tc_ptr,
239 searched_pc - tc_ptr);
240 if (j < 0)
241 return -1;
242 /* now find start of instruction before */
243 while (s->gen_opc_instr_start[j] == 0) {
244 j--;
246 cpu->icount_decr.u16.low -= s->gen_opc_icount[j];
248 restore_state_to_opc(env, tb, j);
250 #ifdef CONFIG_PROFILER
251 s->restore_time += profile_getclock() - ti;
252 s->restore_count++;
253 #endif
254 return 0;
257 bool cpu_restore_state(CPUState *cpu, uintptr_t retaddr)
259 TranslationBlock *tb;
261 tb = tb_find_pc(retaddr);
262 if (tb) {
263 cpu_restore_state_from_tb(cpu, tb, retaddr);
264 return true;
266 return false;
269 #ifdef _WIN32
270 static inline void map_exec(void *addr, long size)
272 DWORD old_protect;
273 VirtualProtect(addr, size,
274 PAGE_EXECUTE_READWRITE, &old_protect);
276 #else
277 static inline void map_exec(void *addr, long size)
279 unsigned long start, end, page_size;
281 page_size = getpagesize();
282 start = (unsigned long)addr;
283 start &= ~(page_size - 1);
285 end = (unsigned long)addr + size;
286 end += page_size - 1;
287 end &= ~(page_size - 1);
289 mprotect((void *)start, end - start,
290 PROT_READ | PROT_WRITE | PROT_EXEC);
292 #endif
294 void page_size_init(void)
296 /* NOTE: we can always suppose that qemu_host_page_size >=
297 TARGET_PAGE_SIZE */
298 #ifdef _WIN32
299 SYSTEM_INFO system_info;
301 GetSystemInfo(&system_info);
302 qemu_real_host_page_size = system_info.dwPageSize;
303 #else
304 qemu_real_host_page_size = getpagesize();
305 #endif
306 if (qemu_host_page_size == 0) {
307 qemu_host_page_size = qemu_real_host_page_size;
309 if (qemu_host_page_size < TARGET_PAGE_SIZE) {
310 qemu_host_page_size = TARGET_PAGE_SIZE;
312 qemu_host_page_mask = ~(qemu_host_page_size - 1);
315 static void page_init(void)
317 page_size_init();
318 #if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
320 #ifdef HAVE_KINFO_GETVMMAP
321 struct kinfo_vmentry *freep;
322 int i, cnt;
324 freep = kinfo_getvmmap(getpid(), &cnt);
325 if (freep) {
326 mmap_lock();
327 for (i = 0; i < cnt; i++) {
328 unsigned long startaddr, endaddr;
330 startaddr = freep[i].kve_start;
331 endaddr = freep[i].kve_end;
332 if (h2g_valid(startaddr)) {
333 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
335 if (h2g_valid(endaddr)) {
336 endaddr = h2g(endaddr);
337 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
338 } else {
339 #if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
340 endaddr = ~0ul;
341 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
342 #endif
346 free(freep);
347 mmap_unlock();
349 #else
350 FILE *f;
352 last_brk = (unsigned long)sbrk(0);
354 f = fopen("/compat/linux/proc/self/maps", "r");
355 if (f) {
356 mmap_lock();
358 do {
359 unsigned long startaddr, endaddr;
360 int n;
362 n = fscanf(f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);
364 if (n == 2 && h2g_valid(startaddr)) {
365 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
367 if (h2g_valid(endaddr)) {
368 endaddr = h2g(endaddr);
369 } else {
370 endaddr = ~0ul;
372 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
374 } while (!feof(f));
376 fclose(f);
377 mmap_unlock();
379 #endif
381 #endif
384 static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
386 PageDesc *pd;
387 void **lp;
388 int i;
390 #if defined(CONFIG_USER_ONLY)
391 /* We can't use g_malloc because it may recurse into a locked mutex. */
392 # define ALLOC(P, SIZE) \
393 do { \
394 P = mmap(NULL, SIZE, PROT_READ | PROT_WRITE, \
395 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); \
396 } while (0)
397 #else
398 # define ALLOC(P, SIZE) \
399 do { P = g_malloc0(SIZE); } while (0)
400 #endif
402 /* Level 1. Always allocated. */
403 lp = l1_map + ((index >> V_L1_SHIFT) & (V_L1_SIZE - 1));
405 /* Level 2..N-1. */
406 for (i = V_L1_SHIFT / V_L2_BITS - 1; i > 0; i--) {
407 void **p = *lp;
409 if (p == NULL) {
410 if (!alloc) {
411 return NULL;
413 ALLOC(p, sizeof(void *) * V_L2_SIZE);
414 *lp = p;
417 lp = p + ((index >> (i * V_L2_BITS)) & (V_L2_SIZE - 1));
420 pd = *lp;
421 if (pd == NULL) {
422 if (!alloc) {
423 return NULL;
425 ALLOC(pd, sizeof(PageDesc) * V_L2_SIZE);
426 *lp = pd;
429 #undef ALLOC
431 return pd + (index & (V_L2_SIZE - 1));
434 static inline PageDesc *page_find(tb_page_addr_t index)
436 return page_find_alloc(index, 0);
439 #if !defined(CONFIG_USER_ONLY)
440 #define mmap_lock() do { } while (0)
441 #define mmap_unlock() do { } while (0)
442 #endif
444 #if defined(CONFIG_USER_ONLY)
445 /* Currently it is not recommended to allocate big chunks of data in
446 user mode. It will change when a dedicated libc will be used. */
447 /* ??? 64-bit hosts ought to have no problem mmaping data outside the
448 region in which the guest needs to run. Revisit this. */
449 #define USE_STATIC_CODE_GEN_BUFFER
450 #endif
452 /* ??? Should configure for this, not list operating systems here. */
453 #if (defined(__linux__) \
454 || defined(__FreeBSD__) || defined(__FreeBSD_kernel__) \
455 || defined(__DragonFly__) || defined(__OpenBSD__) \
456 || defined(__NetBSD__))
457 # define USE_MMAP
458 #endif
460 /* Minimum size of the code gen buffer. This number is randomly chosen,
461 but not so small that we can't have a fair number of TB's live. */
462 #define MIN_CODE_GEN_BUFFER_SIZE (1024u * 1024)
464 /* Maximum size of the code gen buffer we'd like to use. Unless otherwise
465 indicated, this is constrained by the range of direct branches on the
466 host cpu, as used by the TCG implementation of goto_tb. */
467 #if defined(__x86_64__)
468 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
469 #elif defined(__sparc__)
470 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
471 #elif defined(__aarch64__)
472 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
473 #elif defined(__arm__)
474 # define MAX_CODE_GEN_BUFFER_SIZE (16u * 1024 * 1024)
475 #elif defined(__s390x__)
476 /* We have a +- 4GB range on the branches; leave some slop. */
477 # define MAX_CODE_GEN_BUFFER_SIZE (3ul * 1024 * 1024 * 1024)
478 #elif defined(__mips__)
479 /* We have a 256MB branch region, but leave room to make sure the
480 main executable is also within that region. */
481 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
482 #else
483 # define MAX_CODE_GEN_BUFFER_SIZE ((size_t)-1)
484 #endif
486 #define DEFAULT_CODE_GEN_BUFFER_SIZE_1 (32u * 1024 * 1024)
488 #define DEFAULT_CODE_GEN_BUFFER_SIZE \
489 (DEFAULT_CODE_GEN_BUFFER_SIZE_1 < MAX_CODE_GEN_BUFFER_SIZE \
490 ? DEFAULT_CODE_GEN_BUFFER_SIZE_1 : MAX_CODE_GEN_BUFFER_SIZE)
492 static inline size_t size_code_gen_buffer(size_t tb_size)
494 /* Size the buffer. */
495 if (tb_size == 0) {
496 #ifdef USE_STATIC_CODE_GEN_BUFFER
497 tb_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
498 #else
499 /* ??? Needs adjustments. */
500 /* ??? If we relax the requirement that CONFIG_USER_ONLY use the
501 static buffer, we could size this on RESERVED_VA, on the text
502 segment size of the executable, or continue to use the default. */
503 tb_size = (unsigned long)(ram_size / 4);
504 #endif
506 if (tb_size < MIN_CODE_GEN_BUFFER_SIZE) {
507 tb_size = MIN_CODE_GEN_BUFFER_SIZE;
509 if (tb_size > MAX_CODE_GEN_BUFFER_SIZE) {
510 tb_size = MAX_CODE_GEN_BUFFER_SIZE;
512 tcg_ctx.code_gen_buffer_size = tb_size;
513 return tb_size;
516 #ifdef __mips__
517 /* In order to use J and JAL within the code_gen_buffer, we require
518 that the buffer not cross a 256MB boundary. */
519 static inline bool cross_256mb(void *addr, size_t size)
521 return ((uintptr_t)addr ^ ((uintptr_t)addr + size)) & 0xf0000000;
524 /* We weren't able to allocate a buffer without crossing that boundary,
525 so make do with the larger portion of the buffer that doesn't cross.
526 Returns the new base of the buffer, and adjusts code_gen_buffer_size. */
527 static inline void *split_cross_256mb(void *buf1, size_t size1)
529 void *buf2 = (void *)(((uintptr_t)buf1 + size1) & 0xf0000000);
530 size_t size2 = buf1 + size1 - buf2;
532 size1 = buf2 - buf1;
533 if (size1 < size2) {
534 size1 = size2;
535 buf1 = buf2;
538 tcg_ctx.code_gen_buffer_size = size1;
539 return buf1;
541 #endif
543 #ifdef USE_STATIC_CODE_GEN_BUFFER
544 static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
545 __attribute__((aligned(CODE_GEN_ALIGN)));
547 static inline void *alloc_code_gen_buffer(void)
549 void *buf = static_code_gen_buffer;
550 #ifdef __mips__
551 if (cross_256mb(buf, tcg_ctx.code_gen_buffer_size)) {
552 buf = split_cross_256mb(buf, tcg_ctx.code_gen_buffer_size);
554 #endif
555 map_exec(buf, tcg_ctx.code_gen_buffer_size);
556 return buf;
558 #elif defined(USE_MMAP)
559 static inline void *alloc_code_gen_buffer(void)
561 int flags = MAP_PRIVATE | MAP_ANONYMOUS;
562 uintptr_t start = 0;
563 void *buf;
565 /* Constrain the position of the buffer based on the host cpu.
566 Note that these addresses are chosen in concert with the
567 addresses assigned in the relevant linker script file. */
568 # if defined(__PIE__) || defined(__PIC__)
569 /* Don't bother setting a preferred location if we're building
570 a position-independent executable. We're more likely to get
571 an address near the main executable if we let the kernel
572 choose the address. */
573 # elif defined(__x86_64__) && defined(MAP_32BIT)
574 /* Force the memory down into low memory with the executable.
575 Leave the choice of exact location with the kernel. */
576 flags |= MAP_32BIT;
577 /* Cannot expect to map more than 800MB in low memory. */
578 if (tcg_ctx.code_gen_buffer_size > 800u * 1024 * 1024) {
579 tcg_ctx.code_gen_buffer_size = 800u * 1024 * 1024;
581 # elif defined(__sparc__)
582 start = 0x40000000ul;
583 # elif defined(__s390x__)
584 start = 0x90000000ul;
585 # elif defined(__mips__)
586 /* ??? We ought to more explicitly manage layout for softmmu too. */
587 # ifdef CONFIG_USER_ONLY
588 start = 0x68000000ul;
589 # elif _MIPS_SIM == _ABI64
590 start = 0x128000000ul;
591 # else
592 start = 0x08000000ul;
593 # endif
594 # endif
596 buf = mmap((void *)start, tcg_ctx.code_gen_buffer_size,
597 PROT_WRITE | PROT_READ | PROT_EXEC, flags, -1, 0);
598 if (buf == MAP_FAILED) {
599 return NULL;
602 #ifdef __mips__
603 if (cross_256mb(buf, tcg_ctx.code_gen_buffer_size)) {
604 /* Try again, with the original still mapped, to avoid re-aquiring
605 that 256mb crossing. This time don't specify an address. */
606 size_t size2, size1 = tcg_ctx.code_gen_buffer_size;
607 void *buf2 = mmap(NULL, size1, PROT_WRITE | PROT_READ | PROT_EXEC,
608 flags, -1, 0);
609 if (buf2 != MAP_FAILED) {
610 if (!cross_256mb(buf2, size1)) {
611 /* Success! Use the new buffer. */
612 munmap(buf, size1);
613 return buf2;
615 /* Failure. Work with what we had. */
616 munmap(buf2, size1);
619 /* Split the original buffer. Free the smaller half. */
620 buf2 = split_cross_256mb(buf, size1);
621 size2 = tcg_ctx.code_gen_buffer_size;
622 munmap(buf + (buf == buf2 ? size2 : 0), size1 - size2);
623 return buf2;
625 #endif
627 return buf;
629 #else
630 static inline void *alloc_code_gen_buffer(void)
632 void *buf = g_malloc(tcg_ctx.code_gen_buffer_size);
634 if (buf == NULL) {
635 return NULL;
638 #ifdef __mips__
639 if (cross_256mb(buf, tcg_ctx.code_gen_buffer_size)) {
640 void *buf2 = g_malloc(tcg_ctx.code_gen_buffer_size);
641 if (buf2 != NULL && !cross_256mb(buf2, size1)) {
642 /* Success! Use the new buffer. */
643 free(buf);
644 buf = buf2;
645 } else {
646 /* Failure. Work with what we had. Since this is malloc
647 and not mmap, we can't free the other half. */
648 free(buf2);
649 buf = split_cross_256mb(buf, tcg_ctx.code_gen_buffer_size);
652 #endif
654 map_exec(buf, tcg_ctx.code_gen_buffer_size);
655 return buf;
657 #endif /* USE_STATIC_CODE_GEN_BUFFER, USE_MMAP */
659 static inline void code_gen_alloc(size_t tb_size)
661 tcg_ctx.code_gen_buffer_size = size_code_gen_buffer(tb_size);
662 tcg_ctx.code_gen_buffer = alloc_code_gen_buffer();
663 if (tcg_ctx.code_gen_buffer == NULL) {
664 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
665 exit(1);
668 qemu_madvise(tcg_ctx.code_gen_buffer, tcg_ctx.code_gen_buffer_size,
669 QEMU_MADV_HUGEPAGE);
671 /* Steal room for the prologue at the end of the buffer. This ensures
672 (via the MAX_CODE_GEN_BUFFER_SIZE limits above) that direct branches
673 from TB's to the prologue are going to be in range. It also means
674 that we don't need to mark (additional) portions of the data segment
675 as executable. */
676 tcg_ctx.code_gen_prologue = tcg_ctx.code_gen_buffer +
677 tcg_ctx.code_gen_buffer_size - 1024;
678 tcg_ctx.code_gen_buffer_size -= 1024;
680 tcg_ctx.code_gen_buffer_max_size = tcg_ctx.code_gen_buffer_size -
681 (TCG_MAX_OP_SIZE * OPC_BUF_SIZE);
682 tcg_ctx.code_gen_max_blocks = tcg_ctx.code_gen_buffer_size /
683 CODE_GEN_AVG_BLOCK_SIZE;
684 tcg_ctx.tb_ctx.tbs =
685 g_malloc(tcg_ctx.code_gen_max_blocks * sizeof(TranslationBlock));
688 /* Must be called before using the QEMU cpus. 'tb_size' is the size
689 (in bytes) allocated to the translation buffer. Zero means default
690 size. */
691 void tcg_exec_init(unsigned long tb_size)
693 cpu_gen_init();
694 code_gen_alloc(tb_size);
695 tcg_ctx.code_gen_ptr = tcg_ctx.code_gen_buffer;
696 tcg_register_jit(tcg_ctx.code_gen_buffer, tcg_ctx.code_gen_buffer_size);
697 page_init();
698 #if !defined(CONFIG_USER_ONLY) || !defined(CONFIG_USE_GUEST_BASE)
699 /* There's no guest base to take into account, so go ahead and
700 initialize the prologue now. */
701 tcg_prologue_init(&tcg_ctx);
702 #endif
705 bool tcg_enabled(void)
707 return tcg_ctx.code_gen_buffer != NULL;
710 /* Allocate a new translation block. Flush the translation buffer if
711 too many translation blocks or too much generated code. */
712 static TranslationBlock *tb_alloc(target_ulong pc)
714 TranslationBlock *tb;
716 if (tcg_ctx.tb_ctx.nb_tbs >= tcg_ctx.code_gen_max_blocks ||
717 (tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer) >=
718 tcg_ctx.code_gen_buffer_max_size) {
719 return NULL;
721 tb = &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs++];
722 tb->pc = pc;
723 tb->cflags = 0;
724 return tb;
727 void tb_free(TranslationBlock *tb)
729 /* In practice this is mostly used for single use temporary TB
730 Ignore the hard cases and just back up if this TB happens to
731 be the last one generated. */
732 if (tcg_ctx.tb_ctx.nb_tbs > 0 &&
733 tb == &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs - 1]) {
734 tcg_ctx.code_gen_ptr = tb->tc_ptr;
735 tcg_ctx.tb_ctx.nb_tbs--;
739 static inline void invalidate_page_bitmap(PageDesc *p)
741 if (p->code_bitmap) {
742 g_free(p->code_bitmap);
743 p->code_bitmap = NULL;
745 p->code_write_count = 0;
748 /* Set to NULL all the 'first_tb' fields in all PageDescs. */
749 static void page_flush_tb_1(int level, void **lp)
751 int i;
753 if (*lp == NULL) {
754 return;
756 if (level == 0) {
757 PageDesc *pd = *lp;
759 for (i = 0; i < V_L2_SIZE; ++i) {
760 pd[i].first_tb = NULL;
761 invalidate_page_bitmap(pd + i);
763 } else {
764 void **pp = *lp;
766 for (i = 0; i < V_L2_SIZE; ++i) {
767 page_flush_tb_1(level - 1, pp + i);
772 static void page_flush_tb(void)
774 int i;
776 for (i = 0; i < V_L1_SIZE; i++) {
777 page_flush_tb_1(V_L1_SHIFT / V_L2_BITS - 1, l1_map + i);
781 /* flush all the translation blocks */
782 /* XXX: tb_flush is currently not thread safe */
783 void tb_flush(CPUArchState *env1)
785 CPUState *cpu = ENV_GET_CPU(env1);
787 #if defined(DEBUG_FLUSH)
788 printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
789 (unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer),
790 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.tb_ctx.nb_tbs > 0 ?
791 ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)) /
792 tcg_ctx.tb_ctx.nb_tbs : 0);
793 #endif
794 if ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)
795 > tcg_ctx.code_gen_buffer_size) {
796 cpu_abort(cpu, "Internal error: code buffer overflow\n");
798 tcg_ctx.tb_ctx.nb_tbs = 0;
800 CPU_FOREACH(cpu) {
801 memset(cpu->tb_jmp_cache, 0, sizeof(cpu->tb_jmp_cache));
804 memset(tcg_ctx.tb_ctx.tb_phys_hash, 0, sizeof(tcg_ctx.tb_ctx.tb_phys_hash));
805 page_flush_tb();
807 tcg_ctx.code_gen_ptr = tcg_ctx.code_gen_buffer;
808 /* XXX: flush processor icache at this point if cache flush is
809 expensive */
810 tcg_ctx.tb_ctx.tb_flush_count++;
813 #ifdef DEBUG_TB_CHECK
815 static void tb_invalidate_check(target_ulong address)
817 TranslationBlock *tb;
818 int i;
820 address &= TARGET_PAGE_MASK;
821 for (i = 0; i < CODE_GEN_PHYS_HASH_SIZE; i++) {
822 for (tb = tb_ctx.tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
823 if (!(address + TARGET_PAGE_SIZE <= tb->pc ||
824 address >= tb->pc + tb->size)) {
825 printf("ERROR invalidate: address=" TARGET_FMT_lx
826 " PC=%08lx size=%04x\n",
827 address, (long)tb->pc, tb->size);
833 /* verify that all the pages have correct rights for code */
834 static void tb_page_check(void)
836 TranslationBlock *tb;
837 int i, flags1, flags2;
839 for (i = 0; i < CODE_GEN_PHYS_HASH_SIZE; i++) {
840 for (tb = tcg_ctx.tb_ctx.tb_phys_hash[i]; tb != NULL;
841 tb = tb->phys_hash_next) {
842 flags1 = page_get_flags(tb->pc);
843 flags2 = page_get_flags(tb->pc + tb->size - 1);
844 if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
845 printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
846 (long)tb->pc, tb->size, flags1, flags2);
852 #endif
854 static inline void tb_hash_remove(TranslationBlock **ptb, TranslationBlock *tb)
856 TranslationBlock *tb1;
858 for (;;) {
859 tb1 = *ptb;
860 if (tb1 == tb) {
861 *ptb = tb1->phys_hash_next;
862 break;
864 ptb = &tb1->phys_hash_next;
868 static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
870 TranslationBlock *tb1;
871 unsigned int n1;
873 for (;;) {
874 tb1 = *ptb;
875 n1 = (uintptr_t)tb1 & 3;
876 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
877 if (tb1 == tb) {
878 *ptb = tb1->page_next[n1];
879 break;
881 ptb = &tb1->page_next[n1];
885 static inline void tb_jmp_remove(TranslationBlock *tb, int n)
887 TranslationBlock *tb1, **ptb;
888 unsigned int n1;
890 ptb = &tb->jmp_next[n];
891 tb1 = *ptb;
892 if (tb1) {
893 /* find tb(n) in circular list */
894 for (;;) {
895 tb1 = *ptb;
896 n1 = (uintptr_t)tb1 & 3;
897 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
898 if (n1 == n && tb1 == tb) {
899 break;
901 if (n1 == 2) {
902 ptb = &tb1->jmp_first;
903 } else {
904 ptb = &tb1->jmp_next[n1];
907 /* now we can suppress tb(n) from the list */
908 *ptb = tb->jmp_next[n];
910 tb->jmp_next[n] = NULL;
914 /* reset the jump entry 'n' of a TB so that it is not chained to
915 another TB */
916 static inline void tb_reset_jump(TranslationBlock *tb, int n)
918 tb_set_jmp_target(tb, n, (uintptr_t)(tb->tc_ptr + tb->tb_next_offset[n]));
921 /* invalidate one TB */
922 void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
924 CPUState *cpu;
925 PageDesc *p;
926 unsigned int h, n1;
927 tb_page_addr_t phys_pc;
928 TranslationBlock *tb1, *tb2;
930 /* remove the TB from the hash list */
931 phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
932 h = tb_phys_hash_func(phys_pc);
933 tb_hash_remove(&tcg_ctx.tb_ctx.tb_phys_hash[h], tb);
935 /* remove the TB from the page list */
936 if (tb->page_addr[0] != page_addr) {
937 p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
938 tb_page_remove(&p->first_tb, tb);
939 invalidate_page_bitmap(p);
941 if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
942 p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
943 tb_page_remove(&p->first_tb, tb);
944 invalidate_page_bitmap(p);
947 tcg_ctx.tb_ctx.tb_invalidated_flag = 1;
949 /* remove the TB from the hash list */
950 h = tb_jmp_cache_hash_func(tb->pc);
951 CPU_FOREACH(cpu) {
952 if (cpu->tb_jmp_cache[h] == tb) {
953 cpu->tb_jmp_cache[h] = NULL;
957 /* suppress this TB from the two jump lists */
958 tb_jmp_remove(tb, 0);
959 tb_jmp_remove(tb, 1);
961 /* suppress any remaining jumps to this TB */
962 tb1 = tb->jmp_first;
963 for (;;) {
964 n1 = (uintptr_t)tb1 & 3;
965 if (n1 == 2) {
966 break;
968 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
969 tb2 = tb1->jmp_next[n1];
970 tb_reset_jump(tb1, n1);
971 tb1->jmp_next[n1] = NULL;
972 tb1 = tb2;
974 tb->jmp_first = (TranslationBlock *)((uintptr_t)tb | 2); /* fail safe */
976 tcg_ctx.tb_ctx.tb_phys_invalidate_count++;
979 static inline void set_bits(uint8_t *tab, int start, int len)
981 int end, mask, end1;
983 end = start + len;
984 tab += start >> 3;
985 mask = 0xff << (start & 7);
986 if ((start & ~7) == (end & ~7)) {
987 if (start < end) {
988 mask &= ~(0xff << (end & 7));
989 *tab |= mask;
991 } else {
992 *tab++ |= mask;
993 start = (start + 8) & ~7;
994 end1 = end & ~7;
995 while (start < end1) {
996 *tab++ = 0xff;
997 start += 8;
999 if (start < end) {
1000 mask = ~(0xff << (end & 7));
1001 *tab |= mask;
1006 static void build_page_bitmap(PageDesc *p)
1008 int n, tb_start, tb_end;
1009 TranslationBlock *tb;
1011 p->code_bitmap = g_malloc0(TARGET_PAGE_SIZE / 8);
1013 tb = p->first_tb;
1014 while (tb != NULL) {
1015 n = (uintptr_t)tb & 3;
1016 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1017 /* NOTE: this is subtle as a TB may span two physical pages */
1018 if (n == 0) {
1019 /* NOTE: tb_end may be after the end of the page, but
1020 it is not a problem */
1021 tb_start = tb->pc & ~TARGET_PAGE_MASK;
1022 tb_end = tb_start + tb->size;
1023 if (tb_end > TARGET_PAGE_SIZE) {
1024 tb_end = TARGET_PAGE_SIZE;
1026 } else {
1027 tb_start = 0;
1028 tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1030 set_bits(p->code_bitmap, tb_start, tb_end - tb_start);
1031 tb = tb->page_next[n];
1035 TranslationBlock *tb_gen_code(CPUState *cpu,
1036 target_ulong pc, target_ulong cs_base,
1037 int flags, int cflags)
1039 CPUArchState *env = cpu->env_ptr;
1040 TranslationBlock *tb;
1041 tb_page_addr_t phys_pc, phys_page2;
1042 target_ulong virt_page2;
1043 int code_gen_size;
1045 phys_pc = get_page_addr_code(env, pc);
1046 tb = tb_alloc(pc);
1047 if (!tb) {
1048 /* flush must be done */
1049 tb_flush(env);
1050 /* cannot fail at this point */
1051 tb = tb_alloc(pc);
1052 /* Don't forget to invalidate previous TB info. */
1053 tcg_ctx.tb_ctx.tb_invalidated_flag = 1;
1055 tb->tc_ptr = tcg_ctx.code_gen_ptr;
1056 tb->cs_base = cs_base;
1057 tb->flags = flags;
1058 tb->cflags = cflags;
1059 cpu_gen_code(env, tb, &code_gen_size);
1060 tcg_ctx.code_gen_ptr = (void *)(((uintptr_t)tcg_ctx.code_gen_ptr +
1061 code_gen_size + CODE_GEN_ALIGN - 1) & ~(CODE_GEN_ALIGN - 1));
1063 /* check next page if needed */
1064 virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
1065 phys_page2 = -1;
1066 if ((pc & TARGET_PAGE_MASK) != virt_page2) {
1067 phys_page2 = get_page_addr_code(env, virt_page2);
1069 tb_link_page(tb, phys_pc, phys_page2);
1070 return tb;
1074 * Invalidate all TBs which intersect with the target physical address range
1075 * [start;end[. NOTE: start and end may refer to *different* physical pages.
1076 * 'is_cpu_write_access' should be true if called from a real cpu write
1077 * access: the virtual CPU will exit the current TB if code is modified inside
1078 * this TB.
1080 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end,
1081 int is_cpu_write_access)
1083 while (start < end) {
1084 tb_invalidate_phys_page_range(start, end, is_cpu_write_access);
1085 start &= TARGET_PAGE_MASK;
1086 start += TARGET_PAGE_SIZE;
1091 * Invalidate all TBs which intersect with the target physical address range
1092 * [start;end[. NOTE: start and end must refer to the *same* physical page.
1093 * 'is_cpu_write_access' should be true if called from a real cpu write
1094 * access: the virtual CPU will exit the current TB if code is modified inside
1095 * this TB.
1097 void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
1098 int is_cpu_write_access)
1100 TranslationBlock *tb, *tb_next, *saved_tb;
1101 CPUState *cpu = current_cpu;
1102 #if defined(TARGET_HAS_PRECISE_SMC)
1103 CPUArchState *env = NULL;
1104 #endif
1105 tb_page_addr_t tb_start, tb_end;
1106 PageDesc *p;
1107 int n;
1108 #ifdef TARGET_HAS_PRECISE_SMC
1109 int current_tb_not_found = is_cpu_write_access;
1110 TranslationBlock *current_tb = NULL;
1111 int current_tb_modified = 0;
1112 target_ulong current_pc = 0;
1113 target_ulong current_cs_base = 0;
1114 int current_flags = 0;
1115 #endif /* TARGET_HAS_PRECISE_SMC */
1117 p = page_find(start >> TARGET_PAGE_BITS);
1118 if (!p) {
1119 return;
1121 if (!p->code_bitmap &&
1122 ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD &&
1123 is_cpu_write_access) {
1124 /* build code bitmap */
1125 build_page_bitmap(p);
1127 #if defined(TARGET_HAS_PRECISE_SMC)
1128 if (cpu != NULL) {
1129 env = cpu->env_ptr;
1131 #endif
1133 /* we remove all the TBs in the range [start, end[ */
1134 /* XXX: see if in some cases it could be faster to invalidate all
1135 the code */
1136 tb = p->first_tb;
1137 while (tb != NULL) {
1138 n = (uintptr_t)tb & 3;
1139 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1140 tb_next = tb->page_next[n];
1141 /* NOTE: this is subtle as a TB may span two physical pages */
1142 if (n == 0) {
1143 /* NOTE: tb_end may be after the end of the page, but
1144 it is not a problem */
1145 tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1146 tb_end = tb_start + tb->size;
1147 } else {
1148 tb_start = tb->page_addr[1];
1149 tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1151 if (!(tb_end <= start || tb_start >= end)) {
1152 #ifdef TARGET_HAS_PRECISE_SMC
1153 if (current_tb_not_found) {
1154 current_tb_not_found = 0;
1155 current_tb = NULL;
1156 if (cpu->mem_io_pc) {
1157 /* now we have a real cpu fault */
1158 current_tb = tb_find_pc(cpu->mem_io_pc);
1161 if (current_tb == tb &&
1162 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1163 /* If we are modifying the current TB, we must stop
1164 its execution. We could be more precise by checking
1165 that the modification is after the current PC, but it
1166 would require a specialized function to partially
1167 restore the CPU state */
1169 current_tb_modified = 1;
1170 cpu_restore_state_from_tb(cpu, current_tb, cpu->mem_io_pc);
1171 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1172 &current_flags);
1174 #endif /* TARGET_HAS_PRECISE_SMC */
1175 /* we need to do that to handle the case where a signal
1176 occurs while doing tb_phys_invalidate() */
1177 saved_tb = NULL;
1178 if (cpu != NULL) {
1179 saved_tb = cpu->current_tb;
1180 cpu->current_tb = NULL;
1182 tb_phys_invalidate(tb, -1);
1183 if (cpu != NULL) {
1184 cpu->current_tb = saved_tb;
1185 if (cpu->interrupt_request && cpu->current_tb) {
1186 cpu_interrupt(cpu, cpu->interrupt_request);
1190 tb = tb_next;
1192 #if !defined(CONFIG_USER_ONLY)
1193 /* if no code remaining, no need to continue to use slow writes */
1194 if (!p->first_tb) {
1195 invalidate_page_bitmap(p);
1196 if (is_cpu_write_access) {
1197 tlb_unprotect_code_phys(cpu, start, cpu->mem_io_vaddr);
1200 #endif
1201 #ifdef TARGET_HAS_PRECISE_SMC
1202 if (current_tb_modified) {
1203 /* we generate a block containing just the instruction
1204 modifying the memory. It will ensure that it cannot modify
1205 itself */
1206 cpu->current_tb = NULL;
1207 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1208 cpu_resume_from_signal(cpu, NULL);
1210 #endif
1213 /* len must be <= 8 and start must be a multiple of len */
1214 void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
1216 PageDesc *p;
1217 int offset, b;
1219 #if 0
1220 if (1) {
1221 qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
1222 cpu_single_env->mem_io_vaddr, len,
1223 cpu_single_env->eip,
1224 cpu_single_env->eip +
1225 (intptr_t)cpu_single_env->segs[R_CS].base);
1227 #endif
1228 p = page_find(start >> TARGET_PAGE_BITS);
1229 if (!p) {
1230 return;
1232 if (p->code_bitmap) {
1233 offset = start & ~TARGET_PAGE_MASK;
1234 b = p->code_bitmap[offset >> 3] >> (offset & 7);
1235 if (b & ((1 << len) - 1)) {
1236 goto do_invalidate;
1238 } else {
1239 do_invalidate:
1240 tb_invalidate_phys_page_range(start, start + len, 1);
1244 #if !defined(CONFIG_SOFTMMU)
1245 static void tb_invalidate_phys_page(tb_page_addr_t addr,
1246 uintptr_t pc, void *puc,
1247 bool locked)
1249 TranslationBlock *tb;
1250 PageDesc *p;
1251 int n;
1252 #ifdef TARGET_HAS_PRECISE_SMC
1253 TranslationBlock *current_tb = NULL;
1254 CPUState *cpu = current_cpu;
1255 CPUArchState *env = NULL;
1256 int current_tb_modified = 0;
1257 target_ulong current_pc = 0;
1258 target_ulong current_cs_base = 0;
1259 int current_flags = 0;
1260 #endif
1262 addr &= TARGET_PAGE_MASK;
1263 p = page_find(addr >> TARGET_PAGE_BITS);
1264 if (!p) {
1265 return;
1267 tb = p->first_tb;
1268 #ifdef TARGET_HAS_PRECISE_SMC
1269 if (tb && pc != 0) {
1270 current_tb = tb_find_pc(pc);
1272 if (cpu != NULL) {
1273 env = cpu->env_ptr;
1275 #endif
1276 while (tb != NULL) {
1277 n = (uintptr_t)tb & 3;
1278 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1279 #ifdef TARGET_HAS_PRECISE_SMC
1280 if (current_tb == tb &&
1281 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1282 /* If we are modifying the current TB, we must stop
1283 its execution. We could be more precise by checking
1284 that the modification is after the current PC, but it
1285 would require a specialized function to partially
1286 restore the CPU state */
1288 current_tb_modified = 1;
1289 cpu_restore_state_from_tb(cpu, current_tb, pc);
1290 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1291 &current_flags);
1293 #endif /* TARGET_HAS_PRECISE_SMC */
1294 tb_phys_invalidate(tb, addr);
1295 tb = tb->page_next[n];
1297 p->first_tb = NULL;
1298 #ifdef TARGET_HAS_PRECISE_SMC
1299 if (current_tb_modified) {
1300 /* we generate a block containing just the instruction
1301 modifying the memory. It will ensure that it cannot modify
1302 itself */
1303 cpu->current_tb = NULL;
1304 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1305 if (locked) {
1306 mmap_unlock();
1308 cpu_resume_from_signal(cpu, puc);
1310 #endif
1312 #endif
1314 /* add the tb in the target page and protect it if necessary */
1315 static inline void tb_alloc_page(TranslationBlock *tb,
1316 unsigned int n, tb_page_addr_t page_addr)
1318 PageDesc *p;
1319 #ifndef CONFIG_USER_ONLY
1320 bool page_already_protected;
1321 #endif
1323 tb->page_addr[n] = page_addr;
1324 p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
1325 tb->page_next[n] = p->first_tb;
1326 #ifndef CONFIG_USER_ONLY
1327 page_already_protected = p->first_tb != NULL;
1328 #endif
1329 p->first_tb = (TranslationBlock *)((uintptr_t)tb | n);
1330 invalidate_page_bitmap(p);
1332 #if defined(TARGET_HAS_SMC) || 1
1334 #if defined(CONFIG_USER_ONLY)
1335 if (p->flags & PAGE_WRITE) {
1336 target_ulong addr;
1337 PageDesc *p2;
1338 int prot;
1340 /* force the host page as non writable (writes will have a
1341 page fault + mprotect overhead) */
1342 page_addr &= qemu_host_page_mask;
1343 prot = 0;
1344 for (addr = page_addr; addr < page_addr + qemu_host_page_size;
1345 addr += TARGET_PAGE_SIZE) {
1347 p2 = page_find(addr >> TARGET_PAGE_BITS);
1348 if (!p2) {
1349 continue;
1351 prot |= p2->flags;
1352 p2->flags &= ~PAGE_WRITE;
1354 mprotect(g2h(page_addr), qemu_host_page_size,
1355 (prot & PAGE_BITS) & ~PAGE_WRITE);
1356 #ifdef DEBUG_TB_INVALIDATE
1357 printf("protecting code page: 0x" TARGET_FMT_lx "\n",
1358 page_addr);
1359 #endif
1361 #else
1362 /* if some code is already present, then the pages are already
1363 protected. So we handle the case where only the first TB is
1364 allocated in a physical page */
1365 if (!page_already_protected) {
1366 tlb_protect_code(page_addr);
1368 #endif
1370 #endif /* TARGET_HAS_SMC */
1373 /* add a new TB and link it to the physical page tables. phys_page2 is
1374 (-1) to indicate that only one page contains the TB. */
1375 static void tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
1376 tb_page_addr_t phys_page2)
1378 unsigned int h;
1379 TranslationBlock **ptb;
1381 /* Grab the mmap lock to stop another thread invalidating this TB
1382 before we are done. */
1383 mmap_lock();
1384 /* add in the physical hash table */
1385 h = tb_phys_hash_func(phys_pc);
1386 ptb = &tcg_ctx.tb_ctx.tb_phys_hash[h];
1387 tb->phys_hash_next = *ptb;
1388 *ptb = tb;
1390 /* add in the page list */
1391 tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
1392 if (phys_page2 != -1) {
1393 tb_alloc_page(tb, 1, phys_page2);
1394 } else {
1395 tb->page_addr[1] = -1;
1398 tb->jmp_first = (TranslationBlock *)((uintptr_t)tb | 2);
1399 tb->jmp_next[0] = NULL;
1400 tb->jmp_next[1] = NULL;
1402 /* init original jump addresses */
1403 if (tb->tb_next_offset[0] != 0xffff) {
1404 tb_reset_jump(tb, 0);
1406 if (tb->tb_next_offset[1] != 0xffff) {
1407 tb_reset_jump(tb, 1);
1410 #ifdef DEBUG_TB_CHECK
1411 tb_page_check();
1412 #endif
1413 mmap_unlock();
1416 /* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
1417 tb[1].tc_ptr. Return NULL if not found */
1418 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr)
1420 int m_min, m_max, m;
1421 uintptr_t v;
1422 TranslationBlock *tb;
1424 if (tcg_ctx.tb_ctx.nb_tbs <= 0) {
1425 return NULL;
1427 if (tc_ptr < (uintptr_t)tcg_ctx.code_gen_buffer ||
1428 tc_ptr >= (uintptr_t)tcg_ctx.code_gen_ptr) {
1429 return NULL;
1431 /* binary search (cf Knuth) */
1432 m_min = 0;
1433 m_max = tcg_ctx.tb_ctx.nb_tbs - 1;
1434 while (m_min <= m_max) {
1435 m = (m_min + m_max) >> 1;
1436 tb = &tcg_ctx.tb_ctx.tbs[m];
1437 v = (uintptr_t)tb->tc_ptr;
1438 if (v == tc_ptr) {
1439 return tb;
1440 } else if (tc_ptr < v) {
1441 m_max = m - 1;
1442 } else {
1443 m_min = m + 1;
1446 return &tcg_ctx.tb_ctx.tbs[m_max];
1449 #if defined(TARGET_HAS_ICE) && !defined(CONFIG_USER_ONLY)
1450 void tb_invalidate_phys_addr(AddressSpace *as, hwaddr addr)
1452 ram_addr_t ram_addr;
1453 MemoryRegion *mr;
1454 hwaddr l = 1;
1456 mr = address_space_translate(as, addr, &addr, &l, false);
1457 if (!(memory_region_is_ram(mr)
1458 || memory_region_is_romd(mr))) {
1459 return;
1461 ram_addr = (memory_region_get_ram_addr(mr) & TARGET_PAGE_MASK)
1462 + addr;
1463 tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
1465 #endif /* TARGET_HAS_ICE && !defined(CONFIG_USER_ONLY) */
1467 void tb_check_watchpoint(CPUState *cpu)
1469 TranslationBlock *tb;
1471 tb = tb_find_pc(cpu->mem_io_pc);
1472 if (!tb) {
1473 cpu_abort(cpu, "check_watchpoint: could not find TB for pc=%p",
1474 (void *)cpu->mem_io_pc);
1476 cpu_restore_state_from_tb(cpu, tb, cpu->mem_io_pc);
1477 tb_phys_invalidate(tb, -1);
1480 #ifndef CONFIG_USER_ONLY
1481 /* mask must never be zero, except for A20 change call */
1482 static void tcg_handle_interrupt(CPUState *cpu, int mask)
1484 int old_mask;
1486 old_mask = cpu->interrupt_request;
1487 cpu->interrupt_request |= mask;
1490 * If called from iothread context, wake the target cpu in
1491 * case its halted.
1493 if (!qemu_cpu_is_self(cpu)) {
1494 qemu_cpu_kick(cpu);
1495 return;
1498 if (use_icount) {
1499 cpu->icount_decr.u16.high = 0xffff;
1500 if (!cpu_can_do_io(cpu)
1501 && (mask & ~old_mask) != 0) {
1502 cpu_abort(cpu, "Raised interrupt while not in I/O function");
1504 } else {
1505 cpu->tcg_exit_req = 1;
1509 CPUInterruptHandler cpu_interrupt_handler = tcg_handle_interrupt;
1511 /* in deterministic execution mode, instructions doing device I/Os
1512 must be at the end of the TB */
1513 void cpu_io_recompile(CPUState *cpu, uintptr_t retaddr)
1515 #if defined(TARGET_MIPS) || defined(TARGET_SH4)
1516 CPUArchState *env = cpu->env_ptr;
1517 #endif
1518 TranslationBlock *tb;
1519 uint32_t n, cflags;
1520 target_ulong pc, cs_base;
1521 uint64_t flags;
1523 tb = tb_find_pc(retaddr);
1524 if (!tb) {
1525 cpu_abort(cpu, "cpu_io_recompile: could not find TB for pc=%p",
1526 (void *)retaddr);
1528 n = cpu->icount_decr.u16.low + tb->icount;
1529 cpu_restore_state_from_tb(cpu, tb, retaddr);
1530 /* Calculate how many instructions had been executed before the fault
1531 occurred. */
1532 n = n - cpu->icount_decr.u16.low;
1533 /* Generate a new TB ending on the I/O insn. */
1534 n++;
1535 /* On MIPS and SH, delay slot instructions can only be restarted if
1536 they were already the first instruction in the TB. If this is not
1537 the first instruction in a TB then re-execute the preceding
1538 branch. */
1539 #if defined(TARGET_MIPS)
1540 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
1541 env->active_tc.PC -= 4;
1542 cpu->icount_decr.u16.low++;
1543 env->hflags &= ~MIPS_HFLAG_BMASK;
1545 #elif defined(TARGET_SH4)
1546 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
1547 && n > 1) {
1548 env->pc -= 2;
1549 cpu->icount_decr.u16.low++;
1550 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
1552 #endif
1553 /* This should never happen. */
1554 if (n > CF_COUNT_MASK) {
1555 cpu_abort(cpu, "TB too big during recompile");
1558 cflags = n | CF_LAST_IO;
1559 pc = tb->pc;
1560 cs_base = tb->cs_base;
1561 flags = tb->flags;
1562 tb_phys_invalidate(tb, -1);
1563 /* FIXME: In theory this could raise an exception. In practice
1564 we have already translated the block once so it's probably ok. */
1565 tb_gen_code(cpu, pc, cs_base, flags, cflags);
1566 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
1567 the first in the TB) then we end up generating a whole new TB and
1568 repeating the fault, which is horribly inefficient.
1569 Better would be to execute just this insn uncached, or generate a
1570 second new TB. */
1571 cpu_resume_from_signal(cpu, NULL);
1574 void tb_flush_jmp_cache(CPUState *cpu, target_ulong addr)
1576 unsigned int i;
1578 /* Discard jump cache entries for any tb which might potentially
1579 overlap the flushed page. */
1580 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1581 memset(&cpu->tb_jmp_cache[i], 0,
1582 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1584 i = tb_jmp_cache_hash_page(addr);
1585 memset(&cpu->tb_jmp_cache[i], 0,
1586 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1589 void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
1591 int i, target_code_size, max_target_code_size;
1592 int direct_jmp_count, direct_jmp2_count, cross_page;
1593 TranslationBlock *tb;
1595 target_code_size = 0;
1596 max_target_code_size = 0;
1597 cross_page = 0;
1598 direct_jmp_count = 0;
1599 direct_jmp2_count = 0;
1600 for (i = 0; i < tcg_ctx.tb_ctx.nb_tbs; i++) {
1601 tb = &tcg_ctx.tb_ctx.tbs[i];
1602 target_code_size += tb->size;
1603 if (tb->size > max_target_code_size) {
1604 max_target_code_size = tb->size;
1606 if (tb->page_addr[1] != -1) {
1607 cross_page++;
1609 if (tb->tb_next_offset[0] != 0xffff) {
1610 direct_jmp_count++;
1611 if (tb->tb_next_offset[1] != 0xffff) {
1612 direct_jmp2_count++;
1616 /* XXX: avoid using doubles ? */
1617 cpu_fprintf(f, "Translation buffer state:\n");
1618 cpu_fprintf(f, "gen code size %td/%zd\n",
1619 tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer,
1620 tcg_ctx.code_gen_buffer_max_size);
1621 cpu_fprintf(f, "TB count %d/%d\n",
1622 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.code_gen_max_blocks);
1623 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
1624 tcg_ctx.tb_ctx.nb_tbs ? target_code_size /
1625 tcg_ctx.tb_ctx.nb_tbs : 0,
1626 max_target_code_size);
1627 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
1628 tcg_ctx.tb_ctx.nb_tbs ? (tcg_ctx.code_gen_ptr -
1629 tcg_ctx.code_gen_buffer) /
1630 tcg_ctx.tb_ctx.nb_tbs : 0,
1631 target_code_size ? (double) (tcg_ctx.code_gen_ptr -
1632 tcg_ctx.code_gen_buffer) /
1633 target_code_size : 0);
1634 cpu_fprintf(f, "cross page TB count %d (%d%%)\n", cross_page,
1635 tcg_ctx.tb_ctx.nb_tbs ? (cross_page * 100) /
1636 tcg_ctx.tb_ctx.nb_tbs : 0);
1637 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
1638 direct_jmp_count,
1639 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp_count * 100) /
1640 tcg_ctx.tb_ctx.nb_tbs : 0,
1641 direct_jmp2_count,
1642 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp2_count * 100) /
1643 tcg_ctx.tb_ctx.nb_tbs : 0);
1644 cpu_fprintf(f, "\nStatistics:\n");
1645 cpu_fprintf(f, "TB flush count %d\n", tcg_ctx.tb_ctx.tb_flush_count);
1646 cpu_fprintf(f, "TB invalidate count %d\n",
1647 tcg_ctx.tb_ctx.tb_phys_invalidate_count);
1648 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
1649 tcg_dump_info(f, cpu_fprintf);
1652 #else /* CONFIG_USER_ONLY */
1654 void cpu_interrupt(CPUState *cpu, int mask)
1656 cpu->interrupt_request |= mask;
1657 cpu->tcg_exit_req = 1;
1661 * Walks guest process memory "regions" one by one
1662 * and calls callback function 'fn' for each region.
1664 struct walk_memory_regions_data {
1665 walk_memory_regions_fn fn;
1666 void *priv;
1667 uintptr_t start;
1668 int prot;
1671 static int walk_memory_regions_end(struct walk_memory_regions_data *data,
1672 abi_ulong end, int new_prot)
1674 if (data->start != -1ul) {
1675 int rc = data->fn(data->priv, data->start, end, data->prot);
1676 if (rc != 0) {
1677 return rc;
1681 data->start = (new_prot ? end : -1ul);
1682 data->prot = new_prot;
1684 return 0;
1687 static int walk_memory_regions_1(struct walk_memory_regions_data *data,
1688 abi_ulong base, int level, void **lp)
1690 abi_ulong pa;
1691 int i, rc;
1693 if (*lp == NULL) {
1694 return walk_memory_regions_end(data, base, 0);
1697 if (level == 0) {
1698 PageDesc *pd = *lp;
1700 for (i = 0; i < V_L2_SIZE; ++i) {
1701 int prot = pd[i].flags;
1703 pa = base | (i << TARGET_PAGE_BITS);
1704 if (prot != data->prot) {
1705 rc = walk_memory_regions_end(data, pa, prot);
1706 if (rc != 0) {
1707 return rc;
1711 } else {
1712 void **pp = *lp;
1714 for (i = 0; i < V_L2_SIZE; ++i) {
1715 pa = base | ((abi_ulong)i <<
1716 (TARGET_PAGE_BITS + V_L2_BITS * level));
1717 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
1718 if (rc != 0) {
1719 return rc;
1724 return 0;
1727 int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
1729 struct walk_memory_regions_data data;
1730 uintptr_t i;
1732 data.fn = fn;
1733 data.priv = priv;
1734 data.start = -1ul;
1735 data.prot = 0;
1737 for (i = 0; i < V_L1_SIZE; i++) {
1738 int rc = walk_memory_regions_1(&data, (abi_ulong)i << V_L1_SHIFT,
1739 V_L1_SHIFT / V_L2_BITS - 1, l1_map + i);
1741 if (rc != 0) {
1742 return rc;
1746 return walk_memory_regions_end(&data, 0, 0);
1749 static int dump_region(void *priv, abi_ulong start,
1750 abi_ulong end, unsigned long prot)
1752 FILE *f = (FILE *)priv;
1754 (void) fprintf(f, TARGET_ABI_FMT_lx"-"TARGET_ABI_FMT_lx
1755 " "TARGET_ABI_FMT_lx" %c%c%c\n",
1756 start, end, end - start,
1757 ((prot & PAGE_READ) ? 'r' : '-'),
1758 ((prot & PAGE_WRITE) ? 'w' : '-'),
1759 ((prot & PAGE_EXEC) ? 'x' : '-'));
1761 return 0;
1764 /* dump memory mappings */
1765 void page_dump(FILE *f)
1767 const int length = sizeof(abi_ulong) * 2;
1768 (void) fprintf(f, "%-*s %-*s %-*s %s\n",
1769 length, "start", length, "end", length, "size", "prot");
1770 walk_memory_regions(f, dump_region);
1773 int page_get_flags(target_ulong address)
1775 PageDesc *p;
1777 p = page_find(address >> TARGET_PAGE_BITS);
1778 if (!p) {
1779 return 0;
1781 return p->flags;
1784 /* Modify the flags of a page and invalidate the code if necessary.
1785 The flag PAGE_WRITE_ORG is positioned automatically depending
1786 on PAGE_WRITE. The mmap_lock should already be held. */
1787 void page_set_flags(target_ulong start, target_ulong end, int flags)
1789 target_ulong addr, len;
1791 /* This function should never be called with addresses outside the
1792 guest address space. If this assert fires, it probably indicates
1793 a missing call to h2g_valid. */
1794 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
1795 assert(end < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
1796 #endif
1797 assert(start < end);
1799 start = start & TARGET_PAGE_MASK;
1800 end = TARGET_PAGE_ALIGN(end);
1802 if (flags & PAGE_WRITE) {
1803 flags |= PAGE_WRITE_ORG;
1806 for (addr = start, len = end - start;
1807 len != 0;
1808 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
1809 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
1811 /* If the write protection bit is set, then we invalidate
1812 the code inside. */
1813 if (!(p->flags & PAGE_WRITE) &&
1814 (flags & PAGE_WRITE) &&
1815 p->first_tb) {
1816 tb_invalidate_phys_page(addr, 0, NULL, false);
1818 p->flags = flags;
1822 int page_check_range(target_ulong start, target_ulong len, int flags)
1824 PageDesc *p;
1825 target_ulong end;
1826 target_ulong addr;
1828 /* This function should never be called with addresses outside the
1829 guest address space. If this assert fires, it probably indicates
1830 a missing call to h2g_valid. */
1831 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
1832 assert(start < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
1833 #endif
1835 if (len == 0) {
1836 return 0;
1838 if (start + len - 1 < start) {
1839 /* We've wrapped around. */
1840 return -1;
1843 /* must do before we loose bits in the next step */
1844 end = TARGET_PAGE_ALIGN(start + len);
1845 start = start & TARGET_PAGE_MASK;
1847 for (addr = start, len = end - start;
1848 len != 0;
1849 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
1850 p = page_find(addr >> TARGET_PAGE_BITS);
1851 if (!p) {
1852 return -1;
1854 if (!(p->flags & PAGE_VALID)) {
1855 return -1;
1858 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ)) {
1859 return -1;
1861 if (flags & PAGE_WRITE) {
1862 if (!(p->flags & PAGE_WRITE_ORG)) {
1863 return -1;
1865 /* unprotect the page if it was put read-only because it
1866 contains translated code */
1867 if (!(p->flags & PAGE_WRITE)) {
1868 if (!page_unprotect(addr, 0, NULL)) {
1869 return -1;
1874 return 0;
1877 /* called from signal handler: invalidate the code and unprotect the
1878 page. Return TRUE if the fault was successfully handled. */
1879 int page_unprotect(target_ulong address, uintptr_t pc, void *puc)
1881 unsigned int prot;
1882 PageDesc *p;
1883 target_ulong host_start, host_end, addr;
1885 /* Technically this isn't safe inside a signal handler. However we
1886 know this only ever happens in a synchronous SEGV handler, so in
1887 practice it seems to be ok. */
1888 mmap_lock();
1890 p = page_find(address >> TARGET_PAGE_BITS);
1891 if (!p) {
1892 mmap_unlock();
1893 return 0;
1896 /* if the page was really writable, then we change its
1897 protection back to writable */
1898 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
1899 host_start = address & qemu_host_page_mask;
1900 host_end = host_start + qemu_host_page_size;
1902 prot = 0;
1903 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
1904 p = page_find(addr >> TARGET_PAGE_BITS);
1905 p->flags |= PAGE_WRITE;
1906 prot |= p->flags;
1908 /* and since the content will be modified, we must invalidate
1909 the corresponding translated code. */
1910 tb_invalidate_phys_page(addr, pc, puc, true);
1911 #ifdef DEBUG_TB_CHECK
1912 tb_invalidate_check(addr);
1913 #endif
1915 mprotect((void *)g2h(host_start), qemu_host_page_size,
1916 prot & PAGE_BITS);
1918 mmap_unlock();
1919 return 1;
1921 mmap_unlock();
1922 return 0;
1924 #endif /* CONFIG_USER_ONLY */