qcow2: Remove stale FIXME comment
[qemu.git] / translate-all.c
blob3dd9214904d201f726317bad9357b35c3bd104d2
1 /*
2 * Host code generation
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
19 #ifdef _WIN32
20 #include <windows.h>
21 #endif
22 #include "qemu/osdep.h"
25 #include "qemu-common.h"
26 #define NO_CPU_IO_DEFS
27 #include "cpu.h"
28 #include "trace.h"
29 #include "disas/disas.h"
30 #include "exec/exec-all.h"
31 #include "tcg.h"
32 #if defined(CONFIG_USER_ONLY)
33 #include "qemu.h"
34 #include "exec/exec-all.h"
35 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
36 #include <sys/param.h>
37 #if __FreeBSD_version >= 700104
38 #define HAVE_KINFO_GETVMMAP
39 #define sigqueue sigqueue_freebsd /* avoid redefinition */
40 #include <sys/proc.h>
41 #include <machine/profile.h>
42 #define _KERNEL
43 #include <sys/user.h>
44 #undef _KERNEL
45 #undef sigqueue
46 #include <libutil.h>
47 #endif
48 #endif
49 #else
50 #include "exec/address-spaces.h"
51 #endif
53 #include "exec/cputlb.h"
54 #include "exec/tb-hash.h"
55 #include "translate-all.h"
56 #include "qemu/bitmap.h"
57 #include "qemu/timer.h"
58 #include "exec/log.h"
60 /* #define DEBUG_TB_INVALIDATE */
61 /* #define DEBUG_TB_FLUSH */
62 /* #define DEBUG_LOCKING */
63 /* make various TB consistency checks */
64 /* #define DEBUG_TB_CHECK */
66 #if !defined(CONFIG_USER_ONLY)
67 /* TB consistency checks only implemented for usermode emulation. */
68 #undef DEBUG_TB_CHECK
69 #endif
71 /* Access to the various translations structures need to be serialised via locks
72 * for consistency. This is automatic for SoftMMU based system
73 * emulation due to its single threaded nature. In user-mode emulation
74 * access to the memory related structures are protected with the
75 * mmap_lock.
77 #ifdef DEBUG_LOCKING
78 #define DEBUG_MEM_LOCKS 1
79 #else
80 #define DEBUG_MEM_LOCKS 0
81 #endif
83 #ifdef CONFIG_SOFTMMU
84 #define assert_memory_lock() do { /* nothing */ } while (0)
85 #else
86 #define assert_memory_lock() do { \
87 if (DEBUG_MEM_LOCKS) { \
88 g_assert(have_mmap_lock()); \
89 } \
90 } while (0)
91 #endif
93 #define SMC_BITMAP_USE_THRESHOLD 10
95 typedef struct PageDesc {
96 /* list of TBs intersecting this ram page */
97 TranslationBlock *first_tb;
98 #ifdef CONFIG_SOFTMMU
99 /* in order to optimize self modifying code, we count the number
100 of lookups we do to a given page to use a bitmap */
101 unsigned int code_write_count;
102 unsigned long *code_bitmap;
103 #else
104 unsigned long flags;
105 #endif
106 } PageDesc;
108 /* In system mode we want L1_MAP to be based on ram offsets,
109 while in user mode we want it to be based on virtual addresses. */
110 #if !defined(CONFIG_USER_ONLY)
111 #if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
112 # define L1_MAP_ADDR_SPACE_BITS HOST_LONG_BITS
113 #else
114 # define L1_MAP_ADDR_SPACE_BITS TARGET_PHYS_ADDR_SPACE_BITS
115 #endif
116 #else
117 # define L1_MAP_ADDR_SPACE_BITS TARGET_VIRT_ADDR_SPACE_BITS
118 #endif
120 /* Size of the L2 (and L3, etc) page tables. */
121 #define V_L2_BITS 10
122 #define V_L2_SIZE (1 << V_L2_BITS)
124 uintptr_t qemu_host_page_size;
125 intptr_t qemu_host_page_mask;
128 * L1 Mapping properties
130 static int v_l1_size;
131 static int v_l1_shift;
132 static int v_l2_levels;
134 /* The bottom level has pointers to PageDesc, and is indexed by
135 * anything from 4 to (V_L2_BITS + 3) bits, depending on target page size.
137 #define V_L1_MIN_BITS 4
138 #define V_L1_MAX_BITS (V_L2_BITS + 3)
139 #define V_L1_MAX_SIZE (1 << V_L1_MAX_BITS)
141 static void *l1_map[V_L1_MAX_SIZE];
143 /* code generation context */
144 TCGContext tcg_ctx;
145 bool parallel_cpus;
147 /* translation block context */
148 #ifdef CONFIG_USER_ONLY
149 __thread int have_tb_lock;
150 #endif
152 static void page_table_config_init(void)
154 uint32_t v_l1_bits;
156 assert(TARGET_PAGE_BITS);
157 /* The bits remaining after N lower levels of page tables. */
158 v_l1_bits = (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % V_L2_BITS;
159 if (v_l1_bits < V_L1_MIN_BITS) {
160 v_l1_bits += V_L2_BITS;
163 v_l1_size = 1 << v_l1_bits;
164 v_l1_shift = L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - v_l1_bits;
165 v_l2_levels = v_l1_shift / V_L2_BITS - 1;
167 assert(v_l1_bits <= V_L1_MAX_BITS);
168 assert(v_l1_shift % V_L2_BITS == 0);
169 assert(v_l2_levels >= 0);
172 void tb_lock(void)
174 #ifdef CONFIG_USER_ONLY
175 assert(!have_tb_lock);
176 qemu_mutex_lock(&tcg_ctx.tb_ctx.tb_lock);
177 have_tb_lock++;
178 #endif
181 void tb_unlock(void)
183 #ifdef CONFIG_USER_ONLY
184 assert(have_tb_lock);
185 have_tb_lock--;
186 qemu_mutex_unlock(&tcg_ctx.tb_ctx.tb_lock);
187 #endif
190 void tb_lock_reset(void)
192 #ifdef CONFIG_USER_ONLY
193 if (have_tb_lock) {
194 qemu_mutex_unlock(&tcg_ctx.tb_ctx.tb_lock);
195 have_tb_lock = 0;
197 #endif
200 #ifdef DEBUG_LOCKING
201 #define DEBUG_TB_LOCKS 1
202 #else
203 #define DEBUG_TB_LOCKS 0
204 #endif
206 #ifdef CONFIG_SOFTMMU
207 #define assert_tb_lock() do { /* nothing */ } while (0)
208 #else
209 #define assert_tb_lock() do { \
210 if (DEBUG_TB_LOCKS) { \
211 g_assert(have_tb_lock); \
213 } while (0)
214 #endif
217 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr);
219 void cpu_gen_init(void)
221 tcg_context_init(&tcg_ctx);
224 /* Encode VAL as a signed leb128 sequence at P.
225 Return P incremented past the encoded value. */
226 static uint8_t *encode_sleb128(uint8_t *p, target_long val)
228 int more, byte;
230 do {
231 byte = val & 0x7f;
232 val >>= 7;
233 more = !((val == 0 && (byte & 0x40) == 0)
234 || (val == -1 && (byte & 0x40) != 0));
235 if (more) {
236 byte |= 0x80;
238 *p++ = byte;
239 } while (more);
241 return p;
244 /* Decode a signed leb128 sequence at *PP; increment *PP past the
245 decoded value. Return the decoded value. */
246 static target_long decode_sleb128(uint8_t **pp)
248 uint8_t *p = *pp;
249 target_long val = 0;
250 int byte, shift = 0;
252 do {
253 byte = *p++;
254 val |= (target_ulong)(byte & 0x7f) << shift;
255 shift += 7;
256 } while (byte & 0x80);
257 if (shift < TARGET_LONG_BITS && (byte & 0x40)) {
258 val |= -(target_ulong)1 << shift;
261 *pp = p;
262 return val;
265 /* Encode the data collected about the instructions while compiling TB.
266 Place the data at BLOCK, and return the number of bytes consumed.
268 The logical table consisits of TARGET_INSN_START_WORDS target_ulong's,
269 which come from the target's insn_start data, followed by a uintptr_t
270 which comes from the host pc of the end of the code implementing the insn.
272 Each line of the table is encoded as sleb128 deltas from the previous
273 line. The seed for the first line is { tb->pc, 0..., tb->tc_ptr }.
274 That is, the first column is seeded with the guest pc, the last column
275 with the host pc, and the middle columns with zeros. */
277 static int encode_search(TranslationBlock *tb, uint8_t *block)
279 uint8_t *highwater = tcg_ctx.code_gen_highwater;
280 uint8_t *p = block;
281 int i, j, n;
283 tb->tc_search = block;
285 for (i = 0, n = tb->icount; i < n; ++i) {
286 target_ulong prev;
288 for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
289 if (i == 0) {
290 prev = (j == 0 ? tb->pc : 0);
291 } else {
292 prev = tcg_ctx.gen_insn_data[i - 1][j];
294 p = encode_sleb128(p, tcg_ctx.gen_insn_data[i][j] - prev);
296 prev = (i == 0 ? 0 : tcg_ctx.gen_insn_end_off[i - 1]);
297 p = encode_sleb128(p, tcg_ctx.gen_insn_end_off[i] - prev);
299 /* Test for (pending) buffer overflow. The assumption is that any
300 one row beginning below the high water mark cannot overrun
301 the buffer completely. Thus we can test for overflow after
302 encoding a row without having to check during encoding. */
303 if (unlikely(p > highwater)) {
304 return -1;
308 return p - block;
311 /* The cpu state corresponding to 'searched_pc' is restored.
312 * Called with tb_lock held.
314 static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
315 uintptr_t searched_pc)
317 target_ulong data[TARGET_INSN_START_WORDS] = { tb->pc };
318 uintptr_t host_pc = (uintptr_t)tb->tc_ptr;
319 CPUArchState *env = cpu->env_ptr;
320 uint8_t *p = tb->tc_search;
321 int i, j, num_insns = tb->icount;
322 #ifdef CONFIG_PROFILER
323 int64_t ti = profile_getclock();
324 #endif
326 searched_pc -= GETPC_ADJ;
328 if (searched_pc < host_pc) {
329 return -1;
332 /* Reconstruct the stored insn data while looking for the point at
333 which the end of the insn exceeds the searched_pc. */
334 for (i = 0; i < num_insns; ++i) {
335 for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
336 data[j] += decode_sleb128(&p);
338 host_pc += decode_sleb128(&p);
339 if (host_pc > searched_pc) {
340 goto found;
343 return -1;
345 found:
346 if (tb->cflags & CF_USE_ICOUNT) {
347 assert(use_icount);
348 /* Reset the cycle counter to the start of the block. */
349 cpu->icount_decr.u16.low += num_insns;
350 /* Clear the IO flag. */
351 cpu->can_do_io = 0;
353 cpu->icount_decr.u16.low -= i;
354 restore_state_to_opc(env, tb, data);
356 #ifdef CONFIG_PROFILER
357 tcg_ctx.restore_time += profile_getclock() - ti;
358 tcg_ctx.restore_count++;
359 #endif
360 return 0;
363 bool cpu_restore_state(CPUState *cpu, uintptr_t retaddr)
365 TranslationBlock *tb;
366 bool r = false;
368 tb_lock();
369 tb = tb_find_pc(retaddr);
370 if (tb) {
371 cpu_restore_state_from_tb(cpu, tb, retaddr);
372 if (tb->cflags & CF_NOCACHE) {
373 /* one-shot translation, invalidate it immediately */
374 tb_phys_invalidate(tb, -1);
375 tb_free(tb);
377 r = true;
379 tb_unlock();
381 return r;
384 void page_size_init(void)
386 /* NOTE: we can always suppose that qemu_host_page_size >=
387 TARGET_PAGE_SIZE */
388 qemu_real_host_page_size = getpagesize();
389 qemu_real_host_page_mask = -(intptr_t)qemu_real_host_page_size;
390 if (qemu_host_page_size == 0) {
391 qemu_host_page_size = qemu_real_host_page_size;
393 if (qemu_host_page_size < TARGET_PAGE_SIZE) {
394 qemu_host_page_size = TARGET_PAGE_SIZE;
396 qemu_host_page_mask = -(intptr_t)qemu_host_page_size;
399 static void page_init(void)
401 page_size_init();
402 page_table_config_init();
404 #if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
406 #ifdef HAVE_KINFO_GETVMMAP
407 struct kinfo_vmentry *freep;
408 int i, cnt;
410 freep = kinfo_getvmmap(getpid(), &cnt);
411 if (freep) {
412 mmap_lock();
413 for (i = 0; i < cnt; i++) {
414 unsigned long startaddr, endaddr;
416 startaddr = freep[i].kve_start;
417 endaddr = freep[i].kve_end;
418 if (h2g_valid(startaddr)) {
419 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
421 if (h2g_valid(endaddr)) {
422 endaddr = h2g(endaddr);
423 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
424 } else {
425 #if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
426 endaddr = ~0ul;
427 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
428 #endif
432 free(freep);
433 mmap_unlock();
435 #else
436 FILE *f;
438 last_brk = (unsigned long)sbrk(0);
440 f = fopen("/compat/linux/proc/self/maps", "r");
441 if (f) {
442 mmap_lock();
444 do {
445 unsigned long startaddr, endaddr;
446 int n;
448 n = fscanf(f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);
450 if (n == 2 && h2g_valid(startaddr)) {
451 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
453 if (h2g_valid(endaddr)) {
454 endaddr = h2g(endaddr);
455 } else {
456 endaddr = ~0ul;
458 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
460 } while (!feof(f));
462 fclose(f);
463 mmap_unlock();
465 #endif
467 #endif
470 /* If alloc=1:
471 * Called with tb_lock held for system emulation.
472 * Called with mmap_lock held for user-mode emulation.
474 static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
476 PageDesc *pd;
477 void **lp;
478 int i;
480 if (alloc) {
481 assert_memory_lock();
484 /* Level 1. Always allocated. */
485 lp = l1_map + ((index >> v_l1_shift) & (v_l1_size - 1));
487 /* Level 2..N-1. */
488 for (i = v_l2_levels; i > 0; i--) {
489 void **p = atomic_rcu_read(lp);
491 if (p == NULL) {
492 if (!alloc) {
493 return NULL;
495 p = g_new0(void *, V_L2_SIZE);
496 atomic_rcu_set(lp, p);
499 lp = p + ((index >> (i * V_L2_BITS)) & (V_L2_SIZE - 1));
502 pd = atomic_rcu_read(lp);
503 if (pd == NULL) {
504 if (!alloc) {
505 return NULL;
507 pd = g_new0(PageDesc, V_L2_SIZE);
508 atomic_rcu_set(lp, pd);
511 return pd + (index & (V_L2_SIZE - 1));
514 static inline PageDesc *page_find(tb_page_addr_t index)
516 return page_find_alloc(index, 0);
519 #if defined(CONFIG_USER_ONLY)
520 /* Currently it is not recommended to allocate big chunks of data in
521 user mode. It will change when a dedicated libc will be used. */
522 /* ??? 64-bit hosts ought to have no problem mmaping data outside the
523 region in which the guest needs to run. Revisit this. */
524 #define USE_STATIC_CODE_GEN_BUFFER
525 #endif
527 /* Minimum size of the code gen buffer. This number is randomly chosen,
528 but not so small that we can't have a fair number of TB's live. */
529 #define MIN_CODE_GEN_BUFFER_SIZE (1024u * 1024)
531 /* Maximum size of the code gen buffer we'd like to use. Unless otherwise
532 indicated, this is constrained by the range of direct branches on the
533 host cpu, as used by the TCG implementation of goto_tb. */
534 #if defined(__x86_64__)
535 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
536 #elif defined(__sparc__)
537 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
538 #elif defined(__powerpc64__)
539 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
540 #elif defined(__powerpc__)
541 # define MAX_CODE_GEN_BUFFER_SIZE (32u * 1024 * 1024)
542 #elif defined(__aarch64__)
543 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
544 #elif defined(__arm__)
545 # define MAX_CODE_GEN_BUFFER_SIZE (16u * 1024 * 1024)
546 #elif defined(__s390x__)
547 /* We have a +- 4GB range on the branches; leave some slop. */
548 # define MAX_CODE_GEN_BUFFER_SIZE (3ul * 1024 * 1024 * 1024)
549 #elif defined(__mips__)
550 /* We have a 256MB branch region, but leave room to make sure the
551 main executable is also within that region. */
552 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
553 #else
554 # define MAX_CODE_GEN_BUFFER_SIZE ((size_t)-1)
555 #endif
557 #define DEFAULT_CODE_GEN_BUFFER_SIZE_1 (32u * 1024 * 1024)
559 #define DEFAULT_CODE_GEN_BUFFER_SIZE \
560 (DEFAULT_CODE_GEN_BUFFER_SIZE_1 < MAX_CODE_GEN_BUFFER_SIZE \
561 ? DEFAULT_CODE_GEN_BUFFER_SIZE_1 : MAX_CODE_GEN_BUFFER_SIZE)
563 static inline size_t size_code_gen_buffer(size_t tb_size)
565 /* Size the buffer. */
566 if (tb_size == 0) {
567 #ifdef USE_STATIC_CODE_GEN_BUFFER
568 tb_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
569 #else
570 /* ??? Needs adjustments. */
571 /* ??? If we relax the requirement that CONFIG_USER_ONLY use the
572 static buffer, we could size this on RESERVED_VA, on the text
573 segment size of the executable, or continue to use the default. */
574 tb_size = (unsigned long)(ram_size / 4);
575 #endif
577 if (tb_size < MIN_CODE_GEN_BUFFER_SIZE) {
578 tb_size = MIN_CODE_GEN_BUFFER_SIZE;
580 if (tb_size > MAX_CODE_GEN_BUFFER_SIZE) {
581 tb_size = MAX_CODE_GEN_BUFFER_SIZE;
583 return tb_size;
586 #ifdef __mips__
587 /* In order to use J and JAL within the code_gen_buffer, we require
588 that the buffer not cross a 256MB boundary. */
589 static inline bool cross_256mb(void *addr, size_t size)
591 return ((uintptr_t)addr ^ ((uintptr_t)addr + size)) & ~0x0ffffffful;
594 /* We weren't able to allocate a buffer without crossing that boundary,
595 so make do with the larger portion of the buffer that doesn't cross.
596 Returns the new base of the buffer, and adjusts code_gen_buffer_size. */
597 static inline void *split_cross_256mb(void *buf1, size_t size1)
599 void *buf2 = (void *)(((uintptr_t)buf1 + size1) & ~0x0ffffffful);
600 size_t size2 = buf1 + size1 - buf2;
602 size1 = buf2 - buf1;
603 if (size1 < size2) {
604 size1 = size2;
605 buf1 = buf2;
608 tcg_ctx.code_gen_buffer_size = size1;
609 return buf1;
611 #endif
613 #ifdef USE_STATIC_CODE_GEN_BUFFER
614 static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
615 __attribute__((aligned(CODE_GEN_ALIGN)));
617 # ifdef _WIN32
618 static inline void do_protect(void *addr, long size, int prot)
620 DWORD old_protect;
621 VirtualProtect(addr, size, prot, &old_protect);
624 static inline void map_exec(void *addr, long size)
626 do_protect(addr, size, PAGE_EXECUTE_READWRITE);
629 static inline void map_none(void *addr, long size)
631 do_protect(addr, size, PAGE_NOACCESS);
633 # else
634 static inline void do_protect(void *addr, long size, int prot)
636 uintptr_t start, end;
638 start = (uintptr_t)addr;
639 start &= qemu_real_host_page_mask;
641 end = (uintptr_t)addr + size;
642 end = ROUND_UP(end, qemu_real_host_page_size);
644 mprotect((void *)start, end - start, prot);
647 static inline void map_exec(void *addr, long size)
649 do_protect(addr, size, PROT_READ | PROT_WRITE | PROT_EXEC);
652 static inline void map_none(void *addr, long size)
654 do_protect(addr, size, PROT_NONE);
656 # endif /* WIN32 */
658 static inline void *alloc_code_gen_buffer(void)
660 void *buf = static_code_gen_buffer;
661 size_t full_size, size;
663 /* The size of the buffer, rounded down to end on a page boundary. */
664 full_size = (((uintptr_t)buf + sizeof(static_code_gen_buffer))
665 & qemu_real_host_page_mask) - (uintptr_t)buf;
667 /* Reserve a guard page. */
668 size = full_size - qemu_real_host_page_size;
670 /* Honor a command-line option limiting the size of the buffer. */
671 if (size > tcg_ctx.code_gen_buffer_size) {
672 size = (((uintptr_t)buf + tcg_ctx.code_gen_buffer_size)
673 & qemu_real_host_page_mask) - (uintptr_t)buf;
675 tcg_ctx.code_gen_buffer_size = size;
677 #ifdef __mips__
678 if (cross_256mb(buf, size)) {
679 buf = split_cross_256mb(buf, size);
680 size = tcg_ctx.code_gen_buffer_size;
682 #endif
684 map_exec(buf, size);
685 map_none(buf + size, qemu_real_host_page_size);
686 qemu_madvise(buf, size, QEMU_MADV_HUGEPAGE);
688 return buf;
690 #elif defined(_WIN32)
691 static inline void *alloc_code_gen_buffer(void)
693 size_t size = tcg_ctx.code_gen_buffer_size;
694 void *buf1, *buf2;
696 /* Perform the allocation in two steps, so that the guard page
697 is reserved but uncommitted. */
698 buf1 = VirtualAlloc(NULL, size + qemu_real_host_page_size,
699 MEM_RESERVE, PAGE_NOACCESS);
700 if (buf1 != NULL) {
701 buf2 = VirtualAlloc(buf1, size, MEM_COMMIT, PAGE_EXECUTE_READWRITE);
702 assert(buf1 == buf2);
705 return buf1;
707 #else
708 static inline void *alloc_code_gen_buffer(void)
710 int flags = MAP_PRIVATE | MAP_ANONYMOUS;
711 uintptr_t start = 0;
712 size_t size = tcg_ctx.code_gen_buffer_size;
713 void *buf;
715 /* Constrain the position of the buffer based on the host cpu.
716 Note that these addresses are chosen in concert with the
717 addresses assigned in the relevant linker script file. */
718 # if defined(__PIE__) || defined(__PIC__)
719 /* Don't bother setting a preferred location if we're building
720 a position-independent executable. We're more likely to get
721 an address near the main executable if we let the kernel
722 choose the address. */
723 # elif defined(__x86_64__) && defined(MAP_32BIT)
724 /* Force the memory down into low memory with the executable.
725 Leave the choice of exact location with the kernel. */
726 flags |= MAP_32BIT;
727 /* Cannot expect to map more than 800MB in low memory. */
728 if (size > 800u * 1024 * 1024) {
729 tcg_ctx.code_gen_buffer_size = size = 800u * 1024 * 1024;
731 # elif defined(__sparc__)
732 start = 0x40000000ul;
733 # elif defined(__s390x__)
734 start = 0x90000000ul;
735 # elif defined(__mips__)
736 # if _MIPS_SIM == _ABI64
737 start = 0x128000000ul;
738 # else
739 start = 0x08000000ul;
740 # endif
741 # endif
743 buf = mmap((void *)start, size + qemu_real_host_page_size,
744 PROT_NONE, flags, -1, 0);
745 if (buf == MAP_FAILED) {
746 return NULL;
749 #ifdef __mips__
750 if (cross_256mb(buf, size)) {
751 /* Try again, with the original still mapped, to avoid re-acquiring
752 that 256mb crossing. This time don't specify an address. */
753 size_t size2;
754 void *buf2 = mmap(NULL, size + qemu_real_host_page_size,
755 PROT_NONE, flags, -1, 0);
756 switch (buf2 != MAP_FAILED) {
757 case 1:
758 if (!cross_256mb(buf2, size)) {
759 /* Success! Use the new buffer. */
760 munmap(buf, size + qemu_real_host_page_size);
761 break;
763 /* Failure. Work with what we had. */
764 munmap(buf2, size + qemu_real_host_page_size);
765 /* fallthru */
766 default:
767 /* Split the original buffer. Free the smaller half. */
768 buf2 = split_cross_256mb(buf, size);
769 size2 = tcg_ctx.code_gen_buffer_size;
770 if (buf == buf2) {
771 munmap(buf + size2 + qemu_real_host_page_size, size - size2);
772 } else {
773 munmap(buf, size - size2);
775 size = size2;
776 break;
778 buf = buf2;
780 #endif
782 /* Make the final buffer accessible. The guard page at the end
783 will remain inaccessible with PROT_NONE. */
784 mprotect(buf, size, PROT_WRITE | PROT_READ | PROT_EXEC);
786 /* Request large pages for the buffer. */
787 qemu_madvise(buf, size, QEMU_MADV_HUGEPAGE);
789 return buf;
791 #endif /* USE_STATIC_CODE_GEN_BUFFER, WIN32, POSIX */
793 static inline void code_gen_alloc(size_t tb_size)
795 tcg_ctx.code_gen_buffer_size = size_code_gen_buffer(tb_size);
796 tcg_ctx.code_gen_buffer = alloc_code_gen_buffer();
797 if (tcg_ctx.code_gen_buffer == NULL) {
798 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
799 exit(1);
802 /* Estimate a good size for the number of TBs we can support. We
803 still haven't deducted the prologue from the buffer size here,
804 but that's minimal and won't affect the estimate much. */
805 tcg_ctx.code_gen_max_blocks
806 = tcg_ctx.code_gen_buffer_size / CODE_GEN_AVG_BLOCK_SIZE;
807 tcg_ctx.tb_ctx.tbs = g_new(TranslationBlock, tcg_ctx.code_gen_max_blocks);
809 qemu_mutex_init(&tcg_ctx.tb_ctx.tb_lock);
812 static void tb_htable_init(void)
814 unsigned int mode = QHT_MODE_AUTO_RESIZE;
816 qht_init(&tcg_ctx.tb_ctx.htable, CODE_GEN_HTABLE_SIZE, mode);
819 /* Must be called before using the QEMU cpus. 'tb_size' is the size
820 (in bytes) allocated to the translation buffer. Zero means default
821 size. */
822 void tcg_exec_init(unsigned long tb_size)
824 cpu_gen_init();
825 page_init();
826 tb_htable_init();
827 code_gen_alloc(tb_size);
828 #if defined(CONFIG_SOFTMMU)
829 /* There's no guest base to take into account, so go ahead and
830 initialize the prologue now. */
831 tcg_prologue_init(&tcg_ctx);
832 #endif
835 bool tcg_enabled(void)
837 return tcg_ctx.code_gen_buffer != NULL;
841 * Allocate a new translation block. Flush the translation buffer if
842 * too many translation blocks or too much generated code.
844 * Called with tb_lock held.
846 static TranslationBlock *tb_alloc(target_ulong pc)
848 TranslationBlock *tb;
850 assert_tb_lock();
852 if (tcg_ctx.tb_ctx.nb_tbs >= tcg_ctx.code_gen_max_blocks) {
853 return NULL;
855 tb = &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs++];
856 tb->pc = pc;
857 tb->cflags = 0;
858 tb->invalid = false;
859 return tb;
862 /* Called with tb_lock held. */
863 void tb_free(TranslationBlock *tb)
865 assert_tb_lock();
867 /* In practice this is mostly used for single use temporary TB
868 Ignore the hard cases and just back up if this TB happens to
869 be the last one generated. */
870 if (tcg_ctx.tb_ctx.nb_tbs > 0 &&
871 tb == &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs - 1]) {
872 tcg_ctx.code_gen_ptr = tb->tc_ptr;
873 tcg_ctx.tb_ctx.nb_tbs--;
877 static inline void invalidate_page_bitmap(PageDesc *p)
879 #ifdef CONFIG_SOFTMMU
880 g_free(p->code_bitmap);
881 p->code_bitmap = NULL;
882 p->code_write_count = 0;
883 #endif
886 /* Set to NULL all the 'first_tb' fields in all PageDescs. */
887 static void page_flush_tb_1(int level, void **lp)
889 int i;
891 if (*lp == NULL) {
892 return;
894 if (level == 0) {
895 PageDesc *pd = *lp;
897 for (i = 0; i < V_L2_SIZE; ++i) {
898 pd[i].first_tb = NULL;
899 invalidate_page_bitmap(pd + i);
901 } else {
902 void **pp = *lp;
904 for (i = 0; i < V_L2_SIZE; ++i) {
905 page_flush_tb_1(level - 1, pp + i);
910 static void page_flush_tb(void)
912 int i, l1_sz = v_l1_size;
914 for (i = 0; i < l1_sz; i++) {
915 page_flush_tb_1(v_l2_levels, l1_map + i);
919 /* flush all the translation blocks */
920 static void do_tb_flush(CPUState *cpu, run_on_cpu_data tb_flush_count)
922 tb_lock();
924 /* If it is already been done on request of another CPU,
925 * just retry.
927 if (tcg_ctx.tb_ctx.tb_flush_count != tb_flush_count.host_int) {
928 goto done;
931 #if defined(DEBUG_TB_FLUSH)
932 printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
933 (unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer),
934 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.tb_ctx.nb_tbs > 0 ?
935 ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)) /
936 tcg_ctx.tb_ctx.nb_tbs : 0);
937 #endif
938 if ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)
939 > tcg_ctx.code_gen_buffer_size) {
940 cpu_abort(cpu, "Internal error: code buffer overflow\n");
943 CPU_FOREACH(cpu) {
944 int i;
946 for (i = 0; i < TB_JMP_CACHE_SIZE; ++i) {
947 atomic_set(&cpu->tb_jmp_cache[i], NULL);
951 tcg_ctx.tb_ctx.nb_tbs = 0;
952 qht_reset_size(&tcg_ctx.tb_ctx.htable, CODE_GEN_HTABLE_SIZE);
953 page_flush_tb();
955 tcg_ctx.code_gen_ptr = tcg_ctx.code_gen_buffer;
956 /* XXX: flush processor icache at this point if cache flush is
957 expensive */
958 atomic_mb_set(&tcg_ctx.tb_ctx.tb_flush_count,
959 tcg_ctx.tb_ctx.tb_flush_count + 1);
961 done:
962 tb_unlock();
965 void tb_flush(CPUState *cpu)
967 if (tcg_enabled()) {
968 unsigned tb_flush_count = atomic_mb_read(&tcg_ctx.tb_ctx.tb_flush_count);
969 async_safe_run_on_cpu(cpu, do_tb_flush,
970 RUN_ON_CPU_HOST_INT(tb_flush_count));
974 #ifdef DEBUG_TB_CHECK
976 static void
977 do_tb_invalidate_check(struct qht *ht, void *p, uint32_t hash, void *userp)
979 TranslationBlock *tb = p;
980 target_ulong addr = *(target_ulong *)userp;
982 if (!(addr + TARGET_PAGE_SIZE <= tb->pc || addr >= tb->pc + tb->size)) {
983 printf("ERROR invalidate: address=" TARGET_FMT_lx
984 " PC=%08lx size=%04x\n", addr, (long)tb->pc, tb->size);
988 /* verify that all the pages have correct rights for code
990 * Called with tb_lock held.
992 static void tb_invalidate_check(target_ulong address)
994 address &= TARGET_PAGE_MASK;
995 qht_iter(&tcg_ctx.tb_ctx.htable, do_tb_invalidate_check, &address);
998 static void
999 do_tb_page_check(struct qht *ht, void *p, uint32_t hash, void *userp)
1001 TranslationBlock *tb = p;
1002 int flags1, flags2;
1004 flags1 = page_get_flags(tb->pc);
1005 flags2 = page_get_flags(tb->pc + tb->size - 1);
1006 if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
1007 printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
1008 (long)tb->pc, tb->size, flags1, flags2);
1012 /* verify that all the pages have correct rights for code */
1013 static void tb_page_check(void)
1015 qht_iter(&tcg_ctx.tb_ctx.htable, do_tb_page_check, NULL);
1018 #endif
1020 static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
1022 TranslationBlock *tb1;
1023 unsigned int n1;
1025 for (;;) {
1026 tb1 = *ptb;
1027 n1 = (uintptr_t)tb1 & 3;
1028 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
1029 if (tb1 == tb) {
1030 *ptb = tb1->page_next[n1];
1031 break;
1033 ptb = &tb1->page_next[n1];
1037 /* remove the TB from a list of TBs jumping to the n-th jump target of the TB */
1038 static inline void tb_remove_from_jmp_list(TranslationBlock *tb, int n)
1040 TranslationBlock *tb1;
1041 uintptr_t *ptb, ntb;
1042 unsigned int n1;
1044 ptb = &tb->jmp_list_next[n];
1045 if (*ptb) {
1046 /* find tb(n) in circular list */
1047 for (;;) {
1048 ntb = *ptb;
1049 n1 = ntb & 3;
1050 tb1 = (TranslationBlock *)(ntb & ~3);
1051 if (n1 == n && tb1 == tb) {
1052 break;
1054 if (n1 == 2) {
1055 ptb = &tb1->jmp_list_first;
1056 } else {
1057 ptb = &tb1->jmp_list_next[n1];
1060 /* now we can suppress tb(n) from the list */
1061 *ptb = tb->jmp_list_next[n];
1063 tb->jmp_list_next[n] = (uintptr_t)NULL;
1067 /* reset the jump entry 'n' of a TB so that it is not chained to
1068 another TB */
1069 static inline void tb_reset_jump(TranslationBlock *tb, int n)
1071 uintptr_t addr = (uintptr_t)(tb->tc_ptr + tb->jmp_reset_offset[n]);
1072 tb_set_jmp_target(tb, n, addr);
1075 /* remove any jumps to the TB */
1076 static inline void tb_jmp_unlink(TranslationBlock *tb)
1078 TranslationBlock *tb1;
1079 uintptr_t *ptb, ntb;
1080 unsigned int n1;
1082 ptb = &tb->jmp_list_first;
1083 for (;;) {
1084 ntb = *ptb;
1085 n1 = ntb & 3;
1086 tb1 = (TranslationBlock *)(ntb & ~3);
1087 if (n1 == 2) {
1088 break;
1090 tb_reset_jump(tb1, n1);
1091 *ptb = tb1->jmp_list_next[n1];
1092 tb1->jmp_list_next[n1] = (uintptr_t)NULL;
1096 /* invalidate one TB
1098 * Called with tb_lock held.
1100 void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
1102 CPUState *cpu;
1103 PageDesc *p;
1104 uint32_t h;
1105 tb_page_addr_t phys_pc;
1107 assert_tb_lock();
1109 atomic_set(&tb->invalid, true);
1111 /* remove the TB from the hash list */
1112 phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1113 h = tb_hash_func(phys_pc, tb->pc, tb->flags);
1114 qht_remove(&tcg_ctx.tb_ctx.htable, tb, h);
1116 /* remove the TB from the page list */
1117 if (tb->page_addr[0] != page_addr) {
1118 p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
1119 tb_page_remove(&p->first_tb, tb);
1120 invalidate_page_bitmap(p);
1122 if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
1123 p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
1124 tb_page_remove(&p->first_tb, tb);
1125 invalidate_page_bitmap(p);
1128 /* remove the TB from the hash list */
1129 h = tb_jmp_cache_hash_func(tb->pc);
1130 CPU_FOREACH(cpu) {
1131 if (atomic_read(&cpu->tb_jmp_cache[h]) == tb) {
1132 atomic_set(&cpu->tb_jmp_cache[h], NULL);
1136 /* suppress this TB from the two jump lists */
1137 tb_remove_from_jmp_list(tb, 0);
1138 tb_remove_from_jmp_list(tb, 1);
1140 /* suppress any remaining jumps to this TB */
1141 tb_jmp_unlink(tb);
1143 tcg_ctx.tb_ctx.tb_phys_invalidate_count++;
1146 #ifdef CONFIG_SOFTMMU
1147 static void build_page_bitmap(PageDesc *p)
1149 int n, tb_start, tb_end;
1150 TranslationBlock *tb;
1152 p->code_bitmap = bitmap_new(TARGET_PAGE_SIZE);
1154 tb = p->first_tb;
1155 while (tb != NULL) {
1156 n = (uintptr_t)tb & 3;
1157 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1158 /* NOTE: this is subtle as a TB may span two physical pages */
1159 if (n == 0) {
1160 /* NOTE: tb_end may be after the end of the page, but
1161 it is not a problem */
1162 tb_start = tb->pc & ~TARGET_PAGE_MASK;
1163 tb_end = tb_start + tb->size;
1164 if (tb_end > TARGET_PAGE_SIZE) {
1165 tb_end = TARGET_PAGE_SIZE;
1167 } else {
1168 tb_start = 0;
1169 tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1171 bitmap_set(p->code_bitmap, tb_start, tb_end - tb_start);
1172 tb = tb->page_next[n];
1175 #endif
1177 /* add the tb in the target page and protect it if necessary
1179 * Called with mmap_lock held for user-mode emulation.
1181 static inline void tb_alloc_page(TranslationBlock *tb,
1182 unsigned int n, tb_page_addr_t page_addr)
1184 PageDesc *p;
1185 #ifndef CONFIG_USER_ONLY
1186 bool page_already_protected;
1187 #endif
1189 assert_memory_lock();
1191 tb->page_addr[n] = page_addr;
1192 p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
1193 tb->page_next[n] = p->first_tb;
1194 #ifndef CONFIG_USER_ONLY
1195 page_already_protected = p->first_tb != NULL;
1196 #endif
1197 p->first_tb = (TranslationBlock *)((uintptr_t)tb | n);
1198 invalidate_page_bitmap(p);
1200 #if defined(CONFIG_USER_ONLY)
1201 if (p->flags & PAGE_WRITE) {
1202 target_ulong addr;
1203 PageDesc *p2;
1204 int prot;
1206 /* force the host page as non writable (writes will have a
1207 page fault + mprotect overhead) */
1208 page_addr &= qemu_host_page_mask;
1209 prot = 0;
1210 for (addr = page_addr; addr < page_addr + qemu_host_page_size;
1211 addr += TARGET_PAGE_SIZE) {
1213 p2 = page_find(addr >> TARGET_PAGE_BITS);
1214 if (!p2) {
1215 continue;
1217 prot |= p2->flags;
1218 p2->flags &= ~PAGE_WRITE;
1220 mprotect(g2h(page_addr), qemu_host_page_size,
1221 (prot & PAGE_BITS) & ~PAGE_WRITE);
1222 #ifdef DEBUG_TB_INVALIDATE
1223 printf("protecting code page: 0x" TARGET_FMT_lx "\n",
1224 page_addr);
1225 #endif
1227 #else
1228 /* if some code is already present, then the pages are already
1229 protected. So we handle the case where only the first TB is
1230 allocated in a physical page */
1231 if (!page_already_protected) {
1232 tlb_protect_code(page_addr);
1234 #endif
1237 /* add a new TB and link it to the physical page tables. phys_page2 is
1238 * (-1) to indicate that only one page contains the TB.
1240 * Called with mmap_lock held for user-mode emulation.
1242 static void tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
1243 tb_page_addr_t phys_page2)
1245 uint32_t h;
1247 assert_memory_lock();
1249 /* add in the page list */
1250 tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
1251 if (phys_page2 != -1) {
1252 tb_alloc_page(tb, 1, phys_page2);
1253 } else {
1254 tb->page_addr[1] = -1;
1257 /* add in the hash table */
1258 h = tb_hash_func(phys_pc, tb->pc, tb->flags);
1259 qht_insert(&tcg_ctx.tb_ctx.htable, tb, h);
1261 #ifdef DEBUG_TB_CHECK
1262 tb_page_check();
1263 #endif
1266 /* Called with mmap_lock held for user mode emulation. */
1267 TranslationBlock *tb_gen_code(CPUState *cpu,
1268 target_ulong pc, target_ulong cs_base,
1269 uint32_t flags, int cflags)
1271 CPUArchState *env = cpu->env_ptr;
1272 TranslationBlock *tb;
1273 tb_page_addr_t phys_pc, phys_page2;
1274 target_ulong virt_page2;
1275 tcg_insn_unit *gen_code_buf;
1276 int gen_code_size, search_size;
1277 #ifdef CONFIG_PROFILER
1278 int64_t ti;
1279 #endif
1280 assert_memory_lock();
1282 phys_pc = get_page_addr_code(env, pc);
1283 if (use_icount && !(cflags & CF_IGNORE_ICOUNT)) {
1284 cflags |= CF_USE_ICOUNT;
1287 tb = tb_alloc(pc);
1288 if (unlikely(!tb)) {
1289 buffer_overflow:
1290 /* flush must be done */
1291 tb_flush(cpu);
1292 mmap_unlock();
1293 cpu_loop_exit(cpu);
1296 gen_code_buf = tcg_ctx.code_gen_ptr;
1297 tb->tc_ptr = gen_code_buf;
1298 tb->cs_base = cs_base;
1299 tb->flags = flags;
1300 tb->cflags = cflags;
1302 #ifdef CONFIG_PROFILER
1303 tcg_ctx.tb_count1++; /* includes aborted translations because of
1304 exceptions */
1305 ti = profile_getclock();
1306 #endif
1308 tcg_func_start(&tcg_ctx);
1310 tcg_ctx.cpu = ENV_GET_CPU(env);
1311 gen_intermediate_code(env, tb);
1312 tcg_ctx.cpu = NULL;
1314 trace_translate_block(tb, tb->pc, tb->tc_ptr);
1316 /* generate machine code */
1317 tb->jmp_reset_offset[0] = TB_JMP_RESET_OFFSET_INVALID;
1318 tb->jmp_reset_offset[1] = TB_JMP_RESET_OFFSET_INVALID;
1319 tcg_ctx.tb_jmp_reset_offset = tb->jmp_reset_offset;
1320 #ifdef USE_DIRECT_JUMP
1321 tcg_ctx.tb_jmp_insn_offset = tb->jmp_insn_offset;
1322 tcg_ctx.tb_jmp_target_addr = NULL;
1323 #else
1324 tcg_ctx.tb_jmp_insn_offset = NULL;
1325 tcg_ctx.tb_jmp_target_addr = tb->jmp_target_addr;
1326 #endif
1328 #ifdef CONFIG_PROFILER
1329 tcg_ctx.tb_count++;
1330 tcg_ctx.interm_time += profile_getclock() - ti;
1331 tcg_ctx.code_time -= profile_getclock();
1332 #endif
1334 /* ??? Overflow could be handled better here. In particular, we
1335 don't need to re-do gen_intermediate_code, nor should we re-do
1336 the tcg optimization currently hidden inside tcg_gen_code. All
1337 that should be required is to flush the TBs, allocate a new TB,
1338 re-initialize it per above, and re-do the actual code generation. */
1339 gen_code_size = tcg_gen_code(&tcg_ctx, tb);
1340 if (unlikely(gen_code_size < 0)) {
1341 goto buffer_overflow;
1343 search_size = encode_search(tb, (void *)gen_code_buf + gen_code_size);
1344 if (unlikely(search_size < 0)) {
1345 goto buffer_overflow;
1348 #ifdef CONFIG_PROFILER
1349 tcg_ctx.code_time += profile_getclock();
1350 tcg_ctx.code_in_len += tb->size;
1351 tcg_ctx.code_out_len += gen_code_size;
1352 tcg_ctx.search_out_len += search_size;
1353 #endif
1355 #ifdef DEBUG_DISAS
1356 if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM) &&
1357 qemu_log_in_addr_range(tb->pc)) {
1358 qemu_log_lock();
1359 qemu_log("OUT: [size=%d]\n", gen_code_size);
1360 log_disas(tb->tc_ptr, gen_code_size);
1361 qemu_log("\n");
1362 qemu_log_flush();
1363 qemu_log_unlock();
1365 #endif
1367 tcg_ctx.code_gen_ptr = (void *)
1368 ROUND_UP((uintptr_t)gen_code_buf + gen_code_size + search_size,
1369 CODE_GEN_ALIGN);
1371 /* init jump list */
1372 assert(((uintptr_t)tb & 3) == 0);
1373 tb->jmp_list_first = (uintptr_t)tb | 2;
1374 tb->jmp_list_next[0] = (uintptr_t)NULL;
1375 tb->jmp_list_next[1] = (uintptr_t)NULL;
1377 /* init original jump addresses wich has been set during tcg_gen_code() */
1378 if (tb->jmp_reset_offset[0] != TB_JMP_RESET_OFFSET_INVALID) {
1379 tb_reset_jump(tb, 0);
1381 if (tb->jmp_reset_offset[1] != TB_JMP_RESET_OFFSET_INVALID) {
1382 tb_reset_jump(tb, 1);
1385 /* check next page if needed */
1386 virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
1387 phys_page2 = -1;
1388 if ((pc & TARGET_PAGE_MASK) != virt_page2) {
1389 phys_page2 = get_page_addr_code(env, virt_page2);
1391 /* As long as consistency of the TB stuff is provided by tb_lock in user
1392 * mode and is implicit in single-threaded softmmu emulation, no explicit
1393 * memory barrier is required before tb_link_page() makes the TB visible
1394 * through the physical hash table and physical page list.
1396 tb_link_page(tb, phys_pc, phys_page2);
1397 return tb;
1401 * Invalidate all TBs which intersect with the target physical address range
1402 * [start;end[. NOTE: start and end may refer to *different* physical pages.
1403 * 'is_cpu_write_access' should be true if called from a real cpu write
1404 * access: the virtual CPU will exit the current TB if code is modified inside
1405 * this TB.
1407 * Called with mmap_lock held for user-mode emulation, grabs tb_lock
1408 * Called with tb_lock held for system-mode emulation
1410 static void tb_invalidate_phys_range_1(tb_page_addr_t start, tb_page_addr_t end)
1412 while (start < end) {
1413 tb_invalidate_phys_page_range(start, end, 0);
1414 start &= TARGET_PAGE_MASK;
1415 start += TARGET_PAGE_SIZE;
1419 #ifdef CONFIG_SOFTMMU
1420 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end)
1422 assert_tb_lock();
1423 tb_invalidate_phys_range_1(start, end);
1425 #else
1426 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end)
1428 assert_memory_lock();
1429 tb_lock();
1430 tb_invalidate_phys_range_1(start, end);
1431 tb_unlock();
1433 #endif
1435 * Invalidate all TBs which intersect with the target physical address range
1436 * [start;end[. NOTE: start and end must refer to the *same* physical page.
1437 * 'is_cpu_write_access' should be true if called from a real cpu write
1438 * access: the virtual CPU will exit the current TB if code is modified inside
1439 * this TB.
1441 * Called with tb_lock/mmap_lock held for user-mode emulation
1442 * Called with tb_lock held for system-mode emulation
1444 void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
1445 int is_cpu_write_access)
1447 TranslationBlock *tb, *tb_next;
1448 #if defined(TARGET_HAS_PRECISE_SMC)
1449 CPUState *cpu = current_cpu;
1450 CPUArchState *env = NULL;
1451 #endif
1452 tb_page_addr_t tb_start, tb_end;
1453 PageDesc *p;
1454 int n;
1455 #ifdef TARGET_HAS_PRECISE_SMC
1456 int current_tb_not_found = is_cpu_write_access;
1457 TranslationBlock *current_tb = NULL;
1458 int current_tb_modified = 0;
1459 target_ulong current_pc = 0;
1460 target_ulong current_cs_base = 0;
1461 uint32_t current_flags = 0;
1462 #endif /* TARGET_HAS_PRECISE_SMC */
1464 assert_memory_lock();
1465 assert_tb_lock();
1467 p = page_find(start >> TARGET_PAGE_BITS);
1468 if (!p) {
1469 return;
1471 #if defined(TARGET_HAS_PRECISE_SMC)
1472 if (cpu != NULL) {
1473 env = cpu->env_ptr;
1475 #endif
1477 /* we remove all the TBs in the range [start, end[ */
1478 /* XXX: see if in some cases it could be faster to invalidate all
1479 the code */
1480 tb = p->first_tb;
1481 while (tb != NULL) {
1482 n = (uintptr_t)tb & 3;
1483 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1484 tb_next = tb->page_next[n];
1485 /* NOTE: this is subtle as a TB may span two physical pages */
1486 if (n == 0) {
1487 /* NOTE: tb_end may be after the end of the page, but
1488 it is not a problem */
1489 tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1490 tb_end = tb_start + tb->size;
1491 } else {
1492 tb_start = tb->page_addr[1];
1493 tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1495 if (!(tb_end <= start || tb_start >= end)) {
1496 #ifdef TARGET_HAS_PRECISE_SMC
1497 if (current_tb_not_found) {
1498 current_tb_not_found = 0;
1499 current_tb = NULL;
1500 if (cpu->mem_io_pc) {
1501 /* now we have a real cpu fault */
1502 current_tb = tb_find_pc(cpu->mem_io_pc);
1505 if (current_tb == tb &&
1506 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1507 /* If we are modifying the current TB, we must stop
1508 its execution. We could be more precise by checking
1509 that the modification is after the current PC, but it
1510 would require a specialized function to partially
1511 restore the CPU state */
1513 current_tb_modified = 1;
1514 cpu_restore_state_from_tb(cpu, current_tb, cpu->mem_io_pc);
1515 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1516 &current_flags);
1518 #endif /* TARGET_HAS_PRECISE_SMC */
1519 tb_phys_invalidate(tb, -1);
1521 tb = tb_next;
1523 #if !defined(CONFIG_USER_ONLY)
1524 /* if no code remaining, no need to continue to use slow writes */
1525 if (!p->first_tb) {
1526 invalidate_page_bitmap(p);
1527 tlb_unprotect_code(start);
1529 #endif
1530 #ifdef TARGET_HAS_PRECISE_SMC
1531 if (current_tb_modified) {
1532 /* we generate a block containing just the instruction
1533 modifying the memory. It will ensure that it cannot modify
1534 itself */
1535 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1536 cpu_loop_exit_noexc(cpu);
1538 #endif
1541 #ifdef CONFIG_SOFTMMU
1542 /* len must be <= 8 and start must be a multiple of len.
1543 * Called via softmmu_template.h when code areas are written to with
1544 * tb_lock held.
1546 void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
1548 PageDesc *p;
1550 #if 0
1551 if (1) {
1552 qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
1553 cpu_single_env->mem_io_vaddr, len,
1554 cpu_single_env->eip,
1555 cpu_single_env->eip +
1556 (intptr_t)cpu_single_env->segs[R_CS].base);
1558 #endif
1559 assert_memory_lock();
1561 p = page_find(start >> TARGET_PAGE_BITS);
1562 if (!p) {
1563 return;
1565 if (!p->code_bitmap &&
1566 ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD) {
1567 /* build code bitmap. FIXME: writes should be protected by
1568 * tb_lock, reads by tb_lock or RCU.
1570 build_page_bitmap(p);
1572 if (p->code_bitmap) {
1573 unsigned int nr;
1574 unsigned long b;
1576 nr = start & ~TARGET_PAGE_MASK;
1577 b = p->code_bitmap[BIT_WORD(nr)] >> (nr & (BITS_PER_LONG - 1));
1578 if (b & ((1 << len) - 1)) {
1579 goto do_invalidate;
1581 } else {
1582 do_invalidate:
1583 tb_invalidate_phys_page_range(start, start + len, 1);
1586 #else
1587 /* Called with mmap_lock held. If pc is not 0 then it indicates the
1588 * host PC of the faulting store instruction that caused this invalidate.
1589 * Returns true if the caller needs to abort execution of the current
1590 * TB (because it was modified by this store and the guest CPU has
1591 * precise-SMC semantics).
1593 static bool tb_invalidate_phys_page(tb_page_addr_t addr, uintptr_t pc)
1595 TranslationBlock *tb;
1596 PageDesc *p;
1597 int n;
1598 #ifdef TARGET_HAS_PRECISE_SMC
1599 TranslationBlock *current_tb = NULL;
1600 CPUState *cpu = current_cpu;
1601 CPUArchState *env = NULL;
1602 int current_tb_modified = 0;
1603 target_ulong current_pc = 0;
1604 target_ulong current_cs_base = 0;
1605 uint32_t current_flags = 0;
1606 #endif
1608 assert_memory_lock();
1610 addr &= TARGET_PAGE_MASK;
1611 p = page_find(addr >> TARGET_PAGE_BITS);
1612 if (!p) {
1613 return false;
1616 tb_lock();
1617 tb = p->first_tb;
1618 #ifdef TARGET_HAS_PRECISE_SMC
1619 if (tb && pc != 0) {
1620 current_tb = tb_find_pc(pc);
1622 if (cpu != NULL) {
1623 env = cpu->env_ptr;
1625 #endif
1626 while (tb != NULL) {
1627 n = (uintptr_t)tb & 3;
1628 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1629 #ifdef TARGET_HAS_PRECISE_SMC
1630 if (current_tb == tb &&
1631 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1632 /* If we are modifying the current TB, we must stop
1633 its execution. We could be more precise by checking
1634 that the modification is after the current PC, but it
1635 would require a specialized function to partially
1636 restore the CPU state */
1638 current_tb_modified = 1;
1639 cpu_restore_state_from_tb(cpu, current_tb, pc);
1640 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1641 &current_flags);
1643 #endif /* TARGET_HAS_PRECISE_SMC */
1644 tb_phys_invalidate(tb, addr);
1645 tb = tb->page_next[n];
1647 p->first_tb = NULL;
1648 #ifdef TARGET_HAS_PRECISE_SMC
1649 if (current_tb_modified) {
1650 /* we generate a block containing just the instruction
1651 modifying the memory. It will ensure that it cannot modify
1652 itself */
1653 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1654 /* tb_lock will be reset after cpu_loop_exit_noexc longjmps
1655 * back into the cpu_exec loop. */
1656 return true;
1658 #endif
1659 tb_unlock();
1661 return false;
1663 #endif
1665 /* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
1666 tb[1].tc_ptr. Return NULL if not found */
1667 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr)
1669 int m_min, m_max, m;
1670 uintptr_t v;
1671 TranslationBlock *tb;
1673 if (tcg_ctx.tb_ctx.nb_tbs <= 0) {
1674 return NULL;
1676 if (tc_ptr < (uintptr_t)tcg_ctx.code_gen_buffer ||
1677 tc_ptr >= (uintptr_t)tcg_ctx.code_gen_ptr) {
1678 return NULL;
1680 /* binary search (cf Knuth) */
1681 m_min = 0;
1682 m_max = tcg_ctx.tb_ctx.nb_tbs - 1;
1683 while (m_min <= m_max) {
1684 m = (m_min + m_max) >> 1;
1685 tb = &tcg_ctx.tb_ctx.tbs[m];
1686 v = (uintptr_t)tb->tc_ptr;
1687 if (v == tc_ptr) {
1688 return tb;
1689 } else if (tc_ptr < v) {
1690 m_max = m - 1;
1691 } else {
1692 m_min = m + 1;
1695 return &tcg_ctx.tb_ctx.tbs[m_max];
1698 #if !defined(CONFIG_USER_ONLY)
1699 void tb_invalidate_phys_addr(AddressSpace *as, hwaddr addr)
1701 ram_addr_t ram_addr;
1702 MemoryRegion *mr;
1703 hwaddr l = 1;
1705 rcu_read_lock();
1706 mr = address_space_translate(as, addr, &addr, &l, false);
1707 if (!(memory_region_is_ram(mr)
1708 || memory_region_is_romd(mr))) {
1709 rcu_read_unlock();
1710 return;
1712 ram_addr = memory_region_get_ram_addr(mr) + addr;
1713 tb_lock();
1714 tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
1715 tb_unlock();
1716 rcu_read_unlock();
1718 #endif /* !defined(CONFIG_USER_ONLY) */
1720 /* Called with tb_lock held. */
1721 void tb_check_watchpoint(CPUState *cpu)
1723 TranslationBlock *tb;
1725 tb = tb_find_pc(cpu->mem_io_pc);
1726 if (tb) {
1727 /* We can use retranslation to find the PC. */
1728 cpu_restore_state_from_tb(cpu, tb, cpu->mem_io_pc);
1729 tb_phys_invalidate(tb, -1);
1730 } else {
1731 /* The exception probably happened in a helper. The CPU state should
1732 have been saved before calling it. Fetch the PC from there. */
1733 CPUArchState *env = cpu->env_ptr;
1734 target_ulong pc, cs_base;
1735 tb_page_addr_t addr;
1736 uint32_t flags;
1738 cpu_get_tb_cpu_state(env, &pc, &cs_base, &flags);
1739 addr = get_page_addr_code(env, pc);
1740 tb_invalidate_phys_range(addr, addr + 1);
1744 #ifndef CONFIG_USER_ONLY
1745 /* in deterministic execution mode, instructions doing device I/Os
1746 must be at the end of the TB */
1747 void cpu_io_recompile(CPUState *cpu, uintptr_t retaddr)
1749 #if defined(TARGET_MIPS) || defined(TARGET_SH4)
1750 CPUArchState *env = cpu->env_ptr;
1751 #endif
1752 TranslationBlock *tb;
1753 uint32_t n, cflags;
1754 target_ulong pc, cs_base;
1755 uint32_t flags;
1757 tb_lock();
1758 tb = tb_find_pc(retaddr);
1759 if (!tb) {
1760 cpu_abort(cpu, "cpu_io_recompile: could not find TB for pc=%p",
1761 (void *)retaddr);
1763 n = cpu->icount_decr.u16.low + tb->icount;
1764 cpu_restore_state_from_tb(cpu, tb, retaddr);
1765 /* Calculate how many instructions had been executed before the fault
1766 occurred. */
1767 n = n - cpu->icount_decr.u16.low;
1768 /* Generate a new TB ending on the I/O insn. */
1769 n++;
1770 /* On MIPS and SH, delay slot instructions can only be restarted if
1771 they were already the first instruction in the TB. If this is not
1772 the first instruction in a TB then re-execute the preceding
1773 branch. */
1774 #if defined(TARGET_MIPS)
1775 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
1776 env->active_tc.PC -= (env->hflags & MIPS_HFLAG_B16 ? 2 : 4);
1777 cpu->icount_decr.u16.low++;
1778 env->hflags &= ~MIPS_HFLAG_BMASK;
1780 #elif defined(TARGET_SH4)
1781 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
1782 && n > 1) {
1783 env->pc -= 2;
1784 cpu->icount_decr.u16.low++;
1785 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
1787 #endif
1788 /* This should never happen. */
1789 if (n > CF_COUNT_MASK) {
1790 cpu_abort(cpu, "TB too big during recompile");
1793 cflags = n | CF_LAST_IO;
1794 pc = tb->pc;
1795 cs_base = tb->cs_base;
1796 flags = tb->flags;
1797 tb_phys_invalidate(tb, -1);
1798 if (tb->cflags & CF_NOCACHE) {
1799 if (tb->orig_tb) {
1800 /* Invalidate original TB if this TB was generated in
1801 * cpu_exec_nocache() */
1802 tb_phys_invalidate(tb->orig_tb, -1);
1804 tb_free(tb);
1806 /* FIXME: In theory this could raise an exception. In practice
1807 we have already translated the block once so it's probably ok. */
1808 tb_gen_code(cpu, pc, cs_base, flags, cflags);
1810 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
1811 * the first in the TB) then we end up generating a whole new TB and
1812 * repeating the fault, which is horribly inefficient.
1813 * Better would be to execute just this insn uncached, or generate a
1814 * second new TB.
1816 * cpu_loop_exit_noexc will longjmp back to cpu_exec where the
1817 * tb_lock gets reset.
1819 cpu_loop_exit_noexc(cpu);
1822 void tb_flush_jmp_cache(CPUState *cpu, target_ulong addr)
1824 unsigned int i;
1826 /* Discard jump cache entries for any tb which might potentially
1827 overlap the flushed page. */
1828 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1829 memset(&cpu->tb_jmp_cache[i], 0,
1830 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1832 i = tb_jmp_cache_hash_page(addr);
1833 memset(&cpu->tb_jmp_cache[i], 0,
1834 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1837 static void print_qht_statistics(FILE *f, fprintf_function cpu_fprintf,
1838 struct qht_stats hst)
1840 uint32_t hgram_opts;
1841 size_t hgram_bins;
1842 char *hgram;
1844 if (!hst.head_buckets) {
1845 return;
1847 cpu_fprintf(f, "TB hash buckets %zu/%zu (%0.2f%% head buckets used)\n",
1848 hst.used_head_buckets, hst.head_buckets,
1849 (double)hst.used_head_buckets / hst.head_buckets * 100);
1851 hgram_opts = QDIST_PR_BORDER | QDIST_PR_LABELS;
1852 hgram_opts |= QDIST_PR_100X | QDIST_PR_PERCENT;
1853 if (qdist_xmax(&hst.occupancy) - qdist_xmin(&hst.occupancy) == 1) {
1854 hgram_opts |= QDIST_PR_NODECIMAL;
1856 hgram = qdist_pr(&hst.occupancy, 10, hgram_opts);
1857 cpu_fprintf(f, "TB hash occupancy %0.2f%% avg chain occ. Histogram: %s\n",
1858 qdist_avg(&hst.occupancy) * 100, hgram);
1859 g_free(hgram);
1861 hgram_opts = QDIST_PR_BORDER | QDIST_PR_LABELS;
1862 hgram_bins = qdist_xmax(&hst.chain) - qdist_xmin(&hst.chain);
1863 if (hgram_bins > 10) {
1864 hgram_bins = 10;
1865 } else {
1866 hgram_bins = 0;
1867 hgram_opts |= QDIST_PR_NODECIMAL | QDIST_PR_NOBINRANGE;
1869 hgram = qdist_pr(&hst.chain, hgram_bins, hgram_opts);
1870 cpu_fprintf(f, "TB hash avg chain %0.3f buckets. Histogram: %s\n",
1871 qdist_avg(&hst.chain), hgram);
1872 g_free(hgram);
1875 void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
1877 int i, target_code_size, max_target_code_size;
1878 int direct_jmp_count, direct_jmp2_count, cross_page;
1879 TranslationBlock *tb;
1880 struct qht_stats hst;
1882 tb_lock();
1884 target_code_size = 0;
1885 max_target_code_size = 0;
1886 cross_page = 0;
1887 direct_jmp_count = 0;
1888 direct_jmp2_count = 0;
1889 for (i = 0; i < tcg_ctx.tb_ctx.nb_tbs; i++) {
1890 tb = &tcg_ctx.tb_ctx.tbs[i];
1891 target_code_size += tb->size;
1892 if (tb->size > max_target_code_size) {
1893 max_target_code_size = tb->size;
1895 if (tb->page_addr[1] != -1) {
1896 cross_page++;
1898 if (tb->jmp_reset_offset[0] != TB_JMP_RESET_OFFSET_INVALID) {
1899 direct_jmp_count++;
1900 if (tb->jmp_reset_offset[1] != TB_JMP_RESET_OFFSET_INVALID) {
1901 direct_jmp2_count++;
1905 /* XXX: avoid using doubles ? */
1906 cpu_fprintf(f, "Translation buffer state:\n");
1907 cpu_fprintf(f, "gen code size %td/%zd\n",
1908 tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer,
1909 tcg_ctx.code_gen_highwater - tcg_ctx.code_gen_buffer);
1910 cpu_fprintf(f, "TB count %d/%d\n",
1911 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.code_gen_max_blocks);
1912 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
1913 tcg_ctx.tb_ctx.nb_tbs ? target_code_size /
1914 tcg_ctx.tb_ctx.nb_tbs : 0,
1915 max_target_code_size);
1916 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
1917 tcg_ctx.tb_ctx.nb_tbs ? (tcg_ctx.code_gen_ptr -
1918 tcg_ctx.code_gen_buffer) /
1919 tcg_ctx.tb_ctx.nb_tbs : 0,
1920 target_code_size ? (double) (tcg_ctx.code_gen_ptr -
1921 tcg_ctx.code_gen_buffer) /
1922 target_code_size : 0);
1923 cpu_fprintf(f, "cross page TB count %d (%d%%)\n", cross_page,
1924 tcg_ctx.tb_ctx.nb_tbs ? (cross_page * 100) /
1925 tcg_ctx.tb_ctx.nb_tbs : 0);
1926 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
1927 direct_jmp_count,
1928 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp_count * 100) /
1929 tcg_ctx.tb_ctx.nb_tbs : 0,
1930 direct_jmp2_count,
1931 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp2_count * 100) /
1932 tcg_ctx.tb_ctx.nb_tbs : 0);
1934 qht_statistics_init(&tcg_ctx.tb_ctx.htable, &hst);
1935 print_qht_statistics(f, cpu_fprintf, hst);
1936 qht_statistics_destroy(&hst);
1938 cpu_fprintf(f, "\nStatistics:\n");
1939 cpu_fprintf(f, "TB flush count %u\n",
1940 atomic_read(&tcg_ctx.tb_ctx.tb_flush_count));
1941 cpu_fprintf(f, "TB invalidate count %d\n",
1942 tcg_ctx.tb_ctx.tb_phys_invalidate_count);
1943 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
1944 tcg_dump_info(f, cpu_fprintf);
1946 tb_unlock();
1949 void dump_opcount_info(FILE *f, fprintf_function cpu_fprintf)
1951 tcg_dump_op_count(f, cpu_fprintf);
1954 #else /* CONFIG_USER_ONLY */
1956 void cpu_interrupt(CPUState *cpu, int mask)
1958 cpu->interrupt_request |= mask;
1959 cpu->tcg_exit_req = 1;
1963 * Walks guest process memory "regions" one by one
1964 * and calls callback function 'fn' for each region.
1966 struct walk_memory_regions_data {
1967 walk_memory_regions_fn fn;
1968 void *priv;
1969 target_ulong start;
1970 int prot;
1973 static int walk_memory_regions_end(struct walk_memory_regions_data *data,
1974 target_ulong end, int new_prot)
1976 if (data->start != -1u) {
1977 int rc = data->fn(data->priv, data->start, end, data->prot);
1978 if (rc != 0) {
1979 return rc;
1983 data->start = (new_prot ? end : -1u);
1984 data->prot = new_prot;
1986 return 0;
1989 static int walk_memory_regions_1(struct walk_memory_regions_data *data,
1990 target_ulong base, int level, void **lp)
1992 target_ulong pa;
1993 int i, rc;
1995 if (*lp == NULL) {
1996 return walk_memory_regions_end(data, base, 0);
1999 if (level == 0) {
2000 PageDesc *pd = *lp;
2002 for (i = 0; i < V_L2_SIZE; ++i) {
2003 int prot = pd[i].flags;
2005 pa = base | (i << TARGET_PAGE_BITS);
2006 if (prot != data->prot) {
2007 rc = walk_memory_regions_end(data, pa, prot);
2008 if (rc != 0) {
2009 return rc;
2013 } else {
2014 void **pp = *lp;
2016 for (i = 0; i < V_L2_SIZE; ++i) {
2017 pa = base | ((target_ulong)i <<
2018 (TARGET_PAGE_BITS + V_L2_BITS * level));
2019 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
2020 if (rc != 0) {
2021 return rc;
2026 return 0;
2029 int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
2031 struct walk_memory_regions_data data;
2032 uintptr_t i, l1_sz = v_l1_size;
2034 data.fn = fn;
2035 data.priv = priv;
2036 data.start = -1u;
2037 data.prot = 0;
2039 for (i = 0; i < l1_sz; i++) {
2040 target_ulong base = i << (v_l1_shift + TARGET_PAGE_BITS);
2041 int rc = walk_memory_regions_1(&data, base, v_l2_levels, l1_map + i);
2042 if (rc != 0) {
2043 return rc;
2047 return walk_memory_regions_end(&data, 0, 0);
2050 static int dump_region(void *priv, target_ulong start,
2051 target_ulong end, unsigned long prot)
2053 FILE *f = (FILE *)priv;
2055 (void) fprintf(f, TARGET_FMT_lx"-"TARGET_FMT_lx
2056 " "TARGET_FMT_lx" %c%c%c\n",
2057 start, end, end - start,
2058 ((prot & PAGE_READ) ? 'r' : '-'),
2059 ((prot & PAGE_WRITE) ? 'w' : '-'),
2060 ((prot & PAGE_EXEC) ? 'x' : '-'));
2062 return 0;
2065 /* dump memory mappings */
2066 void page_dump(FILE *f)
2068 const int length = sizeof(target_ulong) * 2;
2069 (void) fprintf(f, "%-*s %-*s %-*s %s\n",
2070 length, "start", length, "end", length, "size", "prot");
2071 walk_memory_regions(f, dump_region);
2074 int page_get_flags(target_ulong address)
2076 PageDesc *p;
2078 p = page_find(address >> TARGET_PAGE_BITS);
2079 if (!p) {
2080 return 0;
2082 return p->flags;
2085 /* Modify the flags of a page and invalidate the code if necessary.
2086 The flag PAGE_WRITE_ORG is positioned automatically depending
2087 on PAGE_WRITE. The mmap_lock should already be held. */
2088 void page_set_flags(target_ulong start, target_ulong end, int flags)
2090 target_ulong addr, len;
2092 /* This function should never be called with addresses outside the
2093 guest address space. If this assert fires, it probably indicates
2094 a missing call to h2g_valid. */
2095 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2096 assert(end < ((target_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2097 #endif
2098 assert(start < end);
2099 assert_memory_lock();
2101 start = start & TARGET_PAGE_MASK;
2102 end = TARGET_PAGE_ALIGN(end);
2104 if (flags & PAGE_WRITE) {
2105 flags |= PAGE_WRITE_ORG;
2108 for (addr = start, len = end - start;
2109 len != 0;
2110 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2111 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2113 /* If the write protection bit is set, then we invalidate
2114 the code inside. */
2115 if (!(p->flags & PAGE_WRITE) &&
2116 (flags & PAGE_WRITE) &&
2117 p->first_tb) {
2118 tb_invalidate_phys_page(addr, 0);
2120 p->flags = flags;
2124 int page_check_range(target_ulong start, target_ulong len, int flags)
2126 PageDesc *p;
2127 target_ulong end;
2128 target_ulong addr;
2130 /* This function should never be called with addresses outside the
2131 guest address space. If this assert fires, it probably indicates
2132 a missing call to h2g_valid. */
2133 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2134 assert(start < ((target_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2135 #endif
2137 if (len == 0) {
2138 return 0;
2140 if (start + len - 1 < start) {
2141 /* We've wrapped around. */
2142 return -1;
2145 /* must do before we loose bits in the next step */
2146 end = TARGET_PAGE_ALIGN(start + len);
2147 start = start & TARGET_PAGE_MASK;
2149 for (addr = start, len = end - start;
2150 len != 0;
2151 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2152 p = page_find(addr >> TARGET_PAGE_BITS);
2153 if (!p) {
2154 return -1;
2156 if (!(p->flags & PAGE_VALID)) {
2157 return -1;
2160 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ)) {
2161 return -1;
2163 if (flags & PAGE_WRITE) {
2164 if (!(p->flags & PAGE_WRITE_ORG)) {
2165 return -1;
2167 /* unprotect the page if it was put read-only because it
2168 contains translated code */
2169 if (!(p->flags & PAGE_WRITE)) {
2170 if (!page_unprotect(addr, 0)) {
2171 return -1;
2176 return 0;
2179 /* called from signal handler: invalidate the code and unprotect the
2180 * page. Return 0 if the fault was not handled, 1 if it was handled,
2181 * and 2 if it was handled but the caller must cause the TB to be
2182 * immediately exited. (We can only return 2 if the 'pc' argument is
2183 * non-zero.)
2185 int page_unprotect(target_ulong address, uintptr_t pc)
2187 unsigned int prot;
2188 bool current_tb_invalidated;
2189 PageDesc *p;
2190 target_ulong host_start, host_end, addr;
2192 /* Technically this isn't safe inside a signal handler. However we
2193 know this only ever happens in a synchronous SEGV handler, so in
2194 practice it seems to be ok. */
2195 mmap_lock();
2197 p = page_find(address >> TARGET_PAGE_BITS);
2198 if (!p) {
2199 mmap_unlock();
2200 return 0;
2203 /* if the page was really writable, then we change its
2204 protection back to writable */
2205 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
2206 host_start = address & qemu_host_page_mask;
2207 host_end = host_start + qemu_host_page_size;
2209 prot = 0;
2210 current_tb_invalidated = false;
2211 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
2212 p = page_find(addr >> TARGET_PAGE_BITS);
2213 p->flags |= PAGE_WRITE;
2214 prot |= p->flags;
2216 /* and since the content will be modified, we must invalidate
2217 the corresponding translated code. */
2218 current_tb_invalidated |= tb_invalidate_phys_page(addr, pc);
2219 #ifdef DEBUG_TB_CHECK
2220 tb_invalidate_check(addr);
2221 #endif
2223 mprotect((void *)g2h(host_start), qemu_host_page_size,
2224 prot & PAGE_BITS);
2226 mmap_unlock();
2227 /* If current TB was invalidated return to main loop */
2228 return current_tb_invalidated ? 2 : 1;
2230 mmap_unlock();
2231 return 0;
2233 #endif /* CONFIG_USER_ONLY */