ppc/spapr: implement H_SIGNAL_SYS_RESET
[qemu/kevin.git] / translate-all.c
blob6d2fcabca792a5e54af2bda1e95ea28c837b2338
1 /*
2 * Host code generation
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
19 #ifdef _WIN32
20 #include <windows.h>
21 #endif
22 #include "qemu/osdep.h"
25 #include "qemu-common.h"
26 #define NO_CPU_IO_DEFS
27 #include "cpu.h"
28 #include "trace.h"
29 #include "disas/disas.h"
30 #include "exec/exec-all.h"
31 #include "tcg.h"
32 #if defined(CONFIG_USER_ONLY)
33 #include "qemu.h"
34 #include "exec/exec-all.h"
35 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
36 #include <sys/param.h>
37 #if __FreeBSD_version >= 700104
38 #define HAVE_KINFO_GETVMMAP
39 #define sigqueue sigqueue_freebsd /* avoid redefinition */
40 #include <sys/proc.h>
41 #include <machine/profile.h>
42 #define _KERNEL
43 #include <sys/user.h>
44 #undef _KERNEL
45 #undef sigqueue
46 #include <libutil.h>
47 #endif
48 #endif
49 #else
50 #include "exec/address-spaces.h"
51 #endif
53 #include "exec/cputlb.h"
54 #include "exec/tb-hash.h"
55 #include "translate-all.h"
56 #include "qemu/bitmap.h"
57 #include "qemu/timer.h"
58 #include "exec/log.h"
60 /* #define DEBUG_TB_INVALIDATE */
61 /* #define DEBUG_TB_FLUSH */
62 /* #define DEBUG_LOCKING */
63 /* make various TB consistency checks */
64 /* #define DEBUG_TB_CHECK */
66 #if !defined(CONFIG_USER_ONLY)
67 /* TB consistency checks only implemented for usermode emulation. */
68 #undef DEBUG_TB_CHECK
69 #endif
71 /* Access to the various translations structures need to be serialised via locks
72 * for consistency. This is automatic for SoftMMU based system
73 * emulation due to its single threaded nature. In user-mode emulation
74 * access to the memory related structures are protected with the
75 * mmap_lock.
77 #ifdef DEBUG_LOCKING
78 #define DEBUG_MEM_LOCKS 1
79 #else
80 #define DEBUG_MEM_LOCKS 0
81 #endif
83 #ifdef CONFIG_SOFTMMU
84 #define assert_memory_lock() do { /* nothing */ } while (0)
85 #else
86 #define assert_memory_lock() do { \
87 if (DEBUG_MEM_LOCKS) { \
88 g_assert(have_mmap_lock()); \
89 } \
90 } while (0)
91 #endif
93 #define SMC_BITMAP_USE_THRESHOLD 10
95 typedef struct PageDesc {
96 /* list of TBs intersecting this ram page */
97 TranslationBlock *first_tb;
98 #ifdef CONFIG_SOFTMMU
99 /* in order to optimize self modifying code, we count the number
100 of lookups we do to a given page to use a bitmap */
101 unsigned int code_write_count;
102 unsigned long *code_bitmap;
103 #else
104 unsigned long flags;
105 #endif
106 } PageDesc;
108 /* In system mode we want L1_MAP to be based on ram offsets,
109 while in user mode we want it to be based on virtual addresses. */
110 #if !defined(CONFIG_USER_ONLY)
111 #if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
112 # define L1_MAP_ADDR_SPACE_BITS HOST_LONG_BITS
113 #else
114 # define L1_MAP_ADDR_SPACE_BITS TARGET_PHYS_ADDR_SPACE_BITS
115 #endif
116 #else
117 # define L1_MAP_ADDR_SPACE_BITS TARGET_VIRT_ADDR_SPACE_BITS
118 #endif
120 /* Size of the L2 (and L3, etc) page tables. */
121 #define V_L2_BITS 10
122 #define V_L2_SIZE (1 << V_L2_BITS)
124 uintptr_t qemu_host_page_size;
125 intptr_t qemu_host_page_mask;
128 * L1 Mapping properties
130 static int v_l1_size;
131 static int v_l1_shift;
132 static int v_l2_levels;
134 /* The bottom level has pointers to PageDesc, and is indexed by
135 * anything from 4 to (V_L2_BITS + 3) bits, depending on target page size.
137 #define V_L1_MIN_BITS 4
138 #define V_L1_MAX_BITS (V_L2_BITS + 3)
139 #define V_L1_MAX_SIZE (1 << V_L1_MAX_BITS)
141 static void *l1_map[V_L1_MAX_SIZE];
143 /* code generation context */
144 TCGContext tcg_ctx;
145 bool parallel_cpus;
147 /* translation block context */
148 #ifdef CONFIG_USER_ONLY
149 __thread int have_tb_lock;
150 #endif
152 static void page_table_config_init(void)
154 uint32_t v_l1_bits;
156 assert(TARGET_PAGE_BITS);
157 /* The bits remaining after N lower levels of page tables. */
158 v_l1_bits = (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % V_L2_BITS;
159 if (v_l1_bits < V_L1_MIN_BITS) {
160 v_l1_bits += V_L2_BITS;
163 v_l1_size = 1 << v_l1_bits;
164 v_l1_shift = L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - v_l1_bits;
165 v_l2_levels = v_l1_shift / V_L2_BITS - 1;
167 assert(v_l1_bits <= V_L1_MAX_BITS);
168 assert(v_l1_shift % V_L2_BITS == 0);
169 assert(v_l2_levels >= 0);
172 void tb_lock(void)
174 #ifdef CONFIG_USER_ONLY
175 assert(!have_tb_lock);
176 qemu_mutex_lock(&tcg_ctx.tb_ctx.tb_lock);
177 have_tb_lock++;
178 #endif
181 void tb_unlock(void)
183 #ifdef CONFIG_USER_ONLY
184 assert(have_tb_lock);
185 have_tb_lock--;
186 qemu_mutex_unlock(&tcg_ctx.tb_ctx.tb_lock);
187 #endif
190 void tb_lock_reset(void)
192 #ifdef CONFIG_USER_ONLY
193 if (have_tb_lock) {
194 qemu_mutex_unlock(&tcg_ctx.tb_ctx.tb_lock);
195 have_tb_lock = 0;
197 #endif
200 #ifdef DEBUG_LOCKING
201 #define DEBUG_TB_LOCKS 1
202 #else
203 #define DEBUG_TB_LOCKS 0
204 #endif
206 #ifdef CONFIG_SOFTMMU
207 #define assert_tb_lock() do { /* nothing */ } while (0)
208 #else
209 #define assert_tb_lock() do { \
210 if (DEBUG_TB_LOCKS) { \
211 g_assert(have_tb_lock); \
213 } while (0)
214 #endif
217 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr);
219 void cpu_gen_init(void)
221 tcg_context_init(&tcg_ctx);
224 /* Encode VAL as a signed leb128 sequence at P.
225 Return P incremented past the encoded value. */
226 static uint8_t *encode_sleb128(uint8_t *p, target_long val)
228 int more, byte;
230 do {
231 byte = val & 0x7f;
232 val >>= 7;
233 more = !((val == 0 && (byte & 0x40) == 0)
234 || (val == -1 && (byte & 0x40) != 0));
235 if (more) {
236 byte |= 0x80;
238 *p++ = byte;
239 } while (more);
241 return p;
244 /* Decode a signed leb128 sequence at *PP; increment *PP past the
245 decoded value. Return the decoded value. */
246 static target_long decode_sleb128(uint8_t **pp)
248 uint8_t *p = *pp;
249 target_long val = 0;
250 int byte, shift = 0;
252 do {
253 byte = *p++;
254 val |= (target_ulong)(byte & 0x7f) << shift;
255 shift += 7;
256 } while (byte & 0x80);
257 if (shift < TARGET_LONG_BITS && (byte & 0x40)) {
258 val |= -(target_ulong)1 << shift;
261 *pp = p;
262 return val;
265 /* Encode the data collected about the instructions while compiling TB.
266 Place the data at BLOCK, and return the number of bytes consumed.
268 The logical table consisits of TARGET_INSN_START_WORDS target_ulong's,
269 which come from the target's insn_start data, followed by a uintptr_t
270 which comes from the host pc of the end of the code implementing the insn.
272 Each line of the table is encoded as sleb128 deltas from the previous
273 line. The seed for the first line is { tb->pc, 0..., tb->tc_ptr }.
274 That is, the first column is seeded with the guest pc, the last column
275 with the host pc, and the middle columns with zeros. */
277 static int encode_search(TranslationBlock *tb, uint8_t *block)
279 uint8_t *highwater = tcg_ctx.code_gen_highwater;
280 uint8_t *p = block;
281 int i, j, n;
283 tb->tc_search = block;
285 for (i = 0, n = tb->icount; i < n; ++i) {
286 target_ulong prev;
288 for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
289 if (i == 0) {
290 prev = (j == 0 ? tb->pc : 0);
291 } else {
292 prev = tcg_ctx.gen_insn_data[i - 1][j];
294 p = encode_sleb128(p, tcg_ctx.gen_insn_data[i][j] - prev);
296 prev = (i == 0 ? 0 : tcg_ctx.gen_insn_end_off[i - 1]);
297 p = encode_sleb128(p, tcg_ctx.gen_insn_end_off[i] - prev);
299 /* Test for (pending) buffer overflow. The assumption is that any
300 one row beginning below the high water mark cannot overrun
301 the buffer completely. Thus we can test for overflow after
302 encoding a row without having to check during encoding. */
303 if (unlikely(p > highwater)) {
304 return -1;
308 return p - block;
311 /* The cpu state corresponding to 'searched_pc' is restored.
312 * Called with tb_lock held.
314 static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
315 uintptr_t searched_pc)
317 target_ulong data[TARGET_INSN_START_WORDS] = { tb->pc };
318 uintptr_t host_pc = (uintptr_t)tb->tc_ptr;
319 CPUArchState *env = cpu->env_ptr;
320 uint8_t *p = tb->tc_search;
321 int i, j, num_insns = tb->icount;
322 #ifdef CONFIG_PROFILER
323 int64_t ti = profile_getclock();
324 #endif
326 searched_pc -= GETPC_ADJ;
328 if (searched_pc < host_pc) {
329 return -1;
332 /* Reconstruct the stored insn data while looking for the point at
333 which the end of the insn exceeds the searched_pc. */
334 for (i = 0; i < num_insns; ++i) {
335 for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
336 data[j] += decode_sleb128(&p);
338 host_pc += decode_sleb128(&p);
339 if (host_pc > searched_pc) {
340 goto found;
343 return -1;
345 found:
346 if (tb->cflags & CF_USE_ICOUNT) {
347 assert(use_icount);
348 /* Reset the cycle counter to the start of the block. */
349 cpu->icount_decr.u16.low += num_insns;
350 /* Clear the IO flag. */
351 cpu->can_do_io = 0;
353 cpu->icount_decr.u16.low -= i;
354 restore_state_to_opc(env, tb, data);
356 #ifdef CONFIG_PROFILER
357 tcg_ctx.restore_time += profile_getclock() - ti;
358 tcg_ctx.restore_count++;
359 #endif
360 return 0;
363 bool cpu_restore_state(CPUState *cpu, uintptr_t retaddr)
365 TranslationBlock *tb;
366 bool r = false;
368 tb_lock();
369 tb = tb_find_pc(retaddr);
370 if (tb) {
371 cpu_restore_state_from_tb(cpu, tb, retaddr);
372 if (tb->cflags & CF_NOCACHE) {
373 /* one-shot translation, invalidate it immediately */
374 tb_phys_invalidate(tb, -1);
375 tb_free(tb);
377 r = true;
379 tb_unlock();
381 return r;
384 void page_size_init(void)
386 /* NOTE: we can always suppose that qemu_host_page_size >=
387 TARGET_PAGE_SIZE */
388 qemu_real_host_page_size = getpagesize();
389 qemu_real_host_page_mask = -(intptr_t)qemu_real_host_page_size;
390 if (qemu_host_page_size == 0) {
391 qemu_host_page_size = qemu_real_host_page_size;
393 if (qemu_host_page_size < TARGET_PAGE_SIZE) {
394 qemu_host_page_size = TARGET_PAGE_SIZE;
396 qemu_host_page_mask = -(intptr_t)qemu_host_page_size;
399 static void page_init(void)
401 page_size_init();
402 page_table_config_init();
404 #if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
406 #ifdef HAVE_KINFO_GETVMMAP
407 struct kinfo_vmentry *freep;
408 int i, cnt;
410 freep = kinfo_getvmmap(getpid(), &cnt);
411 if (freep) {
412 mmap_lock();
413 for (i = 0; i < cnt; i++) {
414 unsigned long startaddr, endaddr;
416 startaddr = freep[i].kve_start;
417 endaddr = freep[i].kve_end;
418 if (h2g_valid(startaddr)) {
419 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
421 if (h2g_valid(endaddr)) {
422 endaddr = h2g(endaddr);
423 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
424 } else {
425 #if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
426 endaddr = ~0ul;
427 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
428 #endif
432 free(freep);
433 mmap_unlock();
435 #else
436 FILE *f;
438 last_brk = (unsigned long)sbrk(0);
440 f = fopen("/compat/linux/proc/self/maps", "r");
441 if (f) {
442 mmap_lock();
444 do {
445 unsigned long startaddr, endaddr;
446 int n;
448 n = fscanf(f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);
450 if (n == 2 && h2g_valid(startaddr)) {
451 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
453 if (h2g_valid(endaddr)) {
454 endaddr = h2g(endaddr);
455 } else {
456 endaddr = ~0ul;
458 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
460 } while (!feof(f));
462 fclose(f);
463 mmap_unlock();
465 #endif
467 #endif
470 /* If alloc=1:
471 * Called with tb_lock held for system emulation.
472 * Called with mmap_lock held for user-mode emulation.
474 static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
476 PageDesc *pd;
477 void **lp;
478 int i;
480 if (alloc) {
481 assert_memory_lock();
484 /* Level 1. Always allocated. */
485 lp = l1_map + ((index >> v_l1_shift) & (v_l1_size - 1));
487 /* Level 2..N-1. */
488 for (i = v_l2_levels; i > 0; i--) {
489 void **p = atomic_rcu_read(lp);
491 if (p == NULL) {
492 if (!alloc) {
493 return NULL;
495 p = g_new0(void *, V_L2_SIZE);
496 atomic_rcu_set(lp, p);
499 lp = p + ((index >> (i * V_L2_BITS)) & (V_L2_SIZE - 1));
502 pd = atomic_rcu_read(lp);
503 if (pd == NULL) {
504 if (!alloc) {
505 return NULL;
507 pd = g_new0(PageDesc, V_L2_SIZE);
508 atomic_rcu_set(lp, pd);
511 return pd + (index & (V_L2_SIZE - 1));
514 static inline PageDesc *page_find(tb_page_addr_t index)
516 return page_find_alloc(index, 0);
519 #if defined(CONFIG_USER_ONLY)
520 /* Currently it is not recommended to allocate big chunks of data in
521 user mode. It will change when a dedicated libc will be used. */
522 /* ??? 64-bit hosts ought to have no problem mmaping data outside the
523 region in which the guest needs to run. Revisit this. */
524 #define USE_STATIC_CODE_GEN_BUFFER
525 #endif
527 /* Minimum size of the code gen buffer. This number is randomly chosen,
528 but not so small that we can't have a fair number of TB's live. */
529 #define MIN_CODE_GEN_BUFFER_SIZE (1024u * 1024)
531 /* Maximum size of the code gen buffer we'd like to use. Unless otherwise
532 indicated, this is constrained by the range of direct branches on the
533 host cpu, as used by the TCG implementation of goto_tb. */
534 #if defined(__x86_64__)
535 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
536 #elif defined(__sparc__)
537 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
538 #elif defined(__powerpc64__)
539 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
540 #elif defined(__powerpc__)
541 # define MAX_CODE_GEN_BUFFER_SIZE (32u * 1024 * 1024)
542 #elif defined(__aarch64__)
543 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
544 #elif defined(__arm__)
545 # define MAX_CODE_GEN_BUFFER_SIZE (16u * 1024 * 1024)
546 #elif defined(__s390x__)
547 /* We have a +- 4GB range on the branches; leave some slop. */
548 # define MAX_CODE_GEN_BUFFER_SIZE (3ul * 1024 * 1024 * 1024)
549 #elif defined(__mips__)
550 /* We have a 256MB branch region, but leave room to make sure the
551 main executable is also within that region. */
552 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
553 #else
554 # define MAX_CODE_GEN_BUFFER_SIZE ((size_t)-1)
555 #endif
557 #define DEFAULT_CODE_GEN_BUFFER_SIZE_1 (32u * 1024 * 1024)
559 #define DEFAULT_CODE_GEN_BUFFER_SIZE \
560 (DEFAULT_CODE_GEN_BUFFER_SIZE_1 < MAX_CODE_GEN_BUFFER_SIZE \
561 ? DEFAULT_CODE_GEN_BUFFER_SIZE_1 : MAX_CODE_GEN_BUFFER_SIZE)
563 static inline size_t size_code_gen_buffer(size_t tb_size)
565 /* Size the buffer. */
566 if (tb_size == 0) {
567 #ifdef USE_STATIC_CODE_GEN_BUFFER
568 tb_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
569 #else
570 /* ??? Needs adjustments. */
571 /* ??? If we relax the requirement that CONFIG_USER_ONLY use the
572 static buffer, we could size this on RESERVED_VA, on the text
573 segment size of the executable, or continue to use the default. */
574 tb_size = (unsigned long)(ram_size / 4);
575 #endif
577 if (tb_size < MIN_CODE_GEN_BUFFER_SIZE) {
578 tb_size = MIN_CODE_GEN_BUFFER_SIZE;
580 if (tb_size > MAX_CODE_GEN_BUFFER_SIZE) {
581 tb_size = MAX_CODE_GEN_BUFFER_SIZE;
583 return tb_size;
586 #ifdef __mips__
587 /* In order to use J and JAL within the code_gen_buffer, we require
588 that the buffer not cross a 256MB boundary. */
589 static inline bool cross_256mb(void *addr, size_t size)
591 return ((uintptr_t)addr ^ ((uintptr_t)addr + size)) & ~0x0ffffffful;
594 /* We weren't able to allocate a buffer without crossing that boundary,
595 so make do with the larger portion of the buffer that doesn't cross.
596 Returns the new base of the buffer, and adjusts code_gen_buffer_size. */
597 static inline void *split_cross_256mb(void *buf1, size_t size1)
599 void *buf2 = (void *)(((uintptr_t)buf1 + size1) & ~0x0ffffffful);
600 size_t size2 = buf1 + size1 - buf2;
602 size1 = buf2 - buf1;
603 if (size1 < size2) {
604 size1 = size2;
605 buf1 = buf2;
608 tcg_ctx.code_gen_buffer_size = size1;
609 return buf1;
611 #endif
613 #ifdef USE_STATIC_CODE_GEN_BUFFER
614 static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
615 __attribute__((aligned(CODE_GEN_ALIGN)));
617 # ifdef _WIN32
618 static inline void do_protect(void *addr, long size, int prot)
620 DWORD old_protect;
621 VirtualProtect(addr, size, prot, &old_protect);
624 static inline void map_exec(void *addr, long size)
626 do_protect(addr, size, PAGE_EXECUTE_READWRITE);
629 static inline void map_none(void *addr, long size)
631 do_protect(addr, size, PAGE_NOACCESS);
633 # else
634 static inline void do_protect(void *addr, long size, int prot)
636 uintptr_t start, end;
638 start = (uintptr_t)addr;
639 start &= qemu_real_host_page_mask;
641 end = (uintptr_t)addr + size;
642 end = ROUND_UP(end, qemu_real_host_page_size);
644 mprotect((void *)start, end - start, prot);
647 static inline void map_exec(void *addr, long size)
649 do_protect(addr, size, PROT_READ | PROT_WRITE | PROT_EXEC);
652 static inline void map_none(void *addr, long size)
654 do_protect(addr, size, PROT_NONE);
656 # endif /* WIN32 */
658 static inline void *alloc_code_gen_buffer(void)
660 void *buf = static_code_gen_buffer;
661 size_t full_size, size;
663 /* The size of the buffer, rounded down to end on a page boundary. */
664 full_size = (((uintptr_t)buf + sizeof(static_code_gen_buffer))
665 & qemu_real_host_page_mask) - (uintptr_t)buf;
667 /* Reserve a guard page. */
668 size = full_size - qemu_real_host_page_size;
670 /* Honor a command-line option limiting the size of the buffer. */
671 if (size > tcg_ctx.code_gen_buffer_size) {
672 size = (((uintptr_t)buf + tcg_ctx.code_gen_buffer_size)
673 & qemu_real_host_page_mask) - (uintptr_t)buf;
675 tcg_ctx.code_gen_buffer_size = size;
677 #ifdef __mips__
678 if (cross_256mb(buf, size)) {
679 buf = split_cross_256mb(buf, size);
680 size = tcg_ctx.code_gen_buffer_size;
682 #endif
684 map_exec(buf, size);
685 map_none(buf + size, qemu_real_host_page_size);
686 qemu_madvise(buf, size, QEMU_MADV_HUGEPAGE);
688 return buf;
690 #elif defined(_WIN32)
691 static inline void *alloc_code_gen_buffer(void)
693 size_t size = tcg_ctx.code_gen_buffer_size;
694 void *buf1, *buf2;
696 /* Perform the allocation in two steps, so that the guard page
697 is reserved but uncommitted. */
698 buf1 = VirtualAlloc(NULL, size + qemu_real_host_page_size,
699 MEM_RESERVE, PAGE_NOACCESS);
700 if (buf1 != NULL) {
701 buf2 = VirtualAlloc(buf1, size, MEM_COMMIT, PAGE_EXECUTE_READWRITE);
702 assert(buf1 == buf2);
705 return buf1;
707 #else
708 static inline void *alloc_code_gen_buffer(void)
710 int flags = MAP_PRIVATE | MAP_ANONYMOUS;
711 uintptr_t start = 0;
712 size_t size = tcg_ctx.code_gen_buffer_size;
713 void *buf;
715 /* Constrain the position of the buffer based on the host cpu.
716 Note that these addresses are chosen in concert with the
717 addresses assigned in the relevant linker script file. */
718 # if defined(__PIE__) || defined(__PIC__)
719 /* Don't bother setting a preferred location if we're building
720 a position-independent executable. We're more likely to get
721 an address near the main executable if we let the kernel
722 choose the address. */
723 # elif defined(__x86_64__) && defined(MAP_32BIT)
724 /* Force the memory down into low memory with the executable.
725 Leave the choice of exact location with the kernel. */
726 flags |= MAP_32BIT;
727 /* Cannot expect to map more than 800MB in low memory. */
728 if (size > 800u * 1024 * 1024) {
729 tcg_ctx.code_gen_buffer_size = size = 800u * 1024 * 1024;
731 # elif defined(__sparc__)
732 start = 0x40000000ul;
733 # elif defined(__s390x__)
734 start = 0x90000000ul;
735 # elif defined(__mips__)
736 # if _MIPS_SIM == _ABI64
737 start = 0x128000000ul;
738 # else
739 start = 0x08000000ul;
740 # endif
741 # endif
743 buf = mmap((void *)start, size + qemu_real_host_page_size,
744 PROT_NONE, flags, -1, 0);
745 if (buf == MAP_FAILED) {
746 return NULL;
749 #ifdef __mips__
750 if (cross_256mb(buf, size)) {
751 /* Try again, with the original still mapped, to avoid re-acquiring
752 that 256mb crossing. This time don't specify an address. */
753 size_t size2;
754 void *buf2 = mmap(NULL, size + qemu_real_host_page_size,
755 PROT_NONE, flags, -1, 0);
756 switch ((int)(buf2 != MAP_FAILED)) {
757 case 1:
758 if (!cross_256mb(buf2, size)) {
759 /* Success! Use the new buffer. */
760 munmap(buf, size + qemu_real_host_page_size);
761 break;
763 /* Failure. Work with what we had. */
764 munmap(buf2, size + qemu_real_host_page_size);
765 /* fallthru */
766 default:
767 /* Split the original buffer. Free the smaller half. */
768 buf2 = split_cross_256mb(buf, size);
769 size2 = tcg_ctx.code_gen_buffer_size;
770 if (buf == buf2) {
771 munmap(buf + size2 + qemu_real_host_page_size, size - size2);
772 } else {
773 munmap(buf, size - size2);
775 size = size2;
776 break;
778 buf = buf2;
780 #endif
782 /* Make the final buffer accessible. The guard page at the end
783 will remain inaccessible with PROT_NONE. */
784 mprotect(buf, size, PROT_WRITE | PROT_READ | PROT_EXEC);
786 /* Request large pages for the buffer. */
787 qemu_madvise(buf, size, QEMU_MADV_HUGEPAGE);
789 return buf;
791 #endif /* USE_STATIC_CODE_GEN_BUFFER, WIN32, POSIX */
793 static inline void code_gen_alloc(size_t tb_size)
795 tcg_ctx.code_gen_buffer_size = size_code_gen_buffer(tb_size);
796 tcg_ctx.code_gen_buffer = alloc_code_gen_buffer();
797 if (tcg_ctx.code_gen_buffer == NULL) {
798 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
799 exit(1);
802 /* Estimate a good size for the number of TBs we can support. We
803 still haven't deducted the prologue from the buffer size here,
804 but that's minimal and won't affect the estimate much. */
805 tcg_ctx.code_gen_max_blocks
806 = tcg_ctx.code_gen_buffer_size / CODE_GEN_AVG_BLOCK_SIZE;
807 tcg_ctx.tb_ctx.tbs = g_new(TranslationBlock, tcg_ctx.code_gen_max_blocks);
809 qemu_mutex_init(&tcg_ctx.tb_ctx.tb_lock);
812 static void tb_htable_init(void)
814 unsigned int mode = QHT_MODE_AUTO_RESIZE;
816 qht_init(&tcg_ctx.tb_ctx.htable, CODE_GEN_HTABLE_SIZE, mode);
819 /* Must be called before using the QEMU cpus. 'tb_size' is the size
820 (in bytes) allocated to the translation buffer. Zero means default
821 size. */
822 void tcg_exec_init(unsigned long tb_size)
824 cpu_gen_init();
825 page_init();
826 tb_htable_init();
827 code_gen_alloc(tb_size);
828 #if defined(CONFIG_SOFTMMU)
829 /* There's no guest base to take into account, so go ahead and
830 initialize the prologue now. */
831 tcg_prologue_init(&tcg_ctx);
832 #endif
835 bool tcg_enabled(void)
837 return tcg_ctx.code_gen_buffer != NULL;
841 * Allocate a new translation block. Flush the translation buffer if
842 * too many translation blocks or too much generated code.
844 * Called with tb_lock held.
846 static TranslationBlock *tb_alloc(target_ulong pc)
848 TranslationBlock *tb;
850 assert_tb_lock();
852 if (tcg_ctx.tb_ctx.nb_tbs >= tcg_ctx.code_gen_max_blocks) {
853 return NULL;
855 tb = &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs++];
856 tb->pc = pc;
857 tb->cflags = 0;
858 tb->invalid = false;
859 return tb;
862 /* Called with tb_lock held. */
863 void tb_free(TranslationBlock *tb)
865 assert_tb_lock();
867 /* In practice this is mostly used for single use temporary TB
868 Ignore the hard cases and just back up if this TB happens to
869 be the last one generated. */
870 if (tcg_ctx.tb_ctx.nb_tbs > 0 &&
871 tb == &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs - 1]) {
872 tcg_ctx.code_gen_ptr = tb->tc_ptr;
873 tcg_ctx.tb_ctx.nb_tbs--;
877 static inline void invalidate_page_bitmap(PageDesc *p)
879 #ifdef CONFIG_SOFTMMU
880 g_free(p->code_bitmap);
881 p->code_bitmap = NULL;
882 p->code_write_count = 0;
883 #endif
886 /* Set to NULL all the 'first_tb' fields in all PageDescs. */
887 static void page_flush_tb_1(int level, void **lp)
889 int i;
891 if (*lp == NULL) {
892 return;
894 if (level == 0) {
895 PageDesc *pd = *lp;
897 for (i = 0; i < V_L2_SIZE; ++i) {
898 pd[i].first_tb = NULL;
899 invalidate_page_bitmap(pd + i);
901 } else {
902 void **pp = *lp;
904 for (i = 0; i < V_L2_SIZE; ++i) {
905 page_flush_tb_1(level - 1, pp + i);
910 static void page_flush_tb(void)
912 int i, l1_sz = v_l1_size;
914 for (i = 0; i < l1_sz; i++) {
915 page_flush_tb_1(v_l2_levels, l1_map + i);
919 /* flush all the translation blocks */
920 static void do_tb_flush(CPUState *cpu, run_on_cpu_data tb_flush_count)
922 tb_lock();
924 /* If it is already been done on request of another CPU,
925 * just retry.
927 if (tcg_ctx.tb_ctx.tb_flush_count != tb_flush_count.host_int) {
928 goto done;
931 #if defined(DEBUG_TB_FLUSH)
932 printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
933 (unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer),
934 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.tb_ctx.nb_tbs > 0 ?
935 ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)) /
936 tcg_ctx.tb_ctx.nb_tbs : 0);
937 #endif
938 if ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)
939 > tcg_ctx.code_gen_buffer_size) {
940 cpu_abort(cpu, "Internal error: code buffer overflow\n");
943 CPU_FOREACH(cpu) {
944 int i;
946 for (i = 0; i < TB_JMP_CACHE_SIZE; ++i) {
947 atomic_set(&cpu->tb_jmp_cache[i], NULL);
951 tcg_ctx.tb_ctx.nb_tbs = 0;
952 qht_reset_size(&tcg_ctx.tb_ctx.htable, CODE_GEN_HTABLE_SIZE);
953 page_flush_tb();
955 tcg_ctx.code_gen_ptr = tcg_ctx.code_gen_buffer;
956 /* XXX: flush processor icache at this point if cache flush is
957 expensive */
958 atomic_mb_set(&tcg_ctx.tb_ctx.tb_flush_count,
959 tcg_ctx.tb_ctx.tb_flush_count + 1);
961 done:
962 tb_unlock();
965 void tb_flush(CPUState *cpu)
967 if (tcg_enabled()) {
968 unsigned tb_flush_count = atomic_mb_read(&tcg_ctx.tb_ctx.tb_flush_count);
969 async_safe_run_on_cpu(cpu, do_tb_flush,
970 RUN_ON_CPU_HOST_INT(tb_flush_count));
974 #ifdef DEBUG_TB_CHECK
976 static void
977 do_tb_invalidate_check(struct qht *ht, void *p, uint32_t hash, void *userp)
979 TranslationBlock *tb = p;
980 target_ulong addr = *(target_ulong *)userp;
982 if (!(addr + TARGET_PAGE_SIZE <= tb->pc || addr >= tb->pc + tb->size)) {
983 printf("ERROR invalidate: address=" TARGET_FMT_lx
984 " PC=%08lx size=%04x\n", addr, (long)tb->pc, tb->size);
988 /* verify that all the pages have correct rights for code
990 * Called with tb_lock held.
992 static void tb_invalidate_check(target_ulong address)
994 address &= TARGET_PAGE_MASK;
995 qht_iter(&tcg_ctx.tb_ctx.htable, do_tb_invalidate_check, &address);
998 static void
999 do_tb_page_check(struct qht *ht, void *p, uint32_t hash, void *userp)
1001 TranslationBlock *tb = p;
1002 int flags1, flags2;
1004 flags1 = page_get_flags(tb->pc);
1005 flags2 = page_get_flags(tb->pc + tb->size - 1);
1006 if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
1007 printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
1008 (long)tb->pc, tb->size, flags1, flags2);
1012 /* verify that all the pages have correct rights for code */
1013 static void tb_page_check(void)
1015 qht_iter(&tcg_ctx.tb_ctx.htable, do_tb_page_check, NULL);
1018 #endif
1020 static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
1022 TranslationBlock *tb1;
1023 unsigned int n1;
1025 for (;;) {
1026 tb1 = *ptb;
1027 n1 = (uintptr_t)tb1 & 3;
1028 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
1029 if (tb1 == tb) {
1030 *ptb = tb1->page_next[n1];
1031 break;
1033 ptb = &tb1->page_next[n1];
1037 /* remove the TB from a list of TBs jumping to the n-th jump target of the TB */
1038 static inline void tb_remove_from_jmp_list(TranslationBlock *tb, int n)
1040 TranslationBlock *tb1;
1041 uintptr_t *ptb, ntb;
1042 unsigned int n1;
1044 ptb = &tb->jmp_list_next[n];
1045 if (*ptb) {
1046 /* find tb(n) in circular list */
1047 for (;;) {
1048 ntb = *ptb;
1049 n1 = ntb & 3;
1050 tb1 = (TranslationBlock *)(ntb & ~3);
1051 if (n1 == n && tb1 == tb) {
1052 break;
1054 if (n1 == 2) {
1055 ptb = &tb1->jmp_list_first;
1056 } else {
1057 ptb = &tb1->jmp_list_next[n1];
1060 /* now we can suppress tb(n) from the list */
1061 *ptb = tb->jmp_list_next[n];
1063 tb->jmp_list_next[n] = (uintptr_t)NULL;
1067 /* reset the jump entry 'n' of a TB so that it is not chained to
1068 another TB */
1069 static inline void tb_reset_jump(TranslationBlock *tb, int n)
1071 uintptr_t addr = (uintptr_t)(tb->tc_ptr + tb->jmp_reset_offset[n]);
1072 tb_set_jmp_target(tb, n, addr);
1075 /* remove any jumps to the TB */
1076 static inline void tb_jmp_unlink(TranslationBlock *tb)
1078 TranslationBlock *tb1;
1079 uintptr_t *ptb, ntb;
1080 unsigned int n1;
1082 ptb = &tb->jmp_list_first;
1083 for (;;) {
1084 ntb = *ptb;
1085 n1 = ntb & 3;
1086 tb1 = (TranslationBlock *)(ntb & ~3);
1087 if (n1 == 2) {
1088 break;
1090 tb_reset_jump(tb1, n1);
1091 *ptb = tb1->jmp_list_next[n1];
1092 tb1->jmp_list_next[n1] = (uintptr_t)NULL;
1096 /* invalidate one TB
1098 * Called with tb_lock held.
1100 void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
1102 CPUState *cpu;
1103 PageDesc *p;
1104 uint32_t h;
1105 tb_page_addr_t phys_pc;
1107 assert_tb_lock();
1109 atomic_set(&tb->invalid, true);
1111 /* remove the TB from the hash list */
1112 phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1113 h = tb_hash_func(phys_pc, tb->pc, tb->flags);
1114 qht_remove(&tcg_ctx.tb_ctx.htable, tb, h);
1116 /* remove the TB from the page list */
1117 if (tb->page_addr[0] != page_addr) {
1118 p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
1119 tb_page_remove(&p->first_tb, tb);
1120 invalidate_page_bitmap(p);
1122 if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
1123 p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
1124 tb_page_remove(&p->first_tb, tb);
1125 invalidate_page_bitmap(p);
1128 /* remove the TB from the hash list */
1129 h = tb_jmp_cache_hash_func(tb->pc);
1130 CPU_FOREACH(cpu) {
1131 if (atomic_read(&cpu->tb_jmp_cache[h]) == tb) {
1132 atomic_set(&cpu->tb_jmp_cache[h], NULL);
1136 /* suppress this TB from the two jump lists */
1137 tb_remove_from_jmp_list(tb, 0);
1138 tb_remove_from_jmp_list(tb, 1);
1140 /* suppress any remaining jumps to this TB */
1141 tb_jmp_unlink(tb);
1143 tcg_ctx.tb_ctx.tb_phys_invalidate_count++;
1146 #ifdef CONFIG_SOFTMMU
1147 static void build_page_bitmap(PageDesc *p)
1149 int n, tb_start, tb_end;
1150 TranslationBlock *tb;
1152 p->code_bitmap = bitmap_new(TARGET_PAGE_SIZE);
1154 tb = p->first_tb;
1155 while (tb != NULL) {
1156 n = (uintptr_t)tb & 3;
1157 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1158 /* NOTE: this is subtle as a TB may span two physical pages */
1159 if (n == 0) {
1160 /* NOTE: tb_end may be after the end of the page, but
1161 it is not a problem */
1162 tb_start = tb->pc & ~TARGET_PAGE_MASK;
1163 tb_end = tb_start + tb->size;
1164 if (tb_end > TARGET_PAGE_SIZE) {
1165 tb_end = TARGET_PAGE_SIZE;
1167 } else {
1168 tb_start = 0;
1169 tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1171 bitmap_set(p->code_bitmap, tb_start, tb_end - tb_start);
1172 tb = tb->page_next[n];
1175 #endif
1177 /* add the tb in the target page and protect it if necessary
1179 * Called with mmap_lock held for user-mode emulation.
1181 static inline void tb_alloc_page(TranslationBlock *tb,
1182 unsigned int n, tb_page_addr_t page_addr)
1184 PageDesc *p;
1185 #ifndef CONFIG_USER_ONLY
1186 bool page_already_protected;
1187 #endif
1189 assert_memory_lock();
1191 tb->page_addr[n] = page_addr;
1192 p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
1193 tb->page_next[n] = p->first_tb;
1194 #ifndef CONFIG_USER_ONLY
1195 page_already_protected = p->first_tb != NULL;
1196 #endif
1197 p->first_tb = (TranslationBlock *)((uintptr_t)tb | n);
1198 invalidate_page_bitmap(p);
1200 #if defined(CONFIG_USER_ONLY)
1201 if (p->flags & PAGE_WRITE) {
1202 target_ulong addr;
1203 PageDesc *p2;
1204 int prot;
1206 /* force the host page as non writable (writes will have a
1207 page fault + mprotect overhead) */
1208 page_addr &= qemu_host_page_mask;
1209 prot = 0;
1210 for (addr = page_addr; addr < page_addr + qemu_host_page_size;
1211 addr += TARGET_PAGE_SIZE) {
1213 p2 = page_find(addr >> TARGET_PAGE_BITS);
1214 if (!p2) {
1215 continue;
1217 prot |= p2->flags;
1218 p2->flags &= ~PAGE_WRITE;
1220 mprotect(g2h(page_addr), qemu_host_page_size,
1221 (prot & PAGE_BITS) & ~PAGE_WRITE);
1222 #ifdef DEBUG_TB_INVALIDATE
1223 printf("protecting code page: 0x" TARGET_FMT_lx "\n",
1224 page_addr);
1225 #endif
1227 #else
1228 /* if some code is already present, then the pages are already
1229 protected. So we handle the case where only the first TB is
1230 allocated in a physical page */
1231 if (!page_already_protected) {
1232 tlb_protect_code(page_addr);
1234 #endif
1237 /* add a new TB and link it to the physical page tables. phys_page2 is
1238 * (-1) to indicate that only one page contains the TB.
1240 * Called with mmap_lock held for user-mode emulation.
1242 static void tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
1243 tb_page_addr_t phys_page2)
1245 uint32_t h;
1247 assert_memory_lock();
1249 /* add in the page list */
1250 tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
1251 if (phys_page2 != -1) {
1252 tb_alloc_page(tb, 1, phys_page2);
1253 } else {
1254 tb->page_addr[1] = -1;
1257 /* add in the hash table */
1258 h = tb_hash_func(phys_pc, tb->pc, tb->flags);
1259 qht_insert(&tcg_ctx.tb_ctx.htable, tb, h);
1261 #ifdef DEBUG_TB_CHECK
1262 tb_page_check();
1263 #endif
1266 /* Called with mmap_lock held for user mode emulation. */
1267 TranslationBlock *tb_gen_code(CPUState *cpu,
1268 target_ulong pc, target_ulong cs_base,
1269 uint32_t flags, int cflags)
1271 CPUArchState *env = cpu->env_ptr;
1272 TranslationBlock *tb;
1273 tb_page_addr_t phys_pc, phys_page2;
1274 target_ulong virt_page2;
1275 tcg_insn_unit *gen_code_buf;
1276 int gen_code_size, search_size;
1277 #ifdef CONFIG_PROFILER
1278 int64_t ti;
1279 #endif
1280 assert_memory_lock();
1282 phys_pc = get_page_addr_code(env, pc);
1283 if (use_icount && !(cflags & CF_IGNORE_ICOUNT)) {
1284 cflags |= CF_USE_ICOUNT;
1287 tb = tb_alloc(pc);
1288 if (unlikely(!tb)) {
1289 buffer_overflow:
1290 /* flush must be done */
1291 tb_flush(cpu);
1292 mmap_unlock();
1293 /* Make the execution loop process the flush as soon as possible. */
1294 cpu->exception_index = EXCP_INTERRUPT;
1295 cpu_loop_exit(cpu);
1298 gen_code_buf = tcg_ctx.code_gen_ptr;
1299 tb->tc_ptr = gen_code_buf;
1300 tb->cs_base = cs_base;
1301 tb->flags = flags;
1302 tb->cflags = cflags;
1304 #ifdef CONFIG_PROFILER
1305 tcg_ctx.tb_count1++; /* includes aborted translations because of
1306 exceptions */
1307 ti = profile_getclock();
1308 #endif
1310 tcg_func_start(&tcg_ctx);
1312 tcg_ctx.cpu = ENV_GET_CPU(env);
1313 gen_intermediate_code(env, tb);
1314 tcg_ctx.cpu = NULL;
1316 trace_translate_block(tb, tb->pc, tb->tc_ptr);
1318 /* generate machine code */
1319 tb->jmp_reset_offset[0] = TB_JMP_RESET_OFFSET_INVALID;
1320 tb->jmp_reset_offset[1] = TB_JMP_RESET_OFFSET_INVALID;
1321 tcg_ctx.tb_jmp_reset_offset = tb->jmp_reset_offset;
1322 #ifdef USE_DIRECT_JUMP
1323 tcg_ctx.tb_jmp_insn_offset = tb->jmp_insn_offset;
1324 tcg_ctx.tb_jmp_target_addr = NULL;
1325 #else
1326 tcg_ctx.tb_jmp_insn_offset = NULL;
1327 tcg_ctx.tb_jmp_target_addr = tb->jmp_target_addr;
1328 #endif
1330 #ifdef CONFIG_PROFILER
1331 tcg_ctx.tb_count++;
1332 tcg_ctx.interm_time += profile_getclock() - ti;
1333 tcg_ctx.code_time -= profile_getclock();
1334 #endif
1336 /* ??? Overflow could be handled better here. In particular, we
1337 don't need to re-do gen_intermediate_code, nor should we re-do
1338 the tcg optimization currently hidden inside tcg_gen_code. All
1339 that should be required is to flush the TBs, allocate a new TB,
1340 re-initialize it per above, and re-do the actual code generation. */
1341 gen_code_size = tcg_gen_code(&tcg_ctx, tb);
1342 if (unlikely(gen_code_size < 0)) {
1343 goto buffer_overflow;
1345 search_size = encode_search(tb, (void *)gen_code_buf + gen_code_size);
1346 if (unlikely(search_size < 0)) {
1347 goto buffer_overflow;
1350 #ifdef CONFIG_PROFILER
1351 tcg_ctx.code_time += profile_getclock();
1352 tcg_ctx.code_in_len += tb->size;
1353 tcg_ctx.code_out_len += gen_code_size;
1354 tcg_ctx.search_out_len += search_size;
1355 #endif
1357 #ifdef DEBUG_DISAS
1358 if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM) &&
1359 qemu_log_in_addr_range(tb->pc)) {
1360 qemu_log_lock();
1361 qemu_log("OUT: [size=%d]\n", gen_code_size);
1362 log_disas(tb->tc_ptr, gen_code_size);
1363 qemu_log("\n");
1364 qemu_log_flush();
1365 qemu_log_unlock();
1367 #endif
1369 tcg_ctx.code_gen_ptr = (void *)
1370 ROUND_UP((uintptr_t)gen_code_buf + gen_code_size + search_size,
1371 CODE_GEN_ALIGN);
1373 /* init jump list */
1374 assert(((uintptr_t)tb & 3) == 0);
1375 tb->jmp_list_first = (uintptr_t)tb | 2;
1376 tb->jmp_list_next[0] = (uintptr_t)NULL;
1377 tb->jmp_list_next[1] = (uintptr_t)NULL;
1379 /* init original jump addresses wich has been set during tcg_gen_code() */
1380 if (tb->jmp_reset_offset[0] != TB_JMP_RESET_OFFSET_INVALID) {
1381 tb_reset_jump(tb, 0);
1383 if (tb->jmp_reset_offset[1] != TB_JMP_RESET_OFFSET_INVALID) {
1384 tb_reset_jump(tb, 1);
1387 /* check next page if needed */
1388 virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
1389 phys_page2 = -1;
1390 if ((pc & TARGET_PAGE_MASK) != virt_page2) {
1391 phys_page2 = get_page_addr_code(env, virt_page2);
1393 /* As long as consistency of the TB stuff is provided by tb_lock in user
1394 * mode and is implicit in single-threaded softmmu emulation, no explicit
1395 * memory barrier is required before tb_link_page() makes the TB visible
1396 * through the physical hash table and physical page list.
1398 tb_link_page(tb, phys_pc, phys_page2);
1399 return tb;
1403 * Invalidate all TBs which intersect with the target physical address range
1404 * [start;end[. NOTE: start and end may refer to *different* physical pages.
1405 * 'is_cpu_write_access' should be true if called from a real cpu write
1406 * access: the virtual CPU will exit the current TB if code is modified inside
1407 * this TB.
1409 * Called with mmap_lock held for user-mode emulation, grabs tb_lock
1410 * Called with tb_lock held for system-mode emulation
1412 static void tb_invalidate_phys_range_1(tb_page_addr_t start, tb_page_addr_t end)
1414 while (start < end) {
1415 tb_invalidate_phys_page_range(start, end, 0);
1416 start &= TARGET_PAGE_MASK;
1417 start += TARGET_PAGE_SIZE;
1421 #ifdef CONFIG_SOFTMMU
1422 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end)
1424 assert_tb_lock();
1425 tb_invalidate_phys_range_1(start, end);
1427 #else
1428 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end)
1430 assert_memory_lock();
1431 tb_lock();
1432 tb_invalidate_phys_range_1(start, end);
1433 tb_unlock();
1435 #endif
1437 * Invalidate all TBs which intersect with the target physical address range
1438 * [start;end[. NOTE: start and end must refer to the *same* physical page.
1439 * 'is_cpu_write_access' should be true if called from a real cpu write
1440 * access: the virtual CPU will exit the current TB if code is modified inside
1441 * this TB.
1443 * Called with tb_lock/mmap_lock held for user-mode emulation
1444 * Called with tb_lock held for system-mode emulation
1446 void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
1447 int is_cpu_write_access)
1449 TranslationBlock *tb, *tb_next;
1450 #if defined(TARGET_HAS_PRECISE_SMC)
1451 CPUState *cpu = current_cpu;
1452 CPUArchState *env = NULL;
1453 #endif
1454 tb_page_addr_t tb_start, tb_end;
1455 PageDesc *p;
1456 int n;
1457 #ifdef TARGET_HAS_PRECISE_SMC
1458 int current_tb_not_found = is_cpu_write_access;
1459 TranslationBlock *current_tb = NULL;
1460 int current_tb_modified = 0;
1461 target_ulong current_pc = 0;
1462 target_ulong current_cs_base = 0;
1463 uint32_t current_flags = 0;
1464 #endif /* TARGET_HAS_PRECISE_SMC */
1466 assert_memory_lock();
1467 assert_tb_lock();
1469 p = page_find(start >> TARGET_PAGE_BITS);
1470 if (!p) {
1471 return;
1473 #if defined(TARGET_HAS_PRECISE_SMC)
1474 if (cpu != NULL) {
1475 env = cpu->env_ptr;
1477 #endif
1479 /* we remove all the TBs in the range [start, end[ */
1480 /* XXX: see if in some cases it could be faster to invalidate all
1481 the code */
1482 tb = p->first_tb;
1483 while (tb != NULL) {
1484 n = (uintptr_t)tb & 3;
1485 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1486 tb_next = tb->page_next[n];
1487 /* NOTE: this is subtle as a TB may span two physical pages */
1488 if (n == 0) {
1489 /* NOTE: tb_end may be after the end of the page, but
1490 it is not a problem */
1491 tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1492 tb_end = tb_start + tb->size;
1493 } else {
1494 tb_start = tb->page_addr[1];
1495 tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1497 if (!(tb_end <= start || tb_start >= end)) {
1498 #ifdef TARGET_HAS_PRECISE_SMC
1499 if (current_tb_not_found) {
1500 current_tb_not_found = 0;
1501 current_tb = NULL;
1502 if (cpu->mem_io_pc) {
1503 /* now we have a real cpu fault */
1504 current_tb = tb_find_pc(cpu->mem_io_pc);
1507 if (current_tb == tb &&
1508 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1509 /* If we are modifying the current TB, we must stop
1510 its execution. We could be more precise by checking
1511 that the modification is after the current PC, but it
1512 would require a specialized function to partially
1513 restore the CPU state */
1515 current_tb_modified = 1;
1516 cpu_restore_state_from_tb(cpu, current_tb, cpu->mem_io_pc);
1517 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1518 &current_flags);
1520 #endif /* TARGET_HAS_PRECISE_SMC */
1521 tb_phys_invalidate(tb, -1);
1523 tb = tb_next;
1525 #if !defined(CONFIG_USER_ONLY)
1526 /* if no code remaining, no need to continue to use slow writes */
1527 if (!p->first_tb) {
1528 invalidate_page_bitmap(p);
1529 tlb_unprotect_code(start);
1531 #endif
1532 #ifdef TARGET_HAS_PRECISE_SMC
1533 if (current_tb_modified) {
1534 /* we generate a block containing just the instruction
1535 modifying the memory. It will ensure that it cannot modify
1536 itself */
1537 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1538 cpu_loop_exit_noexc(cpu);
1540 #endif
1543 #ifdef CONFIG_SOFTMMU
1544 /* len must be <= 8 and start must be a multiple of len.
1545 * Called via softmmu_template.h when code areas are written to with
1546 * tb_lock held.
1548 void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
1550 PageDesc *p;
1552 #if 0
1553 if (1) {
1554 qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
1555 cpu_single_env->mem_io_vaddr, len,
1556 cpu_single_env->eip,
1557 cpu_single_env->eip +
1558 (intptr_t)cpu_single_env->segs[R_CS].base);
1560 #endif
1561 assert_memory_lock();
1563 p = page_find(start >> TARGET_PAGE_BITS);
1564 if (!p) {
1565 return;
1567 if (!p->code_bitmap &&
1568 ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD) {
1569 /* build code bitmap. FIXME: writes should be protected by
1570 * tb_lock, reads by tb_lock or RCU.
1572 build_page_bitmap(p);
1574 if (p->code_bitmap) {
1575 unsigned int nr;
1576 unsigned long b;
1578 nr = start & ~TARGET_PAGE_MASK;
1579 b = p->code_bitmap[BIT_WORD(nr)] >> (nr & (BITS_PER_LONG - 1));
1580 if (b & ((1 << len) - 1)) {
1581 goto do_invalidate;
1583 } else {
1584 do_invalidate:
1585 tb_invalidate_phys_page_range(start, start + len, 1);
1588 #else
1589 /* Called with mmap_lock held. If pc is not 0 then it indicates the
1590 * host PC of the faulting store instruction that caused this invalidate.
1591 * Returns true if the caller needs to abort execution of the current
1592 * TB (because it was modified by this store and the guest CPU has
1593 * precise-SMC semantics).
1595 static bool tb_invalidate_phys_page(tb_page_addr_t addr, uintptr_t pc)
1597 TranslationBlock *tb;
1598 PageDesc *p;
1599 int n;
1600 #ifdef TARGET_HAS_PRECISE_SMC
1601 TranslationBlock *current_tb = NULL;
1602 CPUState *cpu = current_cpu;
1603 CPUArchState *env = NULL;
1604 int current_tb_modified = 0;
1605 target_ulong current_pc = 0;
1606 target_ulong current_cs_base = 0;
1607 uint32_t current_flags = 0;
1608 #endif
1610 assert_memory_lock();
1612 addr &= TARGET_PAGE_MASK;
1613 p = page_find(addr >> TARGET_PAGE_BITS);
1614 if (!p) {
1615 return false;
1618 tb_lock();
1619 tb = p->first_tb;
1620 #ifdef TARGET_HAS_PRECISE_SMC
1621 if (tb && pc != 0) {
1622 current_tb = tb_find_pc(pc);
1624 if (cpu != NULL) {
1625 env = cpu->env_ptr;
1627 #endif
1628 while (tb != NULL) {
1629 n = (uintptr_t)tb & 3;
1630 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1631 #ifdef TARGET_HAS_PRECISE_SMC
1632 if (current_tb == tb &&
1633 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1634 /* If we are modifying the current TB, we must stop
1635 its execution. We could be more precise by checking
1636 that the modification is after the current PC, but it
1637 would require a specialized function to partially
1638 restore the CPU state */
1640 current_tb_modified = 1;
1641 cpu_restore_state_from_tb(cpu, current_tb, pc);
1642 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1643 &current_flags);
1645 #endif /* TARGET_HAS_PRECISE_SMC */
1646 tb_phys_invalidate(tb, addr);
1647 tb = tb->page_next[n];
1649 p->first_tb = NULL;
1650 #ifdef TARGET_HAS_PRECISE_SMC
1651 if (current_tb_modified) {
1652 /* we generate a block containing just the instruction
1653 modifying the memory. It will ensure that it cannot modify
1654 itself */
1655 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1656 /* tb_lock will be reset after cpu_loop_exit_noexc longjmps
1657 * back into the cpu_exec loop. */
1658 return true;
1660 #endif
1661 tb_unlock();
1663 return false;
1665 #endif
1667 /* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
1668 tb[1].tc_ptr. Return NULL if not found */
1669 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr)
1671 int m_min, m_max, m;
1672 uintptr_t v;
1673 TranslationBlock *tb;
1675 if (tcg_ctx.tb_ctx.nb_tbs <= 0) {
1676 return NULL;
1678 if (tc_ptr < (uintptr_t)tcg_ctx.code_gen_buffer ||
1679 tc_ptr >= (uintptr_t)tcg_ctx.code_gen_ptr) {
1680 return NULL;
1682 /* binary search (cf Knuth) */
1683 m_min = 0;
1684 m_max = tcg_ctx.tb_ctx.nb_tbs - 1;
1685 while (m_min <= m_max) {
1686 m = (m_min + m_max) >> 1;
1687 tb = &tcg_ctx.tb_ctx.tbs[m];
1688 v = (uintptr_t)tb->tc_ptr;
1689 if (v == tc_ptr) {
1690 return tb;
1691 } else if (tc_ptr < v) {
1692 m_max = m - 1;
1693 } else {
1694 m_min = m + 1;
1697 return &tcg_ctx.tb_ctx.tbs[m_max];
1700 #if !defined(CONFIG_USER_ONLY)
1701 void tb_invalidate_phys_addr(AddressSpace *as, hwaddr addr)
1703 ram_addr_t ram_addr;
1704 MemoryRegion *mr;
1705 hwaddr l = 1;
1707 rcu_read_lock();
1708 mr = address_space_translate(as, addr, &addr, &l, false);
1709 if (!(memory_region_is_ram(mr)
1710 || memory_region_is_romd(mr))) {
1711 rcu_read_unlock();
1712 return;
1714 ram_addr = memory_region_get_ram_addr(mr) + addr;
1715 tb_lock();
1716 tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
1717 tb_unlock();
1718 rcu_read_unlock();
1720 #endif /* !defined(CONFIG_USER_ONLY) */
1722 /* Called with tb_lock held. */
1723 void tb_check_watchpoint(CPUState *cpu)
1725 TranslationBlock *tb;
1727 tb = tb_find_pc(cpu->mem_io_pc);
1728 if (tb) {
1729 /* We can use retranslation to find the PC. */
1730 cpu_restore_state_from_tb(cpu, tb, cpu->mem_io_pc);
1731 tb_phys_invalidate(tb, -1);
1732 } else {
1733 /* The exception probably happened in a helper. The CPU state should
1734 have been saved before calling it. Fetch the PC from there. */
1735 CPUArchState *env = cpu->env_ptr;
1736 target_ulong pc, cs_base;
1737 tb_page_addr_t addr;
1738 uint32_t flags;
1740 cpu_get_tb_cpu_state(env, &pc, &cs_base, &flags);
1741 addr = get_page_addr_code(env, pc);
1742 tb_invalidate_phys_range(addr, addr + 1);
1746 #ifndef CONFIG_USER_ONLY
1747 /* in deterministic execution mode, instructions doing device I/Os
1748 must be at the end of the TB */
1749 void cpu_io_recompile(CPUState *cpu, uintptr_t retaddr)
1751 #if defined(TARGET_MIPS) || defined(TARGET_SH4)
1752 CPUArchState *env = cpu->env_ptr;
1753 #endif
1754 TranslationBlock *tb;
1755 uint32_t n, cflags;
1756 target_ulong pc, cs_base;
1757 uint32_t flags;
1759 tb_lock();
1760 tb = tb_find_pc(retaddr);
1761 if (!tb) {
1762 cpu_abort(cpu, "cpu_io_recompile: could not find TB for pc=%p",
1763 (void *)retaddr);
1765 n = cpu->icount_decr.u16.low + tb->icount;
1766 cpu_restore_state_from_tb(cpu, tb, retaddr);
1767 /* Calculate how many instructions had been executed before the fault
1768 occurred. */
1769 n = n - cpu->icount_decr.u16.low;
1770 /* Generate a new TB ending on the I/O insn. */
1771 n++;
1772 /* On MIPS and SH, delay slot instructions can only be restarted if
1773 they were already the first instruction in the TB. If this is not
1774 the first instruction in a TB then re-execute the preceding
1775 branch. */
1776 #if defined(TARGET_MIPS)
1777 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
1778 env->active_tc.PC -= (env->hflags & MIPS_HFLAG_B16 ? 2 : 4);
1779 cpu->icount_decr.u16.low++;
1780 env->hflags &= ~MIPS_HFLAG_BMASK;
1782 #elif defined(TARGET_SH4)
1783 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
1784 && n > 1) {
1785 env->pc -= 2;
1786 cpu->icount_decr.u16.low++;
1787 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
1789 #endif
1790 /* This should never happen. */
1791 if (n > CF_COUNT_MASK) {
1792 cpu_abort(cpu, "TB too big during recompile");
1795 cflags = n | CF_LAST_IO;
1796 pc = tb->pc;
1797 cs_base = tb->cs_base;
1798 flags = tb->flags;
1799 tb_phys_invalidate(tb, -1);
1800 if (tb->cflags & CF_NOCACHE) {
1801 if (tb->orig_tb) {
1802 /* Invalidate original TB if this TB was generated in
1803 * cpu_exec_nocache() */
1804 tb_phys_invalidate(tb->orig_tb, -1);
1806 tb_free(tb);
1808 /* FIXME: In theory this could raise an exception. In practice
1809 we have already translated the block once so it's probably ok. */
1810 tb_gen_code(cpu, pc, cs_base, flags, cflags);
1812 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
1813 * the first in the TB) then we end up generating a whole new TB and
1814 * repeating the fault, which is horribly inefficient.
1815 * Better would be to execute just this insn uncached, or generate a
1816 * second new TB.
1818 * cpu_loop_exit_noexc will longjmp back to cpu_exec where the
1819 * tb_lock gets reset.
1821 cpu_loop_exit_noexc(cpu);
1824 void tb_flush_jmp_cache(CPUState *cpu, target_ulong addr)
1826 unsigned int i;
1828 /* Discard jump cache entries for any tb which might potentially
1829 overlap the flushed page. */
1830 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1831 memset(&cpu->tb_jmp_cache[i], 0,
1832 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1834 i = tb_jmp_cache_hash_page(addr);
1835 memset(&cpu->tb_jmp_cache[i], 0,
1836 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1839 static void print_qht_statistics(FILE *f, fprintf_function cpu_fprintf,
1840 struct qht_stats hst)
1842 uint32_t hgram_opts;
1843 size_t hgram_bins;
1844 char *hgram;
1846 if (!hst.head_buckets) {
1847 return;
1849 cpu_fprintf(f, "TB hash buckets %zu/%zu (%0.2f%% head buckets used)\n",
1850 hst.used_head_buckets, hst.head_buckets,
1851 (double)hst.used_head_buckets / hst.head_buckets * 100);
1853 hgram_opts = QDIST_PR_BORDER | QDIST_PR_LABELS;
1854 hgram_opts |= QDIST_PR_100X | QDIST_PR_PERCENT;
1855 if (qdist_xmax(&hst.occupancy) - qdist_xmin(&hst.occupancy) == 1) {
1856 hgram_opts |= QDIST_PR_NODECIMAL;
1858 hgram = qdist_pr(&hst.occupancy, 10, hgram_opts);
1859 cpu_fprintf(f, "TB hash occupancy %0.2f%% avg chain occ. Histogram: %s\n",
1860 qdist_avg(&hst.occupancy) * 100, hgram);
1861 g_free(hgram);
1863 hgram_opts = QDIST_PR_BORDER | QDIST_PR_LABELS;
1864 hgram_bins = qdist_xmax(&hst.chain) - qdist_xmin(&hst.chain);
1865 if (hgram_bins > 10) {
1866 hgram_bins = 10;
1867 } else {
1868 hgram_bins = 0;
1869 hgram_opts |= QDIST_PR_NODECIMAL | QDIST_PR_NOBINRANGE;
1871 hgram = qdist_pr(&hst.chain, hgram_bins, hgram_opts);
1872 cpu_fprintf(f, "TB hash avg chain %0.3f buckets. Histogram: %s\n",
1873 qdist_avg(&hst.chain), hgram);
1874 g_free(hgram);
1877 void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
1879 int i, target_code_size, max_target_code_size;
1880 int direct_jmp_count, direct_jmp2_count, cross_page;
1881 TranslationBlock *tb;
1882 struct qht_stats hst;
1884 tb_lock();
1886 target_code_size = 0;
1887 max_target_code_size = 0;
1888 cross_page = 0;
1889 direct_jmp_count = 0;
1890 direct_jmp2_count = 0;
1891 for (i = 0; i < tcg_ctx.tb_ctx.nb_tbs; i++) {
1892 tb = &tcg_ctx.tb_ctx.tbs[i];
1893 target_code_size += tb->size;
1894 if (tb->size > max_target_code_size) {
1895 max_target_code_size = tb->size;
1897 if (tb->page_addr[1] != -1) {
1898 cross_page++;
1900 if (tb->jmp_reset_offset[0] != TB_JMP_RESET_OFFSET_INVALID) {
1901 direct_jmp_count++;
1902 if (tb->jmp_reset_offset[1] != TB_JMP_RESET_OFFSET_INVALID) {
1903 direct_jmp2_count++;
1907 /* XXX: avoid using doubles ? */
1908 cpu_fprintf(f, "Translation buffer state:\n");
1909 cpu_fprintf(f, "gen code size %td/%zd\n",
1910 tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer,
1911 tcg_ctx.code_gen_highwater - tcg_ctx.code_gen_buffer);
1912 cpu_fprintf(f, "TB count %d/%d\n",
1913 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.code_gen_max_blocks);
1914 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
1915 tcg_ctx.tb_ctx.nb_tbs ? target_code_size /
1916 tcg_ctx.tb_ctx.nb_tbs : 0,
1917 max_target_code_size);
1918 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
1919 tcg_ctx.tb_ctx.nb_tbs ? (tcg_ctx.code_gen_ptr -
1920 tcg_ctx.code_gen_buffer) /
1921 tcg_ctx.tb_ctx.nb_tbs : 0,
1922 target_code_size ? (double) (tcg_ctx.code_gen_ptr -
1923 tcg_ctx.code_gen_buffer) /
1924 target_code_size : 0);
1925 cpu_fprintf(f, "cross page TB count %d (%d%%)\n", cross_page,
1926 tcg_ctx.tb_ctx.nb_tbs ? (cross_page * 100) /
1927 tcg_ctx.tb_ctx.nb_tbs : 0);
1928 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
1929 direct_jmp_count,
1930 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp_count * 100) /
1931 tcg_ctx.tb_ctx.nb_tbs : 0,
1932 direct_jmp2_count,
1933 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp2_count * 100) /
1934 tcg_ctx.tb_ctx.nb_tbs : 0);
1936 qht_statistics_init(&tcg_ctx.tb_ctx.htable, &hst);
1937 print_qht_statistics(f, cpu_fprintf, hst);
1938 qht_statistics_destroy(&hst);
1940 cpu_fprintf(f, "\nStatistics:\n");
1941 cpu_fprintf(f, "TB flush count %u\n",
1942 atomic_read(&tcg_ctx.tb_ctx.tb_flush_count));
1943 cpu_fprintf(f, "TB invalidate count %d\n",
1944 tcg_ctx.tb_ctx.tb_phys_invalidate_count);
1945 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
1946 tcg_dump_info(f, cpu_fprintf);
1948 tb_unlock();
1951 void dump_opcount_info(FILE *f, fprintf_function cpu_fprintf)
1953 tcg_dump_op_count(f, cpu_fprintf);
1956 #else /* CONFIG_USER_ONLY */
1958 void cpu_interrupt(CPUState *cpu, int mask)
1960 cpu->interrupt_request |= mask;
1961 cpu->tcg_exit_req = 1;
1965 * Walks guest process memory "regions" one by one
1966 * and calls callback function 'fn' for each region.
1968 struct walk_memory_regions_data {
1969 walk_memory_regions_fn fn;
1970 void *priv;
1971 target_ulong start;
1972 int prot;
1975 static int walk_memory_regions_end(struct walk_memory_regions_data *data,
1976 target_ulong end, int new_prot)
1978 if (data->start != -1u) {
1979 int rc = data->fn(data->priv, data->start, end, data->prot);
1980 if (rc != 0) {
1981 return rc;
1985 data->start = (new_prot ? end : -1u);
1986 data->prot = new_prot;
1988 return 0;
1991 static int walk_memory_regions_1(struct walk_memory_regions_data *data,
1992 target_ulong base, int level, void **lp)
1994 target_ulong pa;
1995 int i, rc;
1997 if (*lp == NULL) {
1998 return walk_memory_regions_end(data, base, 0);
2001 if (level == 0) {
2002 PageDesc *pd = *lp;
2004 for (i = 0; i < V_L2_SIZE; ++i) {
2005 int prot = pd[i].flags;
2007 pa = base | (i << TARGET_PAGE_BITS);
2008 if (prot != data->prot) {
2009 rc = walk_memory_regions_end(data, pa, prot);
2010 if (rc != 0) {
2011 return rc;
2015 } else {
2016 void **pp = *lp;
2018 for (i = 0; i < V_L2_SIZE; ++i) {
2019 pa = base | ((target_ulong)i <<
2020 (TARGET_PAGE_BITS + V_L2_BITS * level));
2021 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
2022 if (rc != 0) {
2023 return rc;
2028 return 0;
2031 int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
2033 struct walk_memory_regions_data data;
2034 uintptr_t i, l1_sz = v_l1_size;
2036 data.fn = fn;
2037 data.priv = priv;
2038 data.start = -1u;
2039 data.prot = 0;
2041 for (i = 0; i < l1_sz; i++) {
2042 target_ulong base = i << (v_l1_shift + TARGET_PAGE_BITS);
2043 int rc = walk_memory_regions_1(&data, base, v_l2_levels, l1_map + i);
2044 if (rc != 0) {
2045 return rc;
2049 return walk_memory_regions_end(&data, 0, 0);
2052 static int dump_region(void *priv, target_ulong start,
2053 target_ulong end, unsigned long prot)
2055 FILE *f = (FILE *)priv;
2057 (void) fprintf(f, TARGET_FMT_lx"-"TARGET_FMT_lx
2058 " "TARGET_FMT_lx" %c%c%c\n",
2059 start, end, end - start,
2060 ((prot & PAGE_READ) ? 'r' : '-'),
2061 ((prot & PAGE_WRITE) ? 'w' : '-'),
2062 ((prot & PAGE_EXEC) ? 'x' : '-'));
2064 return 0;
2067 /* dump memory mappings */
2068 void page_dump(FILE *f)
2070 const int length = sizeof(target_ulong) * 2;
2071 (void) fprintf(f, "%-*s %-*s %-*s %s\n",
2072 length, "start", length, "end", length, "size", "prot");
2073 walk_memory_regions(f, dump_region);
2076 int page_get_flags(target_ulong address)
2078 PageDesc *p;
2080 p = page_find(address >> TARGET_PAGE_BITS);
2081 if (!p) {
2082 return 0;
2084 return p->flags;
2087 /* Modify the flags of a page and invalidate the code if necessary.
2088 The flag PAGE_WRITE_ORG is positioned automatically depending
2089 on PAGE_WRITE. The mmap_lock should already be held. */
2090 void page_set_flags(target_ulong start, target_ulong end, int flags)
2092 target_ulong addr, len;
2094 /* This function should never be called with addresses outside the
2095 guest address space. If this assert fires, it probably indicates
2096 a missing call to h2g_valid. */
2097 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2098 assert(end < ((target_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2099 #endif
2100 assert(start < end);
2101 assert_memory_lock();
2103 start = start & TARGET_PAGE_MASK;
2104 end = TARGET_PAGE_ALIGN(end);
2106 if (flags & PAGE_WRITE) {
2107 flags |= PAGE_WRITE_ORG;
2110 for (addr = start, len = end - start;
2111 len != 0;
2112 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2113 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2115 /* If the write protection bit is set, then we invalidate
2116 the code inside. */
2117 if (!(p->flags & PAGE_WRITE) &&
2118 (flags & PAGE_WRITE) &&
2119 p->first_tb) {
2120 tb_invalidate_phys_page(addr, 0);
2122 p->flags = flags;
2126 int page_check_range(target_ulong start, target_ulong len, int flags)
2128 PageDesc *p;
2129 target_ulong end;
2130 target_ulong addr;
2132 /* This function should never be called with addresses outside the
2133 guest address space. If this assert fires, it probably indicates
2134 a missing call to h2g_valid. */
2135 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2136 assert(start < ((target_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2137 #endif
2139 if (len == 0) {
2140 return 0;
2142 if (start + len - 1 < start) {
2143 /* We've wrapped around. */
2144 return -1;
2147 /* must do before we loose bits in the next step */
2148 end = TARGET_PAGE_ALIGN(start + len);
2149 start = start & TARGET_PAGE_MASK;
2151 for (addr = start, len = end - start;
2152 len != 0;
2153 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2154 p = page_find(addr >> TARGET_PAGE_BITS);
2155 if (!p) {
2156 return -1;
2158 if (!(p->flags & PAGE_VALID)) {
2159 return -1;
2162 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ)) {
2163 return -1;
2165 if (flags & PAGE_WRITE) {
2166 if (!(p->flags & PAGE_WRITE_ORG)) {
2167 return -1;
2169 /* unprotect the page if it was put read-only because it
2170 contains translated code */
2171 if (!(p->flags & PAGE_WRITE)) {
2172 if (!page_unprotect(addr, 0)) {
2173 return -1;
2178 return 0;
2181 /* called from signal handler: invalidate the code and unprotect the
2182 * page. Return 0 if the fault was not handled, 1 if it was handled,
2183 * and 2 if it was handled but the caller must cause the TB to be
2184 * immediately exited. (We can only return 2 if the 'pc' argument is
2185 * non-zero.)
2187 int page_unprotect(target_ulong address, uintptr_t pc)
2189 unsigned int prot;
2190 bool current_tb_invalidated;
2191 PageDesc *p;
2192 target_ulong host_start, host_end, addr;
2194 /* Technically this isn't safe inside a signal handler. However we
2195 know this only ever happens in a synchronous SEGV handler, so in
2196 practice it seems to be ok. */
2197 mmap_lock();
2199 p = page_find(address >> TARGET_PAGE_BITS);
2200 if (!p) {
2201 mmap_unlock();
2202 return 0;
2205 /* if the page was really writable, then we change its
2206 protection back to writable */
2207 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
2208 host_start = address & qemu_host_page_mask;
2209 host_end = host_start + qemu_host_page_size;
2211 prot = 0;
2212 current_tb_invalidated = false;
2213 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
2214 p = page_find(addr >> TARGET_PAGE_BITS);
2215 p->flags |= PAGE_WRITE;
2216 prot |= p->flags;
2218 /* and since the content will be modified, we must invalidate
2219 the corresponding translated code. */
2220 current_tb_invalidated |= tb_invalidate_phys_page(addr, pc);
2221 #ifdef DEBUG_TB_CHECK
2222 tb_invalidate_check(addr);
2223 #endif
2225 mprotect((void *)g2h(host_start), qemu_host_page_size,
2226 prot & PAGE_BITS);
2228 mmap_unlock();
2229 /* If current TB was invalidated return to main loop */
2230 return current_tb_invalidated ? 2 : 1;
2232 mmap_unlock();
2233 return 0;
2235 #endif /* CONFIG_USER_ONLY */