make cpu_physical_memory_set_dirty_tracking equal to upstream
[qemu-kvm/amd-iommu.git] / exec.c
blob e8fe3c4daa7b77f472034b05a4cde25b3de443f8
1 /*
2 * virtual page mapping and translated block handling
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
19 #include "config.h"
20 #ifdef _WIN32
21 #include <windows.h>
22 #else
23 #include <sys/types.h>
24 #include <sys/mman.h>
25 #endif
26 #include <stdlib.h>
27 #include <stdio.h>
28 #include <stdarg.h>
29 #include <string.h>
30 #include <errno.h>
31 #include <unistd.h>
32 #include <inttypes.h>
34 #include "cpu.h"
35 #include "exec-all.h"
36 #include "qemu-common.h"
37 #include "cache-utils.h"
39 #if !defined(TARGET_IA64)
40 #include "tcg.h"
41 #endif
42 #include "qemu-kvm.h"
44 #include "hw/hw.h"
45 #include "osdep.h"
46 #include "kvm.h"
47 #if defined(CONFIG_USER_ONLY)
48 #include <qemu.h>
49 #include <signal.h>
50 #endif
52 //#define DEBUG_TB_INVALIDATE
53 //#define DEBUG_FLUSH
54 //#define DEBUG_TLB
55 //#define DEBUG_UNASSIGNED
57 /* make various TB consistency checks */
58 //#define DEBUG_TB_CHECK
59 //#define DEBUG_TLB_CHECK
61 //#define DEBUG_IOPORT
62 //#define DEBUG_SUBPAGE
64 #if !defined(CONFIG_USER_ONLY)
65 /* TB consistency checks only implemented for usermode emulation. */
66 #undef DEBUG_TB_CHECK
67 #endif
69 #define SMC_BITMAP_USE_THRESHOLD 10
71 static TranslationBlock *tbs;
72 int code_gen_max_blocks;
73 TranslationBlock *tb_phys_hash[CODE_GEN_PHYS_HASH_SIZE];
74 static int nb_tbs;
75 /* any access to the tbs or the page table must use this lock */
76 spinlock_t tb_lock = SPIN_LOCK_UNLOCKED;
78 #if defined(__arm__) || defined(__sparc_v9__)
79 /* The prologue must be reachable with a direct jump. ARM and Sparc64
80 have limited branch ranges (possibly also PPC) so place it in a
81 section close to code segment. */
82 #define code_gen_section \
83 __attribute__((__section__(".gen_code"))) \
84 __attribute__((aligned (32)))
85 #elif defined(_WIN32)
86 /* Maximum alignment for Win32 is 16. */
87 #define code_gen_section \
88 __attribute__((aligned (16)))
89 #else
90 #define code_gen_section \
91 __attribute__((aligned (32)))
92 #endif
94 uint8_t code_gen_prologue[1024] code_gen_section;
95 static uint8_t *code_gen_buffer;
96 static unsigned long code_gen_buffer_size;
97 /* threshold to flush the translated code buffer */
98 static unsigned long code_gen_buffer_max_size;
99 uint8_t *code_gen_ptr;
101 #if !defined(CONFIG_USER_ONLY)
102 int phys_ram_fd;
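/* Dirty-page tracking state: phys_ram_dirty holds one byte of dirty flags
   per target page, indexed by ram_addr >> TARGET_PAGE_BITS (see
   tlb_unprotect_code_phys() and cpu_physical_memory_reset_dirty() below). */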
103 uint8_t *phys_ram_dirty;
104 uint8_t *bios_mem;
105 static int in_migration;
107 typedef struct RAMBlock {
108 uint8_t *host;
109 ram_addr_t offset;
110 ram_addr_t length;
111 struct RAMBlock *next;
112 } RAMBlock;
114 static RAMBlock *ram_blocks;
115 /* TODO: When we implement (and use) ram deallocation (e.g. for hotplug)
116 then we can no longer assume contiguous ram offsets, and external uses
117 of this variable will break. */
118 ram_addr_t last_ram_offset;
119 #endif
121 CPUState *first_cpu;
122 /* current CPU in the current thread. It is only valid inside
123 cpu_exec() */
124 CPUState *cpu_single_env;
125 /* 0 = Do not count executed instructions.
126 1 = Precise instruction counting.
127 2 = Adaptive rate instruction counting. */
128 int use_icount = 0;
129 /* Current instruction counter. While executing translated code this may
130 include some instructions that have not yet been executed. */
131 int64_t qemu_icount;
133 typedef struct PageDesc {
134 /* list of TBs intersecting this ram page */
135 TranslationBlock *first_tb;
136 /* in order to optimize self modifying code, we count the number
137 of lookups we do to a given page to use a bitmap */
138 unsigned int code_write_count;
139 uint8_t *code_bitmap;
140 #if defined(CONFIG_USER_ONLY)
141 unsigned long flags;
142 #endif
143 } PageDesc;
145 /* In system mode we want L1_MAP to be based on ram offsets,
146 while in user mode we want it to be based on virtual addresses. */
147 #if !defined(CONFIG_USER_ONLY)
148 #if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
149 # define L1_MAP_ADDR_SPACE_BITS HOST_LONG_BITS
150 #else
151 # define L1_MAP_ADDR_SPACE_BITS TARGET_PHYS_ADDR_SPACE_BITS
152 #endif
153 #else
154 # define L1_MAP_ADDR_SPACE_BITS TARGET_VIRT_ADDR_SPACE_BITS
155 #endif
157 /* Size of the L2 (and L3, etc) page tables. */
158 #define L2_BITS 10
159 #define L2_SIZE (1 << L2_BITS)
161 /* The bits remaining after N lower levels of page tables. */
162 #define P_L1_BITS_REM \
163 ((TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)
164 #define V_L1_BITS_REM \
165 ((L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)
167 /* Size of the L1 page table. Avoid silly small sizes. */
168 #if P_L1_BITS_REM < 4
169 #define P_L1_BITS (P_L1_BITS_REM + L2_BITS)
170 #else
171 #define P_L1_BITS P_L1_BITS_REM
172 #endif
174 #if V_L1_BITS_REM < 4
175 #define V_L1_BITS (V_L1_BITS_REM + L2_BITS)
176 #else
177 #define V_L1_BITS V_L1_BITS_REM
178 #endif
180 #define P_L1_SIZE ((target_phys_addr_t)1 << P_L1_BITS)
181 #define V_L1_SIZE ((target_ulong)1 << V_L1_BITS)
183 #define P_L1_SHIFT (TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS - P_L1_BITS)
184 #define V_L1_SHIFT (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - V_L1_BITS)
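/* Worked example of the sizing above (illustrative numbers): with
   TARGET_PHYS_ADDR_SPACE_BITS = 36, TARGET_PAGE_BITS = 12 and L2_BITS = 10,
   36 - 12 = 24 bits remain; P_L1_BITS_REM = 24 % 10 = 4, so P_L1_BITS = 4,
   P_L1_SIZE = 16 top-level entries, P_L1_SHIFT = 36 - 12 - 4 = 20, and the
   walk below the L1 table goes through P_L1_SHIFT / L2_BITS = 2 ten-bit
   levels. */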
186 unsigned long qemu_real_host_page_size;
187 unsigned long qemu_host_page_bits;
188 unsigned long qemu_host_page_size;
189 unsigned long qemu_host_page_mask;
191 /* This is a multi-level map on the virtual address space.
192 The bottom level has pointers to PageDesc. */
193 static void *l1_map[V_L1_SIZE];
195 #if !defined(CONFIG_USER_ONLY)
196 typedef struct PhysPageDesc {
197 /* offset in host memory of the page + io_index in the low bits */
198 ram_addr_t phys_offset;
199 ram_addr_t region_offset;
200 } PhysPageDesc;
202 /* This is a multi-level map on the physical address space.
203 The bottom level has pointers to PhysPageDesc. */
204 static void *l1_phys_map[P_L1_SIZE];
206 static void io_mem_init(void);
208 /* io memory support */
209 CPUWriteMemoryFunc *io_mem_write[IO_MEM_NB_ENTRIES][4];
210 CPUReadMemoryFunc *io_mem_read[IO_MEM_NB_ENTRIES][4];
211 void *io_mem_opaque[IO_MEM_NB_ENTRIES];
212 static char io_mem_used[IO_MEM_NB_ENTRIES];
213 static int io_mem_watch;
214 #endif
216 /* log support */
217 #ifdef WIN32
218 static const char *logfilename = "qemu.log";
219 #else
220 static const char *logfilename = "/tmp/qemu.log";
221 #endif
222 FILE *logfile;
223 int loglevel;
224 static int log_append = 0;
226 /* statistics */
227 #if !defined(CONFIG_USER_ONLY)
228 static int tlb_flush_count;
229 #endif
230 static int tb_flush_count;
231 static int tb_phys_invalidate_count;
233 #ifdef _WIN32
234 static void map_exec(void *addr, long size)
236 DWORD old_protect;
237 VirtualProtect(addr, size,
238 PAGE_EXECUTE_READWRITE, &old_protect);
241 #else
242 static void map_exec(void *addr, long size)
244 unsigned long start, end, page_size;
246 page_size = getpagesize();
247 start = (unsigned long)addr;
248 start &= ~(page_size - 1);
250 end = (unsigned long)addr + size;
251 end += page_size - 1;
252 end &= ~(page_size - 1);
254 mprotect((void *)start, end - start,
255 PROT_READ | PROT_WRITE | PROT_EXEC);
257 #endif
259 static void page_init(void)
261 /* NOTE: we can always suppose that qemu_host_page_size >=
262 TARGET_PAGE_SIZE */
263 #ifdef _WIN32
265 SYSTEM_INFO system_info;
267 GetSystemInfo(&system_info);
268 qemu_real_host_page_size = system_info.dwPageSize;
270 #else
271 qemu_real_host_page_size = getpagesize();
272 #endif
273 if (qemu_host_page_size == 0)
274 qemu_host_page_size = qemu_real_host_page_size;
275 if (qemu_host_page_size < TARGET_PAGE_SIZE)
276 qemu_host_page_size = TARGET_PAGE_SIZE;
277 qemu_host_page_bits = 0;
278 while ((1 << qemu_host_page_bits) < qemu_host_page_size)
279 qemu_host_page_bits++;
280 qemu_host_page_mask = ~(qemu_host_page_size - 1);
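/* e.g. a 4096-byte host page gives qemu_host_page_bits = 12 and
   qemu_host_page_mask = ~0xfffUL */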
282 #if !defined(_WIN32) && defined(CONFIG_USER_ONLY)
284 FILE *f;
286 last_brk = (unsigned long)sbrk(0);
288 f = fopen("/proc/self/maps", "r");
289 if (f) {
290 mmap_lock();
292 do {
293 unsigned long startaddr, endaddr;
294 int n;
296 n = fscanf (f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);
298 if (n == 2 && h2g_valid(startaddr)) {
299 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
301 if (h2g_valid(endaddr)) {
302 endaddr = h2g(endaddr);
303 } else {
304 endaddr = ~0ul;
306 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
308 } while (!feof(f));
310 fclose(f);
311 mmap_unlock();
314 #endif
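/* Look up the PageDesc for the given target page index by walking the
   multi-level l1_map.  If 'alloc' is non-zero, missing intermediate tables
   and the final PageDesc array are allocated on the way down; otherwise
   NULL is returned when the entry does not exist. */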
317 static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
319 PageDesc *pd;
320 void **lp;
321 int i;
323 #if defined(CONFIG_USER_ONLY)
324 /* We can't use qemu_malloc because it may recurse into a locked mutex.
325 Neither can we record the new pages we reserve while allocating a
326 given page because that may recurse into an unallocated page table
327 entry. Stuff the allocations we do make into a queue and process
328 them after having completed one entire page table allocation. */
330 unsigned long reserve[2 * (V_L1_SHIFT / L2_BITS)];
331 int reserve_idx = 0;
333 # define ALLOC(P, SIZE) \
334 do { \
335 P = mmap(NULL, SIZE, PROT_READ | PROT_WRITE, \
336 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); \
337 if (h2g_valid(P)) { \
338 reserve[reserve_idx] = h2g(P); \
339 reserve[reserve_idx + 1] = SIZE; \
340 reserve_idx += 2; \
342 } while (0)
343 #else
344 # define ALLOC(P, SIZE) \
345 do { P = qemu_mallocz(SIZE); } while (0)
346 #endif
348 /* Level 1. Always allocated. */
349 lp = l1_map + ((index >> V_L1_SHIFT) & (V_L1_SIZE - 1));
351 /* Level 2..N-1. */
352 for (i = V_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
353 void **p = *lp;
355 if (p == NULL) {
356 if (!alloc) {
357 return NULL;
359 ALLOC(p, sizeof(void *) * L2_SIZE);
360 *lp = p;
363 lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
366 pd = *lp;
367 if (pd == NULL) {
368 if (!alloc) {
369 return NULL;
371 ALLOC(pd, sizeof(PageDesc) * L2_SIZE);
372 *lp = pd;
375 #undef ALLOC
376 #if defined(CONFIG_USER_ONLY)
377 for (i = 0; i < reserve_idx; i += 2) {
378 unsigned long addr = reserve[i];
379 unsigned long len = reserve[i + 1];
381 page_set_flags(addr & TARGET_PAGE_MASK,
382 TARGET_PAGE_ALIGN(addr + len),
383 PAGE_RESERVED);
385 #endif
387 return pd + (index & (L2_SIZE - 1));
390 static inline PageDesc *page_find(tb_page_addr_t index)
392 return page_find_alloc(index, 0);
395 #if !defined(CONFIG_USER_ONLY)
396 static PhysPageDesc *phys_page_find_alloc(target_phys_addr_t index, int alloc)
398 PhysPageDesc *pd;
399 void **lp;
400 int i;
402 /* Level 1. Always allocated. */
403 lp = l1_phys_map + ((index >> P_L1_SHIFT) & (P_L1_SIZE - 1));
405 /* Level 2..N-1. */
406 for (i = P_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
407 void **p = *lp;
408 if (p == NULL) {
409 if (!alloc) {
410 return NULL;
412 *lp = p = qemu_mallocz(sizeof(void *) * L2_SIZE);
414 lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
417 pd = *lp;
418 if (pd == NULL) {
419 int i;
421 if (!alloc) {
422 return NULL;
425 *lp = pd = qemu_malloc(sizeof(PhysPageDesc) * L2_SIZE);
427 for (i = 0; i < L2_SIZE; i++) {
428 pd[i].phys_offset = IO_MEM_UNASSIGNED;
429 pd[i].region_offset = (index + i) << TARGET_PAGE_BITS;
433 return pd + (index & (L2_SIZE - 1));
436 static inline PhysPageDesc *phys_page_find(target_phys_addr_t index)
438 return phys_page_find_alloc(index, 0);
441 static void tlb_protect_code(ram_addr_t ram_addr);
442 static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
443 target_ulong vaddr);
444 #define mmap_lock() do { } while(0)
445 #define mmap_unlock() do { } while(0)
446 #endif
448 #define DEFAULT_CODE_GEN_BUFFER_SIZE (32 * 1024 * 1024)
450 #if defined(CONFIG_USER_ONLY)
451 /* Currently it is not recommended to allocate big chunks of data in
452 user mode. It will change when a dedicated libc is used */
453 #define USE_STATIC_CODE_GEN_BUFFER
454 #endif
456 #ifdef USE_STATIC_CODE_GEN_BUFFER
457 static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE];
458 #endif
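/* Allocate (or adopt the static) buffer that will hold translated host
   code, make it executable and size the TranslationBlock array from it.
   Note the qemu-kvm special case just below: with the in-kernel KVM
   accelerator (kvm_enabled()) no TCG buffer is needed, so the function
   returns immediately. */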
460 static void code_gen_alloc(unsigned long tb_size)
462 if (kvm_enabled())
463 return;
465 #ifdef USE_STATIC_CODE_GEN_BUFFER
466 code_gen_buffer = static_code_gen_buffer;
467 code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
468 map_exec(code_gen_buffer, code_gen_buffer_size);
469 #else
470 code_gen_buffer_size = tb_size;
471 if (code_gen_buffer_size == 0) {
472 #if defined(CONFIG_USER_ONLY)
473 /* in user mode, phys_ram_size is not meaningful */
474 code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
475 #else
476 /* XXX: needs adjustments */
477 code_gen_buffer_size = (unsigned long)(ram_size / 4);
478 #endif
480 if (code_gen_buffer_size < MIN_CODE_GEN_BUFFER_SIZE)
481 code_gen_buffer_size = MIN_CODE_GEN_BUFFER_SIZE;
482 /* The code gen buffer location may have constraints depending on
483 the host cpu and OS */
484 #if defined(__linux__)
486 int flags;
487 void *start = NULL;
489 flags = MAP_PRIVATE | MAP_ANONYMOUS;
490 #if defined(__x86_64__)
491 flags |= MAP_32BIT;
492 /* Cannot map more than that */
493 if (code_gen_buffer_size > (800 * 1024 * 1024))
494 code_gen_buffer_size = (800 * 1024 * 1024);
495 #elif defined(__sparc_v9__)
496 // Map the buffer below 2G, so we can use direct calls and branches
497 flags |= MAP_FIXED;
498 start = (void *) 0x60000000UL;
499 if (code_gen_buffer_size > (512 * 1024 * 1024))
500 code_gen_buffer_size = (512 * 1024 * 1024);
501 #elif defined(__arm__)
502 /* Map the buffer below 32M, so we can use direct calls and branches */
503 flags |= MAP_FIXED;
504 start = (void *) 0x01000000UL;
505 if (code_gen_buffer_size > 16 * 1024 * 1024)
506 code_gen_buffer_size = 16 * 1024 * 1024;
507 #endif
508 code_gen_buffer = mmap(start, code_gen_buffer_size,
509 PROT_WRITE | PROT_READ | PROT_EXEC,
510 flags, -1, 0);
511 if (code_gen_buffer == MAP_FAILED) {
512 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
513 exit(1);
516 #elif defined(__FreeBSD__) || defined(__FreeBSD_kernel__) || defined(__DragonFly__)
518 int flags;
519 void *addr = NULL;
520 flags = MAP_PRIVATE | MAP_ANONYMOUS;
521 #if defined(__x86_64__)
522 /* FreeBSD doesn't have MAP_32BIT, use MAP_FIXED and assume
523 * 0x40000000 is free */
524 flags |= MAP_FIXED;
525 addr = (void *)0x40000000;
526 /* Cannot map more than that */
527 if (code_gen_buffer_size > (800 * 1024 * 1024))
528 code_gen_buffer_size = (800 * 1024 * 1024);
529 #endif
530 code_gen_buffer = mmap(addr, code_gen_buffer_size,
531 PROT_WRITE | PROT_READ | PROT_EXEC,
532 flags, -1, 0);
533 if (code_gen_buffer == MAP_FAILED) {
534 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
535 exit(1);
538 #else
539 code_gen_buffer = qemu_malloc(code_gen_buffer_size);
540 map_exec(code_gen_buffer, code_gen_buffer_size);
541 #endif
542 #endif /* !USE_STATIC_CODE_GEN_BUFFER */
543 map_exec(code_gen_prologue, sizeof(code_gen_prologue));
544 code_gen_buffer_max_size = code_gen_buffer_size -
545 code_gen_max_block_size();
546 code_gen_max_blocks = code_gen_buffer_size / CODE_GEN_AVG_BLOCK_SIZE;
547 tbs = qemu_malloc(code_gen_max_blocks * sizeof(TranslationBlock));
550 /* Must be called before using the QEMU cpus. 'tb_size' is the size
551 (in bytes) allocated to the translation buffer. Zero means default
552 size. */
553 void cpu_exec_init_all(unsigned long tb_size)
555 cpu_gen_init();
556 code_gen_alloc(tb_size);
557 code_gen_ptr = code_gen_buffer;
558 page_init();
559 #if !defined(CONFIG_USER_ONLY)
560 io_mem_init();
561 #endif
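/* A minimal start-up sketch (hypothetical caller, not taken from this
   file): cpu_exec_init_all() must run exactly once before any CPU is
   created; the "qemu64" model string below is only an example. */
#if 0
static void example_startup(void)
{
    CPUState *env;

    cpu_exec_init_all(0);            /* 0 selects the default buffer size */
    env = cpu_init("qemu64");        /* target-specific CPU model name */
    if (!env) {
        fprintf(stderr, "unable to find CPU definition\n");
        exit(1);
    }
}
#endif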
564 #if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)
566 static int cpu_common_post_load(void *opaque, int version_id)
568 CPUState *env = opaque;
570 /* 0x01 was CPU_INTERRUPT_EXIT. This line can be removed when the
571 version_id is increased. */
572 env->interrupt_request &= ~0x01;
573 tlb_flush(env, 1);
575 return 0;
578 static const VMStateDescription vmstate_cpu_common = {
579 .name = "cpu_common",
580 .version_id = 1,
581 .minimum_version_id = 1,
582 .minimum_version_id_old = 1,
583 .post_load = cpu_common_post_load,
584 .fields = (VMStateField []) {
585 VMSTATE_UINT32(halted, CPUState),
586 VMSTATE_UINT32(interrupt_request, CPUState),
587 VMSTATE_END_OF_LIST()
590 #endif
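/* Return the CPUState whose cpu_index equals 'cpu', or NULL if no such CPU
   has been registered with cpu_exec_init(). */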
592 CPUState *qemu_get_cpu(int cpu)
594 CPUState *env = first_cpu;
596 while (env) {
597 if (env->cpu_index == cpu)
598 break;
599 env = env->next_cpu;
602 return env;
605 void cpu_exec_init(CPUState *env)
607 CPUState **penv;
608 int cpu_index;
610 #if defined(CONFIG_USER_ONLY)
611 cpu_list_lock();
612 #endif
613 env->next_cpu = NULL;
614 penv = &first_cpu;
615 cpu_index = 0;
616 while (*penv != NULL) {
617 penv = &(*penv)->next_cpu;
618 cpu_index++;
620 env->cpu_index = cpu_index;
621 env->numa_node = 0;
622 QTAILQ_INIT(&env->breakpoints);
623 QTAILQ_INIT(&env->watchpoints);
624 #ifdef _WIN32
625 env->thread_id = GetCurrentProcessId();
626 #else
627 env->thread_id = getpid();
628 #endif
629 *penv = env;
630 #if defined(CONFIG_USER_ONLY)
631 cpu_list_unlock();
632 #endif
633 #if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)
634 vmstate_register(cpu_index, &vmstate_cpu_common, env);
635 register_savevm("cpu", cpu_index, CPU_SAVE_VERSION,
636 cpu_save, cpu_load, env);
637 #endif
640 static inline void invalidate_page_bitmap(PageDesc *p)
642 if (p->code_bitmap) {
643 qemu_free(p->code_bitmap);
644 p->code_bitmap = NULL;
646 p->code_write_count = 0;
649 /* Set to NULL all the 'first_tb' fields in all PageDescs. */
651 static void page_flush_tb_1 (int level, void **lp)
653 int i;
655 if (*lp == NULL) {
656 return;
658 if (level == 0) {
659 PageDesc *pd = *lp;
660 for (i = 0; i < L2_SIZE; ++i) {
661 pd[i].first_tb = NULL;
662 invalidate_page_bitmap(pd + i);
664 } else {
665 void **pp = *lp;
666 for (i = 0; i < L2_SIZE; ++i) {
667 page_flush_tb_1 (level - 1, pp + i);
672 static void page_flush_tb(void)
674 int i;
675 for (i = 0; i < V_L1_SIZE; i++) {
676 page_flush_tb_1(V_L1_SHIFT / L2_BITS - 1, l1_map + i);
680 /* flush all the translation blocks */
681 /* XXX: tb_flush is currently not thread safe */
682 void tb_flush(CPUState *env1)
684 CPUState *env;
685 #if defined(DEBUG_FLUSH)
686 printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
687 (unsigned long)(code_gen_ptr - code_gen_buffer),
688 nb_tbs, nb_tbs > 0 ?
689 ((unsigned long)(code_gen_ptr - code_gen_buffer)) / nb_tbs : 0);
690 #endif
691 if ((unsigned long)(code_gen_ptr - code_gen_buffer) > code_gen_buffer_size)
692 cpu_abort(env1, "Internal error: code buffer overflow\n");
694 nb_tbs = 0;
696 for(env = first_cpu; env != NULL; env = env->next_cpu) {
697 memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
700 memset (tb_phys_hash, 0, CODE_GEN_PHYS_HASH_SIZE * sizeof (void *));
701 page_flush_tb();
703 code_gen_ptr = code_gen_buffer;
704 /* XXX: flush processor icache at this point if cache flush is
705 expensive */
706 tb_flush_count++;
709 #ifdef DEBUG_TB_CHECK
711 static void tb_invalidate_check(target_ulong address)
713 TranslationBlock *tb;
714 int i;
715 address &= TARGET_PAGE_MASK;
716 for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
717 for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
718 if (!(address + TARGET_PAGE_SIZE <= tb->pc ||
719 address >= tb->pc + tb->size)) {
720 printf("ERROR invalidate: address=" TARGET_FMT_lx
721 " PC=%08lx size=%04x\n",
722 address, (long)tb->pc, tb->size);
728 /* verify that all the pages have correct rights for code */
729 static void tb_page_check(void)
731 TranslationBlock *tb;
732 int i, flags1, flags2;
734 for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
735 for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
736 flags1 = page_get_flags(tb->pc);
737 flags2 = page_get_flags(tb->pc + tb->size - 1);
738 if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
739 printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
740 (long)tb->pc, tb->size, flags1, flags2);
746 #endif
748 /* invalidate one TB */
749 static inline void tb_remove(TranslationBlock **ptb, TranslationBlock *tb,
750 int next_offset)
752 TranslationBlock *tb1;
753 for(;;) {
754 tb1 = *ptb;
755 if (tb1 == tb) {
756 *ptb = *(TranslationBlock **)((char *)tb1 + next_offset);
757 break;
759 ptb = (TranslationBlock **)((char *)tb1 + next_offset);
763 static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
765 TranslationBlock *tb1;
766 unsigned int n1;
768 for(;;) {
769 tb1 = *ptb;
770 n1 = (long)tb1 & 3;
771 tb1 = (TranslationBlock *)((long)tb1 & ~3);
772 if (tb1 == tb) {
773 *ptb = tb1->page_next[n1];
774 break;
776 ptb = &tb1->page_next[n1];
780 static inline void tb_jmp_remove(TranslationBlock *tb, int n)
782 TranslationBlock *tb1, **ptb;
783 unsigned int n1;
785 ptb = &tb->jmp_next[n];
786 tb1 = *ptb;
787 if (tb1) {
788 /* find tb(n) in circular list */
789 for(;;) {
790 tb1 = *ptb;
791 n1 = (long)tb1 & 3;
792 tb1 = (TranslationBlock *)((long)tb1 & ~3);
793 if (n1 == n && tb1 == tb)
794 break;
795 if (n1 == 2) {
796 ptb = &tb1->jmp_first;
797 } else {
798 ptb = &tb1->jmp_next[n1];
801 /* now we can suppress tb(n) from the list */
802 *ptb = tb->jmp_next[n];
804 tb->jmp_next[n] = NULL;
808 /* reset the jump entry 'n' of a TB so that it is not chained to
809 another TB */
810 static inline void tb_reset_jump(TranslationBlock *tb, int n)
812 tb_set_jmp_target(tb, n, (unsigned long)(tb->tc_ptr + tb->tb_next_offset[n]));
815 void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
817 CPUState *env;
818 PageDesc *p;
819 unsigned int h, n1;
820 tb_page_addr_t phys_pc;
821 TranslationBlock *tb1, *tb2;
823 /* remove the TB from the hash list */
824 phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
825 h = tb_phys_hash_func(phys_pc);
826 tb_remove(&tb_phys_hash[h], tb,
827 offsetof(TranslationBlock, phys_hash_next));
829 /* remove the TB from the page list */
830 if (tb->page_addr[0] != page_addr) {
831 p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
832 tb_page_remove(&p->first_tb, tb);
833 invalidate_page_bitmap(p);
835 if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
836 p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
837 tb_page_remove(&p->first_tb, tb);
838 invalidate_page_bitmap(p);
841 tb_invalidated_flag = 1;
843 /* remove the TB from the hash list */
844 h = tb_jmp_cache_hash_func(tb->pc);
845 for(env = first_cpu; env != NULL; env = env->next_cpu) {
846 if (env->tb_jmp_cache[h] == tb)
847 env->tb_jmp_cache[h] = NULL;
850 /* suppress this TB from the two jump lists */
851 tb_jmp_remove(tb, 0);
852 tb_jmp_remove(tb, 1);
854 /* suppress any remaining jumps to this TB */
855 tb1 = tb->jmp_first;
856 for(;;) {
857 n1 = (long)tb1 & 3;
858 if (n1 == 2)
859 break;
860 tb1 = (TranslationBlock *)((long)tb1 & ~3);
861 tb2 = tb1->jmp_next[n1];
862 tb_reset_jump(tb1, n1);
863 tb1->jmp_next[n1] = NULL;
864 tb1 = tb2;
866 tb->jmp_first = (TranslationBlock *)((long)tb | 2); /* fail safe */
868 tb_phys_invalidate_count++;
871 static inline void set_bits(uint8_t *tab, int start, int len)
873 int end, mask, end1;
875 end = start + len;
876 tab += start >> 3;
877 mask = 0xff << (start & 7);
878 if ((start & ~7) == (end & ~7)) {
879 if (start < end) {
880 mask &= ~(0xff << (end & 7));
881 *tab |= mask;
883 } else {
884 *tab++ |= mask;
885 start = (start + 8) & ~7;
886 end1 = end & ~7;
887 while (start < end1) {
888 *tab++ = 0xff;
889 start += 8;
891 if (start < end) {
892 mask = ~(0xff << (end & 7));
893 *tab |= mask;
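/* Illustrative example: set_bits(bitmap, 16, 32) sets bits 16..47, i.e.
   bitmap[2] through bitmap[5] become 0xff.  build_page_bitmap() below uses
   this with one bit per guest code byte of the page. */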
898 static void build_page_bitmap(PageDesc *p)
900 int n, tb_start, tb_end;
901 TranslationBlock *tb;
903 p->code_bitmap = qemu_mallocz(TARGET_PAGE_SIZE / 8);
905 tb = p->first_tb;
906 while (tb != NULL) {
907 n = (long)tb & 3;
908 tb = (TranslationBlock *)((long)tb & ~3);
909 /* NOTE: this is subtle as a TB may span two physical pages */
910 if (n == 0) {
911 /* NOTE: tb_end may be after the end of the page, but
912 it is not a problem */
913 tb_start = tb->pc & ~TARGET_PAGE_MASK;
914 tb_end = tb_start + tb->size;
915 if (tb_end > TARGET_PAGE_SIZE)
916 tb_end = TARGET_PAGE_SIZE;
917 } else {
918 tb_start = 0;
919 tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
921 set_bits(p->code_bitmap, tb_start, tb_end - tb_start);
922 tb = tb->page_next[n];
926 TranslationBlock *tb_gen_code(CPUState *env,
927 target_ulong pc, target_ulong cs_base,
928 int flags, int cflags)
930 TranslationBlock *tb;
931 uint8_t *tc_ptr;
932 tb_page_addr_t phys_pc, phys_page2;
933 target_ulong virt_page2;
934 int code_gen_size;
936 phys_pc = get_page_addr_code(env, pc);
937 tb = tb_alloc(pc);
938 if (!tb) {
939 /* flush must be done */
940 tb_flush(env);
941 /* cannot fail at this point */
942 tb = tb_alloc(pc);
943 /* Don't forget to invalidate previous TB info. */
944 tb_invalidated_flag = 1;
946 tc_ptr = code_gen_ptr;
947 tb->tc_ptr = tc_ptr;
948 tb->cs_base = cs_base;
949 tb->flags = flags;
950 tb->cflags = cflags;
951 cpu_gen_code(env, tb, &code_gen_size);
952 code_gen_ptr = (void *)(((unsigned long)code_gen_ptr + code_gen_size + CODE_GEN_ALIGN - 1) & ~(CODE_GEN_ALIGN - 1));
954 /* check next page if needed */
955 virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
956 phys_page2 = -1;
957 if ((pc & TARGET_PAGE_MASK) != virt_page2) {
958 phys_page2 = get_page_addr_code(env, virt_page2);
960 tb_link_page(tb, phys_pc, phys_page2);
961 return tb;
964 /* invalidate all TBs which intersect with the target physical page
965 starting in range [start;end[. NOTE: start and end must refer to
966 the same physical page. 'is_cpu_write_access' should be true if called
967 from a real cpu write access: the virtual CPU will exit the current
968 TB if code is modified inside this TB. */
969 void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
970 int is_cpu_write_access)
972 TranslationBlock *tb, *tb_next, *saved_tb;
973 CPUState *env = cpu_single_env;
974 tb_page_addr_t tb_start, tb_end;
975 PageDesc *p;
976 int n;
977 #ifdef TARGET_HAS_PRECISE_SMC
978 int current_tb_not_found = is_cpu_write_access;
979 TranslationBlock *current_tb = NULL;
980 int current_tb_modified = 0;
981 target_ulong current_pc = 0;
982 target_ulong current_cs_base = 0;
983 int current_flags = 0;
984 #endif /* TARGET_HAS_PRECISE_SMC */
986 p = page_find(start >> TARGET_PAGE_BITS);
987 if (!p)
988 return;
989 if (!p->code_bitmap &&
990 ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD &&
991 is_cpu_write_access) {
992 /* build code bitmap */
993 build_page_bitmap(p);
996 /* we remove all the TBs in the range [start, end[ */
997 /* XXX: see if in some cases it could be faster to invalidate all the code */
998 tb = p->first_tb;
999 while (tb != NULL) {
1000 n = (long)tb & 3;
1001 tb = (TranslationBlock *)((long)tb & ~3);
1002 tb_next = tb->page_next[n];
1003 /* NOTE: this is subtle as a TB may span two physical pages */
1004 if (n == 0) {
1005 /* NOTE: tb_end may be after the end of the page, but
1006 it is not a problem */
1007 tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1008 tb_end = tb_start + tb->size;
1009 } else {
1010 tb_start = tb->page_addr[1];
1011 tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1013 if (!(tb_end <= start || tb_start >= end)) {
1014 #ifdef TARGET_HAS_PRECISE_SMC
1015 if (current_tb_not_found) {
1016 current_tb_not_found = 0;
1017 current_tb = NULL;
1018 if (env->mem_io_pc) {
1019 /* now we have a real cpu fault */
1020 current_tb = tb_find_pc(env->mem_io_pc);
1023 if (current_tb == tb &&
1024 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1025 /* If we are modifying the current TB, we must stop
1026 its execution. We could be more precise by checking
1027 that the modification is after the current PC, but it
1028 would require a specialized function to partially
1029 restore the CPU state */
1031 current_tb_modified = 1;
1032 cpu_restore_state(current_tb, env,
1033 env->mem_io_pc, NULL);
1034 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1035 &current_flags);
1037 #endif /* TARGET_HAS_PRECISE_SMC */
1038 /* we need to do that to handle the case where a signal
1039 occurs while doing tb_phys_invalidate() */
1040 saved_tb = NULL;
1041 if (env) {
1042 saved_tb = env->current_tb;
1043 env->current_tb = NULL;
1045 tb_phys_invalidate(tb, -1);
1046 if (env) {
1047 env->current_tb = saved_tb;
1048 if (env->interrupt_request && env->current_tb)
1049 cpu_interrupt(env, env->interrupt_request);
1052 tb = tb_next;
1054 #if !defined(CONFIG_USER_ONLY)
1055 /* if no code remaining, no need to continue to use slow writes */
1056 if (!p->first_tb) {
1057 invalidate_page_bitmap(p);
1058 if (is_cpu_write_access) {
1059 tlb_unprotect_code_phys(env, start, env->mem_io_vaddr);
1062 #endif
1063 #ifdef TARGET_HAS_PRECISE_SMC
1064 if (current_tb_modified) {
1065 /* we generate a block containing just the instruction
1066 modifying the memory. It will ensure that it cannot modify
1067 itself */
1068 env->current_tb = NULL;
1069 tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
1070 cpu_resume_from_signal(env, NULL);
1072 #endif
1075 /* len must be <= 8 and start must be a multiple of len */
1076 static inline void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
1078 PageDesc *p;
1079 int offset, b;
1080 #if 0
1081 if (1) {
1082 qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
1083 cpu_single_env->mem_io_vaddr, len,
1084 cpu_single_env->eip,
1085 cpu_single_env->eip + (long)cpu_single_env->segs[R_CS].base);
1087 #endif
1088 p = page_find(start >> TARGET_PAGE_BITS);
1089 if (!p)
1090 return;
1091 if (p->code_bitmap) {
1092 offset = start & ~TARGET_PAGE_MASK;
1093 b = p->code_bitmap[offset >> 3] >> (offset & 7);
1094 if (b & ((1 << len) - 1))
1095 goto do_invalidate;
1096 } else {
1097 do_invalidate:
1098 tb_invalidate_phys_page_range(start, start + len, 1);
1102 #if !defined(CONFIG_SOFTMMU)
1103 static void tb_invalidate_phys_page(tb_page_addr_t addr,
1104 unsigned long pc, void *puc)
1106 TranslationBlock *tb;
1107 PageDesc *p;
1108 int n;
1109 #ifdef TARGET_HAS_PRECISE_SMC
1110 TranslationBlock *current_tb = NULL;
1111 CPUState *env = cpu_single_env;
1112 int current_tb_modified = 0;
1113 target_ulong current_pc = 0;
1114 target_ulong current_cs_base = 0;
1115 int current_flags = 0;
1116 #endif
1118 addr &= TARGET_PAGE_MASK;
1119 p = page_find(addr >> TARGET_PAGE_BITS);
1120 if (!p)
1121 return;
1122 tb = p->first_tb;
1123 #ifdef TARGET_HAS_PRECISE_SMC
1124 if (tb && pc != 0) {
1125 current_tb = tb_find_pc(pc);
1127 #endif
1128 while (tb != NULL) {
1129 n = (long)tb & 3;
1130 tb = (TranslationBlock *)((long)tb & ~3);
1131 #ifdef TARGET_HAS_PRECISE_SMC
1132 if (current_tb == tb &&
1133 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1134 /* If we are modifying the current TB, we must stop
1135 its execution. We could be more precise by checking
1136 that the modification is after the current PC, but it
1137 would require a specialized function to partially
1138 restore the CPU state */
1140 current_tb_modified = 1;
1141 cpu_restore_state(current_tb, env, pc, puc);
1142 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1143 &current_flags);
1145 #endif /* TARGET_HAS_PRECISE_SMC */
1146 tb_phys_invalidate(tb, addr);
1147 tb = tb->page_next[n];
1149 p->first_tb = NULL;
1150 #ifdef TARGET_HAS_PRECISE_SMC
1151 if (current_tb_modified) {
1152 /* we generate a block containing just the instruction
1153 modifying the memory. It will ensure that it cannot modify
1154 itself */
1155 env->current_tb = NULL;
1156 tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
1157 cpu_resume_from_signal(env, puc);
1159 #endif
1161 #endif
1163 /* add the tb in the target page and protect it if necessary */
1164 static inline void tb_alloc_page(TranslationBlock *tb,
1165 unsigned int n, tb_page_addr_t page_addr)
1167 PageDesc *p;
1168 TranslationBlock *last_first_tb;
1170 tb->page_addr[n] = page_addr;
1171 p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
1172 tb->page_next[n] = p->first_tb;
1173 last_first_tb = p->first_tb;
1174 p->first_tb = (TranslationBlock *)((long)tb | n);
1175 invalidate_page_bitmap(p);
1177 #if defined(TARGET_HAS_SMC) || 1
1179 #if defined(CONFIG_USER_ONLY)
1180 if (p->flags & PAGE_WRITE) {
1181 target_ulong addr;
1182 PageDesc *p2;
1183 int prot;
1185 /* force the host page as non writable (writes will have a
1186 page fault + mprotect overhead) */
1187 page_addr &= qemu_host_page_mask;
1188 prot = 0;
1189 for(addr = page_addr; addr < page_addr + qemu_host_page_size;
1190 addr += TARGET_PAGE_SIZE) {
1192 p2 = page_find (addr >> TARGET_PAGE_BITS);
1193 if (!p2)
1194 continue;
1195 prot |= p2->flags;
1196 p2->flags &= ~PAGE_WRITE;
1197 page_get_flags(addr);
1199 mprotect(g2h(page_addr), qemu_host_page_size,
1200 (prot & PAGE_BITS) & ~PAGE_WRITE);
1201 #ifdef DEBUG_TB_INVALIDATE
1202 printf("protecting code page: 0x" TARGET_FMT_lx "\n",
1203 page_addr);
1204 #endif
1206 #else
1207 /* if some code is already present, then the pages are already
1208 protected. So we handle the case where only the first TB is
1209 allocated in a physical page */
1210 if (!last_first_tb) {
1211 tlb_protect_code(page_addr);
1213 #endif
1215 #endif /* TARGET_HAS_SMC */
1218 /* Allocate a new translation block. Flush the translation buffer if
1219 too many translation blocks or too much generated code. */
1220 TranslationBlock *tb_alloc(target_ulong pc)
1222 TranslationBlock *tb;
1224 if (nb_tbs >= code_gen_max_blocks ||
1225 (code_gen_ptr - code_gen_buffer) >= code_gen_buffer_max_size)
1226 return NULL;
1227 tb = &tbs[nb_tbs++];
1228 tb->pc = pc;
1229 tb->cflags = 0;
1230 return tb;
1233 void tb_free(TranslationBlock *tb)
1235 /* In practice this is mostly used for single-use temporary TBs.
1236 Ignore the hard cases and just back up if this TB happens to
1237 be the last one generated. */
1238 if (nb_tbs > 0 && tb == &tbs[nb_tbs - 1]) {
1239 code_gen_ptr = tb->tc_ptr;
1240 nb_tbs--;
1244 /* add a new TB and link it to the physical page tables. phys_page2 is
1245 (-1) to indicate that only one page contains the TB. */
1246 void tb_link_page(TranslationBlock *tb,
1247 tb_page_addr_t phys_pc, tb_page_addr_t phys_page2)
1249 unsigned int h;
1250 TranslationBlock **ptb;
1252 /* Grab the mmap lock to stop another thread invalidating this TB
1253 before we are done. */
1254 mmap_lock();
1255 /* add in the physical hash table */
1256 h = tb_phys_hash_func(phys_pc);
1257 ptb = &tb_phys_hash[h];
1258 tb->phys_hash_next = *ptb;
1259 *ptb = tb;
1261 /* add in the page list */
1262 tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
1263 if (phys_page2 != -1)
1264 tb_alloc_page(tb, 1, phys_page2);
1265 else
1266 tb->page_addr[1] = -1;
1268 tb->jmp_first = (TranslationBlock *)((long)tb | 2);
1269 tb->jmp_next[0] = NULL;
1270 tb->jmp_next[1] = NULL;
1272 /* init original jump addresses */
1273 if (tb->tb_next_offset[0] != 0xffff)
1274 tb_reset_jump(tb, 0);
1275 if (tb->tb_next_offset[1] != 0xffff)
1276 tb_reset_jump(tb, 1);
1278 #ifdef DEBUG_TB_CHECK
1279 tb_page_check();
1280 #endif
1281 mmap_unlock();
1284 /* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
1285 tb[1].tc_ptr. Return NULL if not found */
1286 TranslationBlock *tb_find_pc(unsigned long tc_ptr)
1288 int m_min, m_max, m;
1289 unsigned long v;
1290 TranslationBlock *tb;
1292 if (nb_tbs <= 0)
1293 return NULL;
1294 if (tc_ptr < (unsigned long)code_gen_buffer ||
1295 tc_ptr >= (unsigned long)code_gen_ptr)
1296 return NULL;
1297 /* binary search (cf Knuth) */
1298 m_min = 0;
1299 m_max = nb_tbs - 1;
1300 while (m_min <= m_max) {
1301 m = (m_min + m_max) >> 1;
1302 tb = &tbs[m];
1303 v = (unsigned long)tb->tc_ptr;
1304 if (v == tc_ptr)
1305 return tb;
1306 else if (tc_ptr < v) {
1307 m_max = m - 1;
1308 } else {
1309 m_min = m + 1;
1312 return &tbs[m_max];
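/* The binary search above relies on tbs[] being filled in strictly
   increasing tc_ptr order: tb_alloc() hands out entries sequentially and
   code_gen_ptr only grows until the next tb_flush(). */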
1315 static void tb_reset_jump_recursive(TranslationBlock *tb);
1317 static inline void tb_reset_jump_recursive2(TranslationBlock *tb, int n)
1319 TranslationBlock *tb1, *tb_next, **ptb;
1320 unsigned int n1;
1322 tb1 = tb->jmp_next[n];
1323 if (tb1 != NULL) {
1324 /* find head of list */
1325 for(;;) {
1326 n1 = (long)tb1 & 3;
1327 tb1 = (TranslationBlock *)((long)tb1 & ~3);
1328 if (n1 == 2)
1329 break;
1330 tb1 = tb1->jmp_next[n1];
1332 /* we are now sure that tb jumps to tb1 */
1333 tb_next = tb1;
1335 /* remove tb from the jmp_first list */
1336 ptb = &tb_next->jmp_first;
1337 for(;;) {
1338 tb1 = *ptb;
1339 n1 = (long)tb1 & 3;
1340 tb1 = (TranslationBlock *)((long)tb1 & ~3);
1341 if (n1 == n && tb1 == tb)
1342 break;
1343 ptb = &tb1->jmp_next[n1];
1345 *ptb = tb->jmp_next[n];
1346 tb->jmp_next[n] = NULL;
1348 /* suppress the jump to next tb in generated code */
1349 tb_reset_jump(tb, n);
1351 /* suppress jumps in the tb on which we could have jumped */
1352 tb_reset_jump_recursive(tb_next);
1356 static void tb_reset_jump_recursive(TranslationBlock *tb)
1358 tb_reset_jump_recursive2(tb, 0);
1359 tb_reset_jump_recursive2(tb, 1);
1362 #if defined(TARGET_HAS_ICE)
1363 #if defined(CONFIG_USER_ONLY)
1364 static void breakpoint_invalidate(CPUState *env, target_ulong pc)
1366 tb_invalidate_phys_page_range(pc, pc + 1, 0);
1368 #else
1369 static void breakpoint_invalidate(CPUState *env, target_ulong pc)
1371 target_phys_addr_t addr;
1372 target_ulong pd;
1373 ram_addr_t ram_addr;
1374 PhysPageDesc *p;
1376 addr = cpu_get_phys_page_debug(env, pc);
1377 p = phys_page_find(addr >> TARGET_PAGE_BITS);
1378 if (!p) {
1379 pd = IO_MEM_UNASSIGNED;
1380 } else {
1381 pd = p->phys_offset;
1383 ram_addr = (pd & TARGET_PAGE_MASK) | (pc & ~TARGET_PAGE_MASK);
1384 tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
1386 #endif
1387 #endif /* TARGET_HAS_ICE */
1389 #if defined(CONFIG_USER_ONLY)
1390 void cpu_watchpoint_remove_all(CPUState *env, int mask)
1395 int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
1396 int flags, CPUWatchpoint **watchpoint)
1398 return -ENOSYS;
1400 #else
1401 /* Add a watchpoint. */
1402 int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
1403 int flags, CPUWatchpoint **watchpoint)
1405 target_ulong len_mask = ~(len - 1);
1406 CPUWatchpoint *wp;
1408 /* sanity checks: allow power-of-2 lengths, deny unaligned watchpoints */
1409 if ((len != 1 && len != 2 && len != 4 && len != 8) || (addr & ~len_mask)) {
1410 fprintf(stderr, "qemu: tried to set invalid watchpoint at "
1411 TARGET_FMT_lx ", len=" TARGET_FMT_lu "\n", addr, len);
1412 return -EINVAL;
1414 wp = qemu_malloc(sizeof(*wp));
1416 wp->vaddr = addr;
1417 wp->len_mask = len_mask;
1418 wp->flags = flags;
1420 /* keep all GDB-injected watchpoints in front */
1421 if (flags & BP_GDB)
1422 QTAILQ_INSERT_HEAD(&env->watchpoints, wp, entry);
1423 else
1424 QTAILQ_INSERT_TAIL(&env->watchpoints, wp, entry);
1426 tlb_flush_page(env, addr);
1428 if (watchpoint)
1429 *watchpoint = wp;
1430 return 0;
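/* A minimal usage sketch (hypothetical caller, not taken from this file):
   a debug front end could request a 4-byte write watchpoint as shown
   below; BP_MEM_WRITE and BP_GDB are the watchpoint flag bits defined with
   the CPU state. */
#if 0
static int example_set_write_watchpoint(CPUState *env, target_ulong addr)
{
    CPUWatchpoint *wp;

    /* len must be a power of two (1, 2, 4 or 8) and addr aligned to it,
       otherwise cpu_watchpoint_insert() returns -EINVAL (see above). */
    return cpu_watchpoint_insert(env, addr, 4, BP_MEM_WRITE | BP_GDB, &wp);
}
#endif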
1433 /* Remove a specific watchpoint. */
1434 int cpu_watchpoint_remove(CPUState *env, target_ulong addr, target_ulong len,
1435 int flags)
1437 target_ulong len_mask = ~(len - 1);
1438 CPUWatchpoint *wp;
1440 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
1441 if (addr == wp->vaddr && len_mask == wp->len_mask
1442 && flags == (wp->flags & ~BP_WATCHPOINT_HIT)) {
1443 cpu_watchpoint_remove_by_ref(env, wp);
1444 return 0;
1447 return -ENOENT;
1450 /* Remove a specific watchpoint by reference. */
1451 void cpu_watchpoint_remove_by_ref(CPUState *env, CPUWatchpoint *watchpoint)
1453 QTAILQ_REMOVE(&env->watchpoints, watchpoint, entry);
1455 tlb_flush_page(env, watchpoint->vaddr);
1457 qemu_free(watchpoint);
1460 /* Remove all matching watchpoints. */
1461 void cpu_watchpoint_remove_all(CPUState *env, int mask)
1463 CPUWatchpoint *wp, *next;
1465 QTAILQ_FOREACH_SAFE(wp, &env->watchpoints, entry, next) {
1466 if (wp->flags & mask)
1467 cpu_watchpoint_remove_by_ref(env, wp);
1470 #endif
1472 /* Add a breakpoint. */
1473 int cpu_breakpoint_insert(CPUState *env, target_ulong pc, int flags,
1474 CPUBreakpoint **breakpoint)
1476 #if defined(TARGET_HAS_ICE)
1477 CPUBreakpoint *bp;
1479 bp = qemu_malloc(sizeof(*bp));
1481 bp->pc = pc;
1482 bp->flags = flags;
1484 /* keep all GDB-injected breakpoints in front */
1485 if (flags & BP_GDB)
1486 QTAILQ_INSERT_HEAD(&env->breakpoints, bp, entry);
1487 else
1488 QTAILQ_INSERT_TAIL(&env->breakpoints, bp, entry);
1490 breakpoint_invalidate(env, pc);
1492 if (breakpoint)
1493 *breakpoint = bp;
1494 return 0;
1495 #else
1496 return -ENOSYS;
1497 #endif
1500 /* Remove a specific breakpoint. */
1501 int cpu_breakpoint_remove(CPUState *env, target_ulong pc, int flags)
1503 #if defined(TARGET_HAS_ICE)
1504 CPUBreakpoint *bp;
1506 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
1507 if (bp->pc == pc && bp->flags == flags) {
1508 cpu_breakpoint_remove_by_ref(env, bp);
1509 return 0;
1512 return -ENOENT;
1513 #else
1514 return -ENOSYS;
1515 #endif
1518 /* Remove a specific breakpoint by reference. */
1519 void cpu_breakpoint_remove_by_ref(CPUState *env, CPUBreakpoint *breakpoint)
1521 #if defined(TARGET_HAS_ICE)
1522 QTAILQ_REMOVE(&env->breakpoints, breakpoint, entry);
1524 breakpoint_invalidate(env, breakpoint->pc);
1526 qemu_free(breakpoint);
1527 #endif
1530 /* Remove all matching breakpoints. */
1531 void cpu_breakpoint_remove_all(CPUState *env, int mask)
1533 #if defined(TARGET_HAS_ICE)
1534 CPUBreakpoint *bp, *next;
1536 QTAILQ_FOREACH_SAFE(bp, &env->breakpoints, entry, next) {
1537 if (bp->flags & mask)
1538 cpu_breakpoint_remove_by_ref(env, bp);
1540 #endif
1543 /* enable or disable single step mode. EXCP_DEBUG is returned by the
1544 CPU loop after each instruction */
1545 void cpu_single_step(CPUState *env, int enabled)
1547 #if defined(TARGET_HAS_ICE)
1548 if (env->singlestep_enabled != enabled) {
1549 env->singlestep_enabled = enabled;
1550 if (kvm_enabled())
1551 kvm_update_guest_debug(env, 0);
1552 else {
1553 /* must flush all the translated code to avoid inconsistencies */
1554 /* XXX: only flush what is necessary */
1555 tb_flush(env);
1558 #endif
1561 /* enable or disable low levels log */
1562 void cpu_set_log(int log_flags)
1564 loglevel = log_flags;
1565 if (loglevel && !logfile) {
1566 logfile = fopen(logfilename, log_append ? "a" : "w");
1567 if (!logfile) {
1568 perror(logfilename);
1569 _exit(1);
1571 #if !defined(CONFIG_SOFTMMU)
1572 /* must avoid mmap() usage of glibc by setting a buffer "by hand" */
1574 static char logfile_buf[4096];
1575 setvbuf(logfile, logfile_buf, _IOLBF, sizeof(logfile_buf));
1577 #elif !defined(_WIN32)
1578 /* Win32 doesn't support line-buffering and requires size >= 2 */
1579 setvbuf(logfile, NULL, _IOLBF, 0);
1580 #endif
1581 log_append = 1;
1583 if (!loglevel && logfile) {
1584 fclose(logfile);
1585 logfile = NULL;
1589 void cpu_set_log_filename(const char *filename)
1591 logfilename = strdup(filename);
1592 if (logfile) {
1593 fclose(logfile);
1594 logfile = NULL;
1596 cpu_set_log(loglevel);
1599 static void cpu_unlink_tb(CPUState *env)
1601 /* FIXME: TB unchaining isn't SMP safe. For now just ignore the
1602 problem and hope the cpu will stop of its own accord. For userspace
1603 emulation this often isn't actually as bad as it sounds. Often
1604 signals are used primarily to interrupt blocking syscalls. */
1605 TranslationBlock *tb;
1606 static spinlock_t interrupt_lock = SPIN_LOCK_UNLOCKED;
1608 spin_lock(&interrupt_lock);
1609 tb = env->current_tb;
1610 /* if the cpu is currently executing code, we must unlink it and
1611 all the potentially executing TB */
1612 if (tb) {
1613 env->current_tb = NULL;
1614 tb_reset_jump_recursive(tb);
1616 spin_unlock(&interrupt_lock);
1619 /* mask must never be zero, except for A20 change call */
1620 void cpu_interrupt(CPUState *env, int mask)
1622 int old_mask;
1624 old_mask = env->interrupt_request;
1625 env->interrupt_request |= mask;
1626 if (kvm_enabled() && !kvm_irqchip_in_kernel())
1627 kvm_update_interrupt_request(env);
1629 #ifndef CONFIG_USER_ONLY
1631 * If called from iothread context, wake the target cpu in
1632 * case it's halted.
1634 if (!qemu_cpu_self(env)) {
1635 qemu_cpu_kick(env);
1636 return;
1638 #endif
1640 if (use_icount) {
1641 env->icount_decr.u16.high = 0xffff;
1642 #ifndef CONFIG_USER_ONLY
1643 if (!can_do_io(env)
1644 && (mask & ~old_mask) != 0) {
1645 cpu_abort(env, "Raised interrupt while not in I/O function");
1647 #endif
1648 } else {
1649 cpu_unlink_tb(env);
1653 void cpu_reset_interrupt(CPUState *env, int mask)
1655 env->interrupt_request &= ~mask;
1658 void cpu_exit(CPUState *env)
1660 env->exit_request = 1;
1661 cpu_unlink_tb(env);
1664 const CPULogItem cpu_log_items[] = {
1665 { CPU_LOG_TB_OUT_ASM, "out_asm",
1666 "show generated host assembly code for each compiled TB" },
1667 { CPU_LOG_TB_IN_ASM, "in_asm",
1668 "show target assembly code for each compiled TB" },
1669 { CPU_LOG_TB_OP, "op",
1670 "show micro ops for each compiled TB" },
1671 { CPU_LOG_TB_OP_OPT, "op_opt",
1672 "show micro ops "
1673 #ifdef TARGET_I386
1674 "before eflags optimization and "
1675 #endif
1676 "after liveness analysis" },
1677 { CPU_LOG_INT, "int",
1678 "show interrupts/exceptions in short format" },
1679 { CPU_LOG_EXEC, "exec",
1680 "show trace before each executed TB (lots of logs)" },
1681 { CPU_LOG_TB_CPU, "cpu",
1682 "show CPU state before block translation" },
1683 #ifdef TARGET_I386
1684 { CPU_LOG_PCALL, "pcall",
1685 "show protected mode far calls/returns/exceptions" },
1686 { CPU_LOG_RESET, "cpu_reset",
1687 "show CPU state before CPU resets" },
1688 #endif
1689 #ifdef DEBUG_IOPORT
1690 { CPU_LOG_IOPORT, "ioport",
1691 "show all i/o ports accesses" },
1692 #endif
1693 { 0, NULL, NULL },
1696 #ifndef CONFIG_USER_ONLY
1697 static QLIST_HEAD(memory_client_list, CPUPhysMemoryClient) memory_client_list
1698 = QLIST_HEAD_INITIALIZER(memory_client_list);
1700 static void cpu_notify_set_memory(target_phys_addr_t start_addr,
1701 ram_addr_t size,
1702 ram_addr_t phys_offset)
1704 CPUPhysMemoryClient *client;
1705 QLIST_FOREACH(client, &memory_client_list, list) {
1706 client->set_memory(client, start_addr, size, phys_offset);
1710 static int cpu_notify_sync_dirty_bitmap(target_phys_addr_t start,
1711 target_phys_addr_t end)
1713 CPUPhysMemoryClient *client;
1714 QLIST_FOREACH(client, &memory_client_list, list) {
1715 int r = client->sync_dirty_bitmap(client, start, end);
1716 if (r < 0)
1717 return r;
1719 return 0;
1722 static int cpu_notify_migration_log(int enable)
1724 CPUPhysMemoryClient *client;
1725 QLIST_FOREACH(client, &memory_client_list, list) {
1726 int r = client->migration_log(client, enable);
1727 if (r < 0)
1728 return r;
1730 return 0;
1733 static void phys_page_for_each_1(CPUPhysMemoryClient *client,
1734 int level, void **lp)
1736 int i;
1738 if (*lp == NULL) {
1739 return;
1741 if (level == 0) {
1742 PhysPageDesc *pd = *lp;
1743 for (i = 0; i < L2_SIZE; ++i) {
1744 if (pd[i].phys_offset != IO_MEM_UNASSIGNED) {
1745 client->set_memory(client, pd[i].region_offset,
1746 TARGET_PAGE_SIZE, pd[i].phys_offset);
1749 } else {
1750 void **pp = *lp;
1751 for (i = 0; i < L2_SIZE; ++i) {
1752 phys_page_for_each_1(client, level - 1, pp + i);
1757 static void phys_page_for_each(CPUPhysMemoryClient *client)
1759 int i;
1760 for (i = 0; i < P_L1_SIZE; ++i) {
1761 phys_page_for_each_1(client, P_L1_SHIFT / L2_BITS - 1,
1762 l1_phys_map + i);
1766 void cpu_register_phys_memory_client(CPUPhysMemoryClient *client)
1768 QLIST_INSERT_HEAD(&memory_client_list, client, list);
1769 phys_page_for_each(client);
1772 void cpu_unregister_phys_memory_client(CPUPhysMemoryClient *client)
1774 QLIST_REMOVE(client, list);
1776 #endif
1778 static int cmp1(const char *s1, int n, const char *s2)
1780 if (strlen(s2) != n)
1781 return 0;
1782 return memcmp(s1, s2, n) == 0;
1785 /* takes a comma separated list of log masks. Return 0 if error. */
1786 int cpu_str_to_log_mask(const char *str)
1788 const CPULogItem *item;
1789 int mask;
1790 const char *p, *p1;
1792 p = str;
1793 mask = 0;
1794 for(;;) {
1795 p1 = strchr(p, ',');
1796 if (!p1)
1797 p1 = p + strlen(p);
1798 if(cmp1(p,p1-p,"all")) {
1799 for(item = cpu_log_items; item->mask != 0; item++) {
1800 mask |= item->mask;
1802 } else {
1803 for(item = cpu_log_items; item->mask != 0; item++) {
1804 if (cmp1(p, p1 - p, item->name))
1805 goto found;
1807 return 0;
1809 found:
1810 mask |= item->mask;
1811 if (*p1 != ',')
1812 break;
1813 p = p1 + 1;
1815 return mask;
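/* Illustrative use (hypothetical caller, not taken from this file):
   parsing a "-d" style option would look like

       int mask = cpu_str_to_log_mask("in_asm,cpu");
       if (mask == 0) {
           ... unknown item: list cpu_log_items[] and bail out ...
       }
       cpu_set_log(mask);

   "in_asm" and "cpu" are entries of cpu_log_items[] above; "all" selects
   every item. */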
1818 void cpu_abort(CPUState *env, const char *fmt, ...)
1820 va_list ap;
1821 va_list ap2;
1823 va_start(ap, fmt);
1824 va_copy(ap2, ap);
1825 fprintf(stderr, "qemu: fatal: ");
1826 vfprintf(stderr, fmt, ap);
1827 fprintf(stderr, "\n");
1828 #ifdef TARGET_I386
1829 cpu_dump_state(env, stderr, fprintf, X86_DUMP_FPU | X86_DUMP_CCOP);
1830 #else
1831 cpu_dump_state(env, stderr, fprintf, 0);
1832 #endif
1833 if (qemu_log_enabled()) {
1834 qemu_log("qemu: fatal: ");
1835 qemu_log_vprintf(fmt, ap2);
1836 qemu_log("\n");
1837 #ifdef TARGET_I386
1838 log_cpu_state(env, X86_DUMP_FPU | X86_DUMP_CCOP);
1839 #else
1840 log_cpu_state(env, 0);
1841 #endif
1842 qemu_log_flush();
1843 qemu_log_close();
1845 va_end(ap2);
1846 va_end(ap);
1847 #if defined(CONFIG_USER_ONLY)
1849 struct sigaction act;
1850 sigfillset(&act.sa_mask);
1851 act.sa_handler = SIG_DFL;
1852 sigaction(SIGABRT, &act, NULL);
1854 #endif
1855 abort();
1858 CPUState *cpu_copy(CPUState *env)
1860 CPUState *new_env = cpu_init(env->cpu_model_str);
1861 CPUState *next_cpu = new_env->next_cpu;
1862 int cpu_index = new_env->cpu_index;
1863 #if defined(TARGET_HAS_ICE)
1864 CPUBreakpoint *bp;
1865 CPUWatchpoint *wp;
1866 #endif
1868 memcpy(new_env, env, sizeof(CPUState));
1870 /* Preserve chaining and index. */
1871 new_env->next_cpu = next_cpu;
1872 new_env->cpu_index = cpu_index;
1874 /* Clone all break/watchpoints.
1875 Note: Once we support ptrace with hw-debug register access, make sure
1876 BP_CPU break/watchpoints are handled correctly on clone. */
1877 QTAILQ_INIT(&env->breakpoints);
1878 QTAILQ_INIT(&env->watchpoints);
1879 #if defined(TARGET_HAS_ICE)
1880 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
1881 cpu_breakpoint_insert(new_env, bp->pc, bp->flags, NULL);
1883 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
1884 cpu_watchpoint_insert(new_env, wp->vaddr, (~wp->len_mask) + 1,
1885 wp->flags, NULL);
1887 #endif
1889 return new_env;
1892 #if !defined(CONFIG_USER_ONLY)
1894 static inline void tlb_flush_jmp_cache(CPUState *env, target_ulong addr)
1896 unsigned int i;
1898 /* Discard jump cache entries for any tb which might potentially
1899 overlap the flushed page. */
1900 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1901 memset (&env->tb_jmp_cache[i], 0,
1902 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1904 i = tb_jmp_cache_hash_page(addr);
1905 memset (&env->tb_jmp_cache[i], 0,
1906 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1909 static CPUTLBEntry s_cputlb_empty_entry = {
1910 .addr_read = -1,
1911 .addr_write = -1,
1912 .addr_code = -1,
1913 .addend = -1,
1916 /* NOTE: if flush_global is true, also flush global entries (not
1917 implemented yet) */
1918 void tlb_flush(CPUState *env, int flush_global)
1920 int i;
1922 #if defined(DEBUG_TLB)
1923 printf("tlb_flush:\n");
1924 #endif
1925 /* must reset current TB so that interrupts cannot modify the
1926 links while we are modifying them */
1927 env->current_tb = NULL;
1929 for(i = 0; i < CPU_TLB_SIZE; i++) {
1930 int mmu_idx;
1931 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
1932 env->tlb_table[mmu_idx][i] = s_cputlb_empty_entry;
1936 memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
1938 tlb_flush_count++;
1941 static inline void tlb_flush_entry(CPUTLBEntry *tlb_entry, target_ulong addr)
1943 if (addr == (tlb_entry->addr_read &
1944 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
1945 addr == (tlb_entry->addr_write &
1946 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
1947 addr == (tlb_entry->addr_code &
1948 (TARGET_PAGE_MASK | TLB_INVALID_MASK))) {
1949 *tlb_entry = s_cputlb_empty_entry;
1953 void tlb_flush_page(CPUState *env, target_ulong addr)
1955 int i;
1956 int mmu_idx;
1958 #if defined(DEBUG_TLB)
1959 printf("tlb_flush_page: " TARGET_FMT_lx "\n", addr);
1960 #endif
1961 /* must reset current TB so that interrupts cannot modify the
1962 links while we are modifying them */
1963 env->current_tb = NULL;
1965 addr &= TARGET_PAGE_MASK;
1966 i = (addr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
1967 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
1968 tlb_flush_entry(&env->tlb_table[mmu_idx][i], addr);
1970 tlb_flush_jmp_cache(env, addr);
1973 /* update the TLBs so that writes to code in the virtual page 'addr'
1974 can be detected */
1975 static void tlb_protect_code(ram_addr_t ram_addr)
1977 cpu_physical_memory_reset_dirty(ram_addr,
1978 ram_addr + TARGET_PAGE_SIZE,
1979 CODE_DIRTY_FLAG);
1982 /* update the TLB so that writes in physical page 'phys_addr' are no longer
1983 tested for self modifying code */
1984 static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
1985 target_ulong vaddr)
1987 phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS] |= CODE_DIRTY_FLAG;
1990 static inline void tlb_reset_dirty_range(CPUTLBEntry *tlb_entry,
1991 unsigned long start, unsigned long length)
1993 unsigned long addr;
1994 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
1995 addr = (tlb_entry->addr_write & TARGET_PAGE_MASK) + tlb_entry->addend;
1996 if ((addr - start) < length) {
1997 tlb_entry->addr_write = (tlb_entry->addr_write & TARGET_PAGE_MASK) | TLB_NOTDIRTY;
2002 /* Note: start and end must be within the same ram block. */
2003 void cpu_physical_memory_reset_dirty(ram_addr_t start, ram_addr_t end,
2004 int dirty_flags)
2006 CPUState *env;
2007 unsigned long length, start1;
2008 int i, mask, len;
2009 uint8_t *p;
2011 start &= TARGET_PAGE_MASK;
2012 end = TARGET_PAGE_ALIGN(end);
2014 length = end - start;
2015 if (length == 0)
2016 return;
2017 len = length >> TARGET_PAGE_BITS;
2018 mask = ~dirty_flags;
2019 p = phys_ram_dirty + (start >> TARGET_PAGE_BITS);
2020 for(i = 0; i < len; i++)
2021 p[i] &= mask;
2023 /* we modify the TLB cache so that the dirty bit will be set again
2024 when accessing the range */
2025 start1 = (unsigned long)qemu_get_ram_ptr(start);
2026 /* Check that we don't span multiple blocks - this breaks the
2027 address comparisons below. */
2028 if ((unsigned long)qemu_get_ram_ptr(end - 1) - start1
2029 != (end - 1) - start) {
2030 abort();
2033 for(env = first_cpu; env != NULL; env = env->next_cpu) {
2034 int mmu_idx;
2035 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2036 for(i = 0; i < CPU_TLB_SIZE; i++)
2037 tlb_reset_dirty_range(&env->tlb_table[mmu_idx][i],
2038 start1, length);
2043 int cpu_physical_memory_set_dirty_tracking(int enable)
2045 int ret = 0;
2046 in_migration = enable;
2047 ret = cpu_notify_migration_log(!!enable);
2048 return ret;
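/* Illustrative use (hypothetical caller, not taken from this file): RAM
   live migration is the typical user of this switch.  It enables dirty
   logging before the first pass and disables it when migration completes:

       cpu_physical_memory_set_dirty_tracking(1);
       ... per iteration: cpu_physical_sync_dirty_bitmap(start, end),
           then resend pages whose dirty bits are set ...
       cpu_physical_memory_set_dirty_tracking(0);

   The return value propagates any error reported by the registered
   CPUPhysMemoryClient migration_log() callbacks (cpu_notify_migration_log()
   above). */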
2051 int cpu_physical_memory_get_dirty_tracking(void)
2053 return in_migration;
2056 int cpu_physical_sync_dirty_bitmap(target_phys_addr_t start_addr,
2057 target_phys_addr_t end_addr)
2059 int ret;
2061 ret = cpu_notify_sync_dirty_bitmap(start_addr, end_addr);
2062 return ret;
2065 static inline void tlb_update_dirty(CPUTLBEntry *tlb_entry)
2067 ram_addr_t ram_addr;
2068 void *p;
2070 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
2071 p = (void *)(unsigned long)((tlb_entry->addr_write & TARGET_PAGE_MASK)
2072 + tlb_entry->addend);
2073 ram_addr = qemu_ram_addr_from_host(p);
2074 if (!cpu_physical_memory_is_dirty(ram_addr)) {
2075 tlb_entry->addr_write |= TLB_NOTDIRTY;
2080 /* update the TLB according to the current state of the dirty bits */
2081 void cpu_tlb_update_dirty(CPUState *env)
2083 int i;
2084 int mmu_idx;
2085 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2086 for(i = 0; i < CPU_TLB_SIZE; i++)
2087 tlb_update_dirty(&env->tlb_table[mmu_idx][i]);
2091 static inline void tlb_set_dirty1(CPUTLBEntry *tlb_entry, target_ulong vaddr)
2093 if (tlb_entry->addr_write == (vaddr | TLB_NOTDIRTY))
2094 tlb_entry->addr_write = vaddr;
2097 /* update the TLB corresponding to virtual page vaddr
2098 so that it is no longer dirty */
2099 static inline void tlb_set_dirty(CPUState *env, target_ulong vaddr)
2101 int i;
2102 int mmu_idx;
2104 vaddr &= TARGET_PAGE_MASK;
2105 i = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
2106 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
2107 tlb_set_dirty1(&env->tlb_table[mmu_idx][i], vaddr);
2110 /* add a new TLB entry. At most one entry for a given virtual address
2111 is permitted. Return 0 if OK or 2 if the page could not be mapped
2112 (can only happen in non-SOFTMMU mode for I/O pages or pages
2113 conflicting with the host address space). */
2114 int tlb_set_page_exec(CPUState *env, target_ulong vaddr,
2115 target_phys_addr_t paddr, int prot,
2116 int mmu_idx, int is_softmmu)
2118 PhysPageDesc *p;
2119 unsigned long pd;
2120 unsigned int index;
2121 target_ulong address;
2122 target_ulong code_address;
2123 target_phys_addr_t addend;
2124 int ret;
2125 CPUTLBEntry *te;
2126 CPUWatchpoint *wp;
2127 target_phys_addr_t iotlb;
2129 p = phys_page_find(paddr >> TARGET_PAGE_BITS);
2130 if (!p) {
2131 pd = IO_MEM_UNASSIGNED;
2132 } else {
2133 pd = p->phys_offset;
2135 #if defined(DEBUG_TLB)
2136 printf("tlb_set_page: vaddr=" TARGET_FMT_lx " paddr=0x%08x prot=%x idx=%d smmu=%d pd=0x%08lx\n",
2137 vaddr, (int)paddr, prot, mmu_idx, is_softmmu, pd);
2138 #endif
2140 ret = 0;
2141 address = vaddr;
2142 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM && !(pd & IO_MEM_ROMD)) {
2143 /* IO memory case (romd handled later) */
2144 address |= TLB_MMIO;
2146 addend = (unsigned long)qemu_get_ram_ptr(pd & TARGET_PAGE_MASK);
2147 if ((pd & ~TARGET_PAGE_MASK) <= IO_MEM_ROM) {
2148 /* Normal RAM. */
2149 iotlb = pd & TARGET_PAGE_MASK;
2150 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM)
2151 iotlb |= IO_MEM_NOTDIRTY;
2152 else
2153 iotlb |= IO_MEM_ROM;
2154 } else {
2155 /* IO handlers are currently passed a physical address.
2156 It would be nice to pass an offset from the base address
2157 of that region. This would avoid having to special case RAM,
2158 and avoid full address decoding in every device.
2159 We can't use the high bits of pd for this because
2160 IO_MEM_ROMD uses these as a ram address. */
2161 iotlb = (pd & ~TARGET_PAGE_MASK);
2162 if (p) {
2163 iotlb += p->region_offset;
2164 } else {
2165 iotlb += paddr;
2169 code_address = address;
2170 /* Make accesses to pages with watchpoints go via the
2171 watchpoint trap routines. */
2172 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
2173 if (vaddr == (wp->vaddr & TARGET_PAGE_MASK)) {
2174 iotlb = io_mem_watch + paddr;
2175 /* TODO: The memory case can be optimized by not trapping
2176 reads of pages with a write breakpoint. */
2177 address |= TLB_MMIO;
2181 index = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
2182 env->iotlb[mmu_idx][index] = iotlb - vaddr;
2183 te = &env->tlb_table[mmu_idx][index];
2184 te->addend = addend - vaddr;
2185 if (prot & PAGE_READ) {
2186 te->addr_read = address;
2187 } else {
2188 te->addr_read = -1;
2191 if (prot & PAGE_EXEC) {
2192 te->addr_code = code_address;
2193 } else {
2194 te->addr_code = -1;
2196 if (prot & PAGE_WRITE) {
2197 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_ROM ||
2198 (pd & IO_MEM_ROMD)) {
2199 /* Write access calls the I/O callback. */
2200 te->addr_write = address | TLB_MMIO;
2201 } else if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM &&
2202 !cpu_physical_memory_is_dirty(pd)) {
2203 te->addr_write = address | TLB_NOTDIRTY;
2204 } else {
2205 te->addr_write = address;
2207 } else {
2208 te->addr_write = -1;
2210 return ret;
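/* Note on the entry installed above: addr_read/addr_write/addr_code hold
 * the virtual page address, or -1 when the corresponding permission is
 * absent.  TLB_MMIO forces the access through the I/O path, TLB_NOTDIRTY
 * forces writes through notdirty_mem_write so the dirty bitmap is kept up
 * to date, and env->iotlb[mmu_idx] holds the I/O index or RAM offset
 * (biased by -vaddr) that the softmmu slow path uses. */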
2213 #else
2215 void tlb_flush(CPUState *env, int flush_global)
2219 void tlb_flush_page(CPUState *env, target_ulong addr)
2224 * Walks guest process memory "regions" one by one
2225 * and calls callback function 'fn' for each region.
2228 struct walk_memory_regions_data
2230 walk_memory_regions_fn fn;
2231 void *priv;
2232 unsigned long start;
2233 int prot;
2236 static int walk_memory_regions_end(struct walk_memory_regions_data *data,
2237 abi_ulong end, int new_prot)
2239 if (data->start != -1ul) {
2240 int rc = data->fn(data->priv, data->start, end, data->prot);
2241 if (rc != 0) {
2242 return rc;
2246 data->start = (new_prot ? end : -1ul);
2247 data->prot = new_prot;
2249 return 0;
2252 static int walk_memory_regions_1(struct walk_memory_regions_data *data,
2253 abi_ulong base, int level, void **lp)
2255 abi_ulong pa;
2256 int i, rc;
2258 if (*lp == NULL) {
2259 return walk_memory_regions_end(data, base, 0);
2262 if (level == 0) {
2263 PageDesc *pd = *lp;
2264 for (i = 0; i < L2_SIZE; ++i) {
2265 int prot = pd[i].flags;
2267 pa = base | (i << TARGET_PAGE_BITS);
2268 if (prot != data->prot) {
2269 rc = walk_memory_regions_end(data, pa, prot);
2270 if (rc != 0) {
2271 return rc;
2275 } else {
2276 void **pp = *lp;
2277 for (i = 0; i < L2_SIZE; ++i) {
2278 pa = base | ((abi_ulong)i <<
2279 (TARGET_PAGE_BITS + L2_BITS * level));
2280 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
2281 if (rc != 0) {
2282 return rc;
2287 return 0;
2290 int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
2292 struct walk_memory_regions_data data;
2293 unsigned long i;
2295 data.fn = fn;
2296 data.priv = priv;
2297 data.start = -1ul;
2298 data.prot = 0;
2300 for (i = 0; i < V_L1_SIZE; i++) {
2301 int rc = walk_memory_regions_1(&data, (abi_ulong)i << V_L1_SHIFT,
2302 V_L1_SHIFT / L2_BITS - 1, l1_map + i);
2303 if (rc != 0) {
2304 return rc;
2308 return walk_memory_regions_end(&data, 0, 0);
2311 static int dump_region(void *priv, abi_ulong start,
2312 abi_ulong end, unsigned long prot)
2314 FILE *f = (FILE *)priv;
2316 (void) fprintf(f, TARGET_ABI_FMT_lx"-"TARGET_ABI_FMT_lx
2317 " "TARGET_ABI_FMT_lx" %c%c%c\n",
2318 start, end, end - start,
2319 ((prot & PAGE_READ) ? 'r' : '-'),
2320 ((prot & PAGE_WRITE) ? 'w' : '-'),
2321 ((prot & PAGE_EXEC) ? 'x' : '-'));
2323 return (0);
2326 /* dump memory mappings */
2327 void page_dump(FILE *f)
2329 (void) fprintf(f, "%-8s %-8s %-8s %s\n",
2330 "start", "end", "size", "prot");
2331 walk_memory_regions(f, dump_region);
2334 int page_get_flags(target_ulong address)
2336 PageDesc *p;
2338 p = page_find(address >> TARGET_PAGE_BITS);
2339 if (!p)
2340 return 0;
2341 return p->flags;
2344 /* Modify the flags of a page and invalidate the code if necessary.
2345 The flag PAGE_WRITE_ORG is positioned automatically depending
2346 on PAGE_WRITE. The mmap_lock should already be held. */
2347 void page_set_flags(target_ulong start, target_ulong end, int flags)
2349 target_ulong addr, len;
2351 /* This function should never be called with addresses outside the
2352 guest address space. If this assert fires, it probably indicates
2353 a missing call to h2g_valid. */
2354 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2355 assert(end < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2356 #endif
2357 assert(start < end);
2359 start = start & TARGET_PAGE_MASK;
2360 end = TARGET_PAGE_ALIGN(end);
2362 if (flags & PAGE_WRITE) {
2363 flags |= PAGE_WRITE_ORG;
2366 for (addr = start, len = end - start;
2367 len != 0;
2368 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2369 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2371 /* If the write protection bit is set, then we invalidate
2372 the code inside. */
2373 if (!(p->flags & PAGE_WRITE) &&
2374 (flags & PAGE_WRITE) &&
2375 p->first_tb) {
2376 tb_invalidate_phys_page(addr, 0, NULL);
2378 p->flags = flags;
2382 int page_check_range(target_ulong start, target_ulong len, int flags)
2384 PageDesc *p;
2385 target_ulong end;
2386 target_ulong addr;
2388 /* This function should never be called with addresses outside the
2389 guest address space. If this assert fires, it probably indicates
2390 a missing call to h2g_valid. */
2391 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2392 assert(start < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2393 #endif
2395 if (start + len - 1 < start) {
2396 /* We've wrapped around. */
2397 return -1;
2400 end = TARGET_PAGE_ALIGN(start+len); /* must do this before we lose bits in the next step */
2401 start = start & TARGET_PAGE_MASK;
2403 for (addr = start, len = end - start;
2404 len != 0;
2405 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2406 p = page_find(addr >> TARGET_PAGE_BITS);
2407 if (!p)
2408 return -1;
2409 if (!(p->flags & PAGE_VALID))
2410 return -1;
2412 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ))
2413 return -1;
2414 if (flags & PAGE_WRITE) {
2415 if (!(p->flags & PAGE_WRITE_ORG))
2416 return -1;
2417 /* unprotect the page if it was put read-only because it
2418 contains translated code */
2419 if (!(p->flags & PAGE_WRITE)) {
2420 if (!page_unprotect(addr, 0, NULL))
2421 return -1;
2423 return 0;
2426 return 0;
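/* Illustrative sketch (not part of this file): user-mode callers normally
 * validate a guest buffer before touching it, along the lines of
 *
 *     if (page_check_range(guest_addr, size, PAGE_READ | PAGE_WRITE) < 0) {
 *         return -TARGET_EFAULT;   // assumed errno constant from linux-user
 *     }
 *
 * guest_addr and size are hypothetical parameters of the caller. */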
2429 /* called from signal handler: invalidate the code and unprotect the
2430 page. Return TRUE if the fault was successfully handled. */
2431 int page_unprotect(target_ulong address, unsigned long pc, void *puc)
2433 unsigned int page_index, prot, pindex;
2434 PageDesc *p, *p1;
2435 target_ulong host_start, host_end, addr;
2437 /* Technically this isn't safe inside a signal handler. However, we
2438 know this only ever happens in a synchronous SEGV handler, so in
2439 practice it seems to be ok. */
2440 mmap_lock();
2442 host_start = address & qemu_host_page_mask;
2443 page_index = host_start >> TARGET_PAGE_BITS;
2444 p1 = page_find(page_index);
2445 if (!p1) {
2446 mmap_unlock();
2447 return 0;
2449 host_end = host_start + qemu_host_page_size;
2450 p = p1;
2451 prot = 0;
2452 for(addr = host_start; addr < host_end; addr += TARGET_PAGE_SIZE) {
2453 prot |= p->flags;
2454 p++;
2456 /* if the page was really writable, then we change its
2457 protection back to writable */
2458 if (prot & PAGE_WRITE_ORG) {
2459 pindex = (address - host_start) >> TARGET_PAGE_BITS;
2460 if (!(p1[pindex].flags & PAGE_WRITE)) {
2461 mprotect((void *)g2h(host_start), qemu_host_page_size,
2462 (prot & PAGE_BITS) | PAGE_WRITE);
2463 p1[pindex].flags |= PAGE_WRITE;
2464 /* and since the content will be modified, we must invalidate
2465 the corresponding translated code. */
2466 tb_invalidate_phys_page(address, pc, puc);
2467 #ifdef DEBUG_TB_CHECK
2468 tb_invalidate_check(address);
2469 #endif
2470 mmap_unlock();
2471 return 1;
2474 mmap_unlock();
2475 return 0;
2478 static inline void tlb_set_dirty(CPUState *env,
2479 unsigned long addr, target_ulong vaddr)
2482 #endif /* defined(CONFIG_USER_ONLY) */
2484 #if !defined(CONFIG_USER_ONLY)
2486 #define SUBPAGE_IDX(addr) ((addr) & ~TARGET_PAGE_MASK)
2487 typedef struct subpage_t {
2488 target_phys_addr_t base;
2489 CPUReadMemoryFunc * const *mem_read[TARGET_PAGE_SIZE][4];
2490 CPUWriteMemoryFunc * const *mem_write[TARGET_PAGE_SIZE][4];
2491 void *opaque[TARGET_PAGE_SIZE][2][4];
2492 ram_addr_t region_offset[TARGET_PAGE_SIZE][2][4];
2493 } subpage_t;
2495 static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
2496 ram_addr_t memory, ram_addr_t region_offset);
2497 static void *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
2498 ram_addr_t orig_memory, ram_addr_t region_offset);
2499 #define CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2, \
2500 need_subpage) \
2501 do { \
2502 if (addr > start_addr) \
2503 start_addr2 = 0; \
2504 else { \
2505 start_addr2 = start_addr & ~TARGET_PAGE_MASK; \
2506 if (start_addr2 > 0) \
2507 need_subpage = 1; \
2510 if ((start_addr + orig_size) - addr >= TARGET_PAGE_SIZE) \
2511 end_addr2 = TARGET_PAGE_SIZE - 1; \
2512 else { \
2513 end_addr2 = (start_addr + orig_size - 1) & ~TARGET_PAGE_MASK; \
2514 if (end_addr2 < TARGET_PAGE_SIZE - 1) \
2515 need_subpage = 1; \
2517 } while (0)
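/* Worked example: registering a 0x200-byte region starting 0x100 bytes
 * into a page gives start_addr2 = 0x100 and end_addr2 = 0x2ff on the first
 * iteration, so need_subpage is set and the range is handed to
 * subpage_register() instead of being mapped as a whole page. */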
2519 /* register physical memory.
2520 For RAM, 'size' must be a multiple of the target page size.
2521 If (phys_offset & ~TARGET_PAGE_MASK) != 0, then it is an
2522 io memory page. The address used when calling the IO function is
2523 the offset from the start of the region, plus region_offset. Both
2524 start_addr and region_offset are rounded down to a page boundary
2525 before calculating this offset. This should not be a problem unless
2526 the low bits of start_addr and region_offset differ. */
2527 void cpu_register_physical_memory_offset(target_phys_addr_t start_addr,
2528 ram_addr_t size,
2529 ram_addr_t phys_offset,
2530 ram_addr_t region_offset)
2532 target_phys_addr_t addr, end_addr;
2533 PhysPageDesc *p;
2534 CPUState *env;
2535 ram_addr_t orig_size = size;
2536 void *subpage;
2538 cpu_notify_set_memory(start_addr, size, phys_offset);
2540 if (phys_offset == IO_MEM_UNASSIGNED) {
2541 region_offset = start_addr;
2543 region_offset &= TARGET_PAGE_MASK;
2544 size = (size + TARGET_PAGE_SIZE - 1) & TARGET_PAGE_MASK;
2545 end_addr = start_addr + (target_phys_addr_t)size;
2546 for(addr = start_addr; addr != end_addr; addr += TARGET_PAGE_SIZE) {
2547 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2548 if (p && p->phys_offset != IO_MEM_UNASSIGNED) {
2549 ram_addr_t orig_memory = p->phys_offset;
2550 target_phys_addr_t start_addr2, end_addr2;
2551 int need_subpage = 0;
2553 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2,
2554 need_subpage);
2555 if (need_subpage || phys_offset & IO_MEM_SUBWIDTH) {
2556 if (!(orig_memory & IO_MEM_SUBPAGE)) {
2557 subpage = subpage_init((addr & TARGET_PAGE_MASK),
2558 &p->phys_offset, orig_memory,
2559 p->region_offset);
2560 } else {
2561 subpage = io_mem_opaque[(orig_memory & ~TARGET_PAGE_MASK)
2562 >> IO_MEM_SHIFT];
2564 subpage_register(subpage, start_addr2, end_addr2, phys_offset,
2565 region_offset);
2566 p->region_offset = 0;
2567 } else {
2568 p->phys_offset = phys_offset;
2569 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
2570 (phys_offset & IO_MEM_ROMD))
2571 phys_offset += TARGET_PAGE_SIZE;
2573 } else {
2574 p = phys_page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2575 p->phys_offset = phys_offset;
2576 p->region_offset = region_offset;
2577 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
2578 (phys_offset & IO_MEM_ROMD)) {
2579 phys_offset += TARGET_PAGE_SIZE;
2580 } else {
2581 target_phys_addr_t start_addr2, end_addr2;
2582 int need_subpage = 0;
2584 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr,
2585 end_addr2, need_subpage);
2587 if (need_subpage || phys_offset & IO_MEM_SUBWIDTH) {
2588 subpage = subpage_init((addr & TARGET_PAGE_MASK),
2589 &p->phys_offset, IO_MEM_UNASSIGNED,
2590 addr & TARGET_PAGE_MASK);
2591 subpage_register(subpage, start_addr2, end_addr2,
2592 phys_offset, region_offset);
2593 p->region_offset = 0;
2597 region_offset += TARGET_PAGE_SIZE;
2600 /* since each CPU stores ram addresses in its TLB cache, we must
2601 reset the modified entries */
2602 /* XXX: slow ! */
2603 for(env = first_cpu; env != NULL; env = env->next_cpu) {
2604 tlb_flush(env, 1);
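/* Illustrative sketch (not part of this file): a device model typically
 * maps an MMIO page by passing the index returned by
 * cpu_register_io_memory() (defined later in this file) as phys_offset:
 *
 *     int io = cpu_register_io_memory(mydev_read, mydev_write, s);
 *     cpu_register_physical_memory_offset(base, TARGET_PAGE_SIZE, io, 0);
 *
 * mydev_read/mydev_write and s are hypothetical device callbacks/state. */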
2608 /* XXX: temporary until new memory mapping API */
2609 ram_addr_t cpu_get_physical_page_desc(target_phys_addr_t addr)
2611 PhysPageDesc *p;
2613 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2614 if (!p)
2615 return IO_MEM_UNASSIGNED;
2616 return p->phys_offset;
2619 void qemu_register_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
2621 if (kvm_enabled())
2622 kvm_coalesce_mmio_region(addr, size);
2625 void qemu_unregister_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
2627 if (kvm_enabled())
2628 kvm_uncoalesce_mmio_region(addr, size);
2631 void qemu_flush_coalesced_mmio_buffer(void)
2633 if (kvm_enabled())
2634 kvm_flush_coalesced_mmio_buffer();
2637 #if defined(__linux__) && !defined(TARGET_S390X)
2639 #include <sys/vfs.h>
2641 #define HUGETLBFS_MAGIC 0x958458f6
2643 static long gethugepagesize(const char *path)
2645 struct statfs fs;
2646 int ret;
2648 do {
2649 ret = statfs(path, &fs);
2650 } while (ret != 0 && errno == EINTR);
2652 if (ret != 0) {
2653 perror("statfs");
2654 return 0;
2657 if (fs.f_type != HUGETLBFS_MAGIC)
2658 fprintf(stderr, "Warning: path not on HugeTLBFS: %s\n", path);
2660 return fs.f_bsize;
2663 static void *file_ram_alloc(ram_addr_t memory, const char *path)
2665 char *filename;
2666 void *area;
2667 int fd;
2668 #ifdef MAP_POPULATE
2669 int flags;
2670 #endif
2671 unsigned long hpagesize;
2673 hpagesize = gethugepagesize(path);
2674 if (!hpagesize) {
2675 return NULL;
2678 if (memory < hpagesize) {
2679 return NULL;
2682 if (kvm_enabled() && !kvm_has_sync_mmu()) {
2683 fprintf(stderr, "host lacks kvm mmu notifiers, -mem-path unsupported\n");
2684 return NULL;
2687 if (asprintf(&filename, "%s/qemu_back_mem.XXXXXX", path) == -1) {
2688 return NULL;
2691 fd = mkstemp(filename);
2692 if (fd < 0) {
2693 perror("mkstemp");
2694 free(filename);
2695 return NULL;
2697 unlink(filename);
2698 free(filename);
2700 memory = (memory+hpagesize-1) & ~(hpagesize-1);
2703 * ftruncate is not supported by hugetlbfs in older
2704 * hosts, so don't bother bailing out on errors.
2705 * If anything goes wrong with it under other filesystems,
2706 * mmap will fail.
2708 if (ftruncate(fd, memory))
2709 perror("ftruncate");
2711 #ifdef MAP_POPULATE
2712 /* NB: MAP_POPULATE won't exhaustively alloc all phys pages in the case
2713 * MAP_PRIVATE is requested. For mem_prealloc we mmap as MAP_SHARED
2714 * to sidestep this quirk.
2716 flags = mem_prealloc ? MAP_POPULATE | MAP_SHARED : MAP_PRIVATE;
2717 area = mmap(0, memory, PROT_READ | PROT_WRITE, flags, fd, 0);
2718 #else
2719 area = mmap(0, memory, PROT_READ | PROT_WRITE, MAP_PRIVATE, fd, 0);
2720 #endif
2721 if (area == MAP_FAILED) {
2722 perror("file_ram_alloc: can't mmap RAM pages");
2723 close(fd);
2724 return (NULL);
2726 return area;
2728 #endif
2730 ram_addr_t qemu_ram_alloc(ram_addr_t size)
2732 RAMBlock *new_block;
2734 size = TARGET_PAGE_ALIGN(size);
2735 new_block = qemu_malloc(sizeof(*new_block));
2737 if (mem_path) {
2738 #if defined (__linux__) && !defined(TARGET_S390X)
2739 new_block->host = file_ram_alloc(size, mem_path);
2740 if (!new_block->host)
2741 exit(1);
2742 #else
2743 fprintf(stderr, "-mem-path option unsupported\n");
2744 exit(1);
2745 #endif
2746 } else {
2747 #if defined(TARGET_S390X) && defined(CONFIG_KVM)
2748 /* XXX S390 KVM requires the topmost vma of the RAM to be < 256GB */
2749 new_block->host = mmap((void*)0x1000000, size,
2750 PROT_EXEC|PROT_READ|PROT_WRITE,
2751 MAP_SHARED | MAP_ANONYMOUS, -1, 0);
2752 #else
2753 new_block->host = qemu_vmalloc(size);
2754 #endif
2755 #ifdef MADV_MERGEABLE
2756 madvise(new_block->host, size, MADV_MERGEABLE);
2757 #endif
2759 new_block->offset = last_ram_offset;
2760 new_block->length = size;
2762 new_block->next = ram_blocks;
2763 ram_blocks = new_block;
2765 phys_ram_dirty = qemu_realloc(phys_ram_dirty,
2766 (last_ram_offset + size) >> TARGET_PAGE_BITS);
2767 memset(phys_ram_dirty + (last_ram_offset >> TARGET_PAGE_BITS),
2768 0xff, size >> TARGET_PAGE_BITS);
2770 last_ram_offset += size;
2772 if (kvm_enabled())
2773 kvm_setup_guest_memory(new_block->host, size);
2775 return new_block->offset;
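/* Illustrative sketch (not part of this file): board code usually pairs
 * this allocator with the registration helper above, e.g.
 *
 *     ram_addr_t ram_offset = qemu_ram_alloc(ram_size);
 *     cpu_register_physical_memory_offset(0, ram_size,
 *                                         ram_offset | IO_MEM_RAM, 0);
 *
 * so that guest physical address 0 is backed by the new block (IO_MEM_RAM
 * is the conventional RAM marker; the OR is a no-op when it is zero). */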
2778 void qemu_ram_free(ram_addr_t addr)
2780 /* TODO: implement this. */
2783 /* Return a host pointer to ram allocated with qemu_ram_alloc.
2784 With the exception of the softmmu code in this file, this should
2785 only be used for local memory (e.g. video ram) that the device owns,
2786 and knows it isn't going to access beyond the end of the block.
2788 It should not be used for general purpose DMA.
2789 Use cpu_physical_memory_map/cpu_physical_memory_rw instead.
2791 void *qemu_get_ram_ptr(ram_addr_t addr)
2793 RAMBlock *prev;
2794 RAMBlock **prevp;
2795 RAMBlock *block;
2797 prev = NULL;
2798 prevp = &ram_blocks;
2799 block = ram_blocks;
2800 while (block && (block->offset > addr
2801 || block->offset + block->length <= addr)) {
2802 if (prev)
2803 prevp = &prev->next;
2804 prev = block;
2805 block = block->next;
2807 if (!block) {
2808 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
2809 abort();
2811 /* Move this entry to the start of the list. */
2812 if (prev) {
2813 prev->next = block->next;
2814 block->next = *prevp;
2815 *prevp = block;
2817 return block->host + (addr - block->offset);
2820 int do_qemu_ram_addr_from_host(void *ptr, ram_addr_t *ram_addr)
2822 RAMBlock *prev;
2823 RAMBlock *block;
2824 uint8_t *host = ptr;
2826 prev = NULL;
2827 block = ram_blocks;
2828 while (block && (block->host > host
2829 || block->host + block->length <= host)) {
2830 prev = block;
2831 block = block->next;
2833 if (!block)
2834 return -1;
2835 *ram_addr = block->offset + (host - block->host);
2836 return 0;
2839 /* Some of the softmmu routines need to translate from a host pointer
2840 (typically a TLB entry) back to a ram offset. */
2841 ram_addr_t qemu_ram_addr_from_host(void *ptr)
2843 ram_addr_t ram_addr;
2845 if (do_qemu_ram_addr_from_host(ptr, &ram_addr)) {
2846 fprintf(stderr, "Bad ram pointer %p\n", ptr);
2847 abort();
2849 return ram_addr;
2852 static uint32_t unassigned_mem_readb(void *opaque, target_phys_addr_t addr)
2854 #ifdef DEBUG_UNASSIGNED
2855 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
2856 #endif
2857 #if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
2858 do_unassigned_access(addr, 0, 0, 0, 1);
2859 #endif
2860 return 0;
2863 static uint32_t unassigned_mem_readw(void *opaque, target_phys_addr_t addr)
2865 #ifdef DEBUG_UNASSIGNED
2866 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
2867 #endif
2868 #if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
2869 do_unassigned_access(addr, 0, 0, 0, 2);
2870 #endif
2871 return 0;
2874 static uint32_t unassigned_mem_readl(void *opaque, target_phys_addr_t addr)
2876 #ifdef DEBUG_UNASSIGNED
2877 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
2878 #endif
2879 #if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
2880 do_unassigned_access(addr, 0, 0, 0, 4);
2881 #endif
2882 return 0;
2885 static void unassigned_mem_writeb(void *opaque, target_phys_addr_t addr, uint32_t val)
2887 #ifdef DEBUG_UNASSIGNED
2888 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
2889 #endif
2890 #if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
2891 do_unassigned_access(addr, 1, 0, 0, 1);
2892 #endif
2895 static void unassigned_mem_writew(void *opaque, target_phys_addr_t addr, uint32_t val)
2897 #ifdef DEBUG_UNASSIGNED
2898 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
2899 #endif
2900 #if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
2901 do_unassigned_access(addr, 1, 0, 0, 2);
2902 #endif
2905 static void unassigned_mem_writel(void *opaque, target_phys_addr_t addr, uint32_t val)
2907 #ifdef DEBUG_UNASSIGNED
2908 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
2909 #endif
2910 #if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
2911 do_unassigned_access(addr, 1, 0, 0, 4);
2912 #endif
2915 static CPUReadMemoryFunc * const unassigned_mem_read[3] = {
2916 unassigned_mem_readb,
2917 unassigned_mem_readw,
2918 unassigned_mem_readl,
2921 static CPUWriteMemoryFunc * const unassigned_mem_write[3] = {
2922 unassigned_mem_writeb,
2923 unassigned_mem_writew,
2924 unassigned_mem_writel,
2927 static void notdirty_mem_writeb(void *opaque, target_phys_addr_t ram_addr,
2928 uint32_t val)
2930 int dirty_flags;
2931 dirty_flags = phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS];
2932 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
2933 #if !defined(CONFIG_USER_ONLY)
2934 tb_invalidate_phys_page_fast(ram_addr, 1);
2935 dirty_flags = phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS];
2936 #endif
2938 stb_p(qemu_get_ram_ptr(ram_addr), val);
2939 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
2940 phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS] = dirty_flags;
2941 /* we remove the notdirty callback only if the code has been
2942 flushed */
2943 if (dirty_flags == 0xff)
2944 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
2947 static void notdirty_mem_writew(void *opaque, target_phys_addr_t ram_addr,
2948 uint32_t val)
2950 int dirty_flags;
2951 dirty_flags = phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS];
2952 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
2953 #if !defined(CONFIG_USER_ONLY)
2954 tb_invalidate_phys_page_fast(ram_addr, 2);
2955 dirty_flags = phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS];
2956 #endif
2958 stw_p(qemu_get_ram_ptr(ram_addr), val);
2959 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
2960 phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS] = dirty_flags;
2961 /* we remove the notdirty callback only if the code has been
2962 flushed */
2963 if (dirty_flags == 0xff)
2964 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
2967 static void notdirty_mem_writel(void *opaque, target_phys_addr_t ram_addr,
2968 uint32_t val)
2970 int dirty_flags;
2971 dirty_flags = phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS];
2972 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
2973 #if !defined(CONFIG_USER_ONLY)
2974 tb_invalidate_phys_page_fast(ram_addr, 4);
2975 dirty_flags = phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS];
2976 #endif
2978 stl_p(qemu_get_ram_ptr(ram_addr), val);
2979 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
2980 phys_ram_dirty[ram_addr >> TARGET_PAGE_BITS] = dirty_flags;
2981 /* we remove the notdirty callback only if the code has been
2982 flushed */
2983 if (dirty_flags == 0xff)
2984 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
2987 static CPUReadMemoryFunc * const error_mem_read[3] = {
2988 NULL, /* never used */
2989 NULL, /* never used */
2990 NULL, /* never used */
2993 static CPUWriteMemoryFunc * const notdirty_mem_write[3] = {
2994 notdirty_mem_writeb,
2995 notdirty_mem_writew,
2996 notdirty_mem_writel,
2999 /* Generate a debug exception if a watchpoint has been hit. */
3000 static void check_watchpoint(int offset, int len_mask, int flags)
3002 CPUState *env = cpu_single_env;
3003 target_ulong pc, cs_base;
3004 TranslationBlock *tb;
3005 target_ulong vaddr;
3006 CPUWatchpoint *wp;
3007 int cpu_flags;
3009 if (env->watchpoint_hit) {
3010 /* We re-entered the check after replacing the TB. Now raise
3011 * the debug interrupt so that it will trigger after the
3012 * current instruction. */
3013 cpu_interrupt(env, CPU_INTERRUPT_DEBUG);
3014 return;
3016 vaddr = (env->mem_io_vaddr & TARGET_PAGE_MASK) + offset;
3017 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
3018 if ((vaddr == (wp->vaddr & len_mask) ||
3019 (vaddr & wp->len_mask) == wp->vaddr) && (wp->flags & flags)) {
3020 wp->flags |= BP_WATCHPOINT_HIT;
3021 if (!env->watchpoint_hit) {
3022 env->watchpoint_hit = wp;
3023 tb = tb_find_pc(env->mem_io_pc);
3024 if (!tb) {
3025 cpu_abort(env, "check_watchpoint: could not find TB for "
3026 "pc=%p", (void *)env->mem_io_pc);
3028 cpu_restore_state(tb, env, env->mem_io_pc, NULL);
3029 tb_phys_invalidate(tb, -1);
3030 if (wp->flags & BP_STOP_BEFORE_ACCESS) {
3031 env->exception_index = EXCP_DEBUG;
3032 } else {
3033 cpu_get_tb_cpu_state(env, &pc, &cs_base, &cpu_flags);
3034 tb_gen_code(env, pc, cs_base, cpu_flags, 1);
3036 cpu_resume_from_signal(env, NULL);
3038 } else {
3039 wp->flags &= ~BP_WATCHPOINT_HIT;
3044 /* Watchpoint access routines. Watchpoints are inserted using TLB tricks,
3045 so these check for a hit then pass through to the normal out-of-line
3046 phys routines. */
3047 static uint32_t watch_mem_readb(void *opaque, target_phys_addr_t addr)
3049 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_READ);
3050 return ldub_phys(addr);
3053 static uint32_t watch_mem_readw(void *opaque, target_phys_addr_t addr)
3055 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_READ);
3056 return lduw_phys(addr);
3059 static uint32_t watch_mem_readl(void *opaque, target_phys_addr_t addr)
3061 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_READ);
3062 return ldl_phys(addr);
3065 static void watch_mem_writeb(void *opaque, target_phys_addr_t addr,
3066 uint32_t val)
3068 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_WRITE);
3069 stb_phys(addr, val);
3072 static void watch_mem_writew(void *opaque, target_phys_addr_t addr,
3073 uint32_t val)
3075 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_WRITE);
3076 stw_phys(addr, val);
3079 static void watch_mem_writel(void *opaque, target_phys_addr_t addr,
3080 uint32_t val)
3082 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_WRITE);
3083 stl_phys(addr, val);
3086 static CPUReadMemoryFunc * const watch_mem_read[3] = {
3087 watch_mem_readb,
3088 watch_mem_readw,
3089 watch_mem_readl,
3092 static CPUWriteMemoryFunc * const watch_mem_write[3] = {
3093 watch_mem_writeb,
3094 watch_mem_writew,
3095 watch_mem_writel,
3098 static inline uint32_t subpage_readlen (subpage_t *mmio, target_phys_addr_t addr,
3099 unsigned int len)
3101 uint32_t ret;
3102 unsigned int idx;
3104 idx = SUBPAGE_IDX(addr);
3105 #if defined(DEBUG_SUBPAGE)
3106 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d\n", __func__,
3107 mmio, len, addr, idx);
3108 #endif
3109 ret = (**mmio->mem_read[idx][len])(mmio->opaque[idx][0][len],
3110 addr + mmio->region_offset[idx][0][len]);
3112 return ret;
3115 static inline void subpage_writelen (subpage_t *mmio, target_phys_addr_t addr,
3116 uint32_t value, unsigned int len)
3118 unsigned int idx;
3120 idx = SUBPAGE_IDX(addr);
3121 #if defined(DEBUG_SUBPAGE)
3122 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d value %08x\n", __func__,
3123 mmio, len, addr, idx, value);
3124 #endif
3125 (**mmio->mem_write[idx][len])(mmio->opaque[idx][1][len],
3126 addr + mmio->region_offset[idx][1][len],
3127 value);
3130 static uint32_t subpage_readb (void *opaque, target_phys_addr_t addr)
3132 #if defined(DEBUG_SUBPAGE)
3133 printf("%s: addr " TARGET_FMT_plx "\n", __func__, addr);
3134 #endif
3136 return subpage_readlen(opaque, addr, 0);
3139 static void subpage_writeb (void *opaque, target_phys_addr_t addr,
3140 uint32_t value)
3142 #if defined(DEBUG_SUBPAGE)
3143 printf("%s: addr " TARGET_FMT_plx " val %08x\n", __func__, addr, value);
3144 #endif
3145 subpage_writelen(opaque, addr, value, 0);
3148 static uint32_t subpage_readw (void *opaque, target_phys_addr_t addr)
3150 #if defined(DEBUG_SUBPAGE)
3151 printf("%s: addr " TARGET_FMT_plx "\n", __func__, addr);
3152 #endif
3154 return subpage_readlen(opaque, addr, 1);
3157 static void subpage_writew (void *opaque, target_phys_addr_t addr,
3158 uint32_t value)
3160 #if defined(DEBUG_SUBPAGE)
3161 printf("%s: addr " TARGET_FMT_plx " val %08x\n", __func__, addr, value);
3162 #endif
3163 subpage_writelen(opaque, addr, value, 1);
3166 static uint32_t subpage_readl (void *opaque, target_phys_addr_t addr)
3168 #if defined(DEBUG_SUBPAGE)
3169 printf("%s: addr " TARGET_FMT_plx "\n", __func__, addr);
3170 #endif
3172 return subpage_readlen(opaque, addr, 2);
3175 static void subpage_writel (void *opaque,
3176 target_phys_addr_t addr, uint32_t value)
3178 #if defined(DEBUG_SUBPAGE)
3179 printf("%s: addr " TARGET_FMT_plx " val %08x\n", __func__, addr, value);
3180 #endif
3181 subpage_writelen(opaque, addr, value, 2);
3184 static CPUReadMemoryFunc * const subpage_read[] = {
3185 &subpage_readb,
3186 &subpage_readw,
3187 &subpage_readl,
3190 static CPUWriteMemoryFunc * const subpage_write[] = {
3191 &subpage_writeb,
3192 &subpage_writew,
3193 &subpage_writel,
3196 static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
3197 ram_addr_t memory, ram_addr_t region_offset)
3199 int idx, eidx;
3200 unsigned int i;
3202 if (start >= TARGET_PAGE_SIZE || end >= TARGET_PAGE_SIZE)
3203 return -1;
3204 idx = SUBPAGE_IDX(start);
3205 eidx = SUBPAGE_IDX(end);
3206 #if defined(DEBUG_SUBPAGE)
3207 printf("%s: %p start %08x end %08x idx %08x eidx %08x mem %ld\n", __func__,
3208 mmio, start, end, idx, eidx, memory);
3209 #endif
3210 memory >>= IO_MEM_SHIFT;
3211 for (; idx <= eidx; idx++) {
3212 for (i = 0; i < 4; i++) {
3213 if (io_mem_read[memory][i]) {
3214 mmio->mem_read[idx][i] = &io_mem_read[memory][i];
3215 mmio->opaque[idx][0][i] = io_mem_opaque[memory];
3216 mmio->region_offset[idx][0][i] = region_offset;
3218 if (io_mem_write[memory][i]) {
3219 mmio->mem_write[idx][i] = &io_mem_write[memory][i];
3220 mmio->opaque[idx][1][i] = io_mem_opaque[memory];
3221 mmio->region_offset[idx][1][i] = region_offset;
3226 return 0;
3229 static void *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
3230 ram_addr_t orig_memory, ram_addr_t region_offset)
3232 subpage_t *mmio;
3233 int subpage_memory;
3235 mmio = qemu_mallocz(sizeof(subpage_t));
3237 mmio->base = base;
3238 subpage_memory = cpu_register_io_memory(subpage_read, subpage_write, mmio);
3239 #if defined(DEBUG_SUBPAGE)
3240 printf("%s: %p base " TARGET_FMT_plx " len %08x %d\n", __func__,
3241 mmio, base, TARGET_PAGE_SIZE, subpage_memory);
3242 #endif
3243 *phys = subpage_memory | IO_MEM_SUBPAGE;
3244 subpage_register(mmio, 0, TARGET_PAGE_SIZE - 1, orig_memory,
3245 region_offset);
3247 return mmio;
3250 static int get_free_io_mem_idx(void)
3252 int i;
3254 for (i = 0; i < IO_MEM_NB_ENTRIES; i++)
3255 if (!io_mem_used[i]) {
3256 io_mem_used[i] = 1;
3257 return i;
3259 fprintf(stderr, "ran out of io_mem_idx, max %d !\n", IO_MEM_NB_ENTRIES);
3260 return -1;
3263 /* mem_read and mem_write are arrays of functions containing the
3264 function to access byte (index 0), word (index 1) and dword (index
3265 2). Functions can be omitted with a NULL function pointer.
3266 If io_index is non-zero, the corresponding io zone is
3267 modified. If it is zero, a new io zone is allocated. The return
3268 value can be used with cpu_register_physical_memory(). (-1) is
3269 returned on error. */
3270 static int cpu_register_io_memory_fixed(int io_index,
3271 CPUReadMemoryFunc * const *mem_read,
3272 CPUWriteMemoryFunc * const *mem_write,
3273 void *opaque)
3275 int i, subwidth = 0;
3277 if (io_index <= 0) {
3278 io_index = get_free_io_mem_idx();
3279 if (io_index == -1)
3280 return io_index;
3281 } else {
3282 io_index >>= IO_MEM_SHIFT;
3283 if (io_index >= IO_MEM_NB_ENTRIES)
3284 return -1;
3287 for(i = 0; i < 3; i++) {
3288 if (!mem_read[i] || !mem_write[i])
3289 subwidth = IO_MEM_SUBWIDTH;
3290 io_mem_read[io_index][i] = mem_read[i];
3291 io_mem_write[io_index][i] = mem_write[i];
3293 io_mem_opaque[io_index] = opaque;
3294 return (io_index << IO_MEM_SHIFT) | subwidth;
3297 int cpu_register_io_memory(CPUReadMemoryFunc * const *mem_read,
3298 CPUWriteMemoryFunc * const *mem_write,
3299 void *opaque)
3301 return cpu_register_io_memory_fixed(0, mem_read, mem_write, opaque);
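/* Illustrative sketch (not part of this file): callers hand in arrays of
 * byte/word/long accessors for a hypothetical device "mydev":
 *
 *     static CPUReadMemoryFunc * const mydev_read[3] = {
 *         mydev_readb, mydev_readw, mydev_readl,
 *     };
 *     static CPUWriteMemoryFunc * const mydev_write[3] = {
 *         mydev_writeb, mydev_writew, mydev_writel,
 *     };
 *     int io = cpu_register_io_memory(mydev_read, mydev_write, opaque);
 *
 * The returned value is then used as the phys_offset argument of
 * cpu_register_physical_memory_offset(). */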
3304 void cpu_unregister_io_memory(int io_table_address)
3306 int i;
3307 int io_index = io_table_address >> IO_MEM_SHIFT;
3309 for (i = 0; i < 3; i++) {
3310 io_mem_read[io_index][i] = unassigned_mem_read[i];
3311 io_mem_write[io_index][i] = unassigned_mem_write[i];
3313 io_mem_opaque[io_index] = NULL;
3314 io_mem_used[io_index] = 0;
3317 static void io_mem_init(void)
3319 int i;
3321 cpu_register_io_memory_fixed(IO_MEM_ROM, error_mem_read, unassigned_mem_write, NULL);
3322 cpu_register_io_memory_fixed(IO_MEM_UNASSIGNED, unassigned_mem_read, unassigned_mem_write, NULL);
3323 cpu_register_io_memory_fixed(IO_MEM_NOTDIRTY, error_mem_read, notdirty_mem_write, NULL);
3324 for (i = 0; i < 5; i++)
3325 io_mem_used[i] = 1;
3327 io_mem_watch = cpu_register_io_memory(watch_mem_read,
3328 watch_mem_write, NULL);
3331 #endif /* !defined(CONFIG_USER_ONLY) */
3333 /* physical memory access (slow version, mainly for debug) */
3334 #if defined(CONFIG_USER_ONLY)
3335 int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
3336 uint8_t *buf, int len, int is_write)
3338 int l, flags;
3339 target_ulong page;
3340 void * p;
3342 while (len > 0) {
3343 page = addr & TARGET_PAGE_MASK;
3344 l = (page + TARGET_PAGE_SIZE) - addr;
3345 if (l > len)
3346 l = len;
3347 flags = page_get_flags(page);
3348 if (!(flags & PAGE_VALID))
3349 return -1;
3350 if (is_write) {
3351 if (!(flags & PAGE_WRITE))
3352 return -1;
3353 /* XXX: this code should not depend on lock_user */
3354 if (!(p = lock_user(VERIFY_WRITE, addr, l, 0)))
3355 return -1;
3356 memcpy(p, buf, l);
3357 unlock_user(p, addr, l);
3358 } else {
3359 if (!(flags & PAGE_READ))
3360 return -1;
3361 /* XXX: this code should not depend on lock_user */
3362 if (!(p = lock_user(VERIFY_READ, addr, l, 1)))
3363 return -1;
3364 memcpy(buf, p, l);
3365 unlock_user(p, addr, 0);
3367 len -= l;
3368 buf += l;
3369 addr += l;
3371 return 0;
3374 #else
3375 void cpu_physical_memory_rw(target_phys_addr_t addr, uint8_t *buf,
3376 int len, int is_write)
3378 int l, io_index;
3379 uint8_t *ptr;
3380 uint32_t val;
3381 target_phys_addr_t page;
3382 unsigned long pd;
3383 PhysPageDesc *p;
3385 while (len > 0) {
3386 page = addr & TARGET_PAGE_MASK;
3387 l = (page + TARGET_PAGE_SIZE) - addr;
3388 if (l > len)
3389 l = len;
3390 p = phys_page_find(page >> TARGET_PAGE_BITS);
3391 if (!p) {
3392 pd = IO_MEM_UNASSIGNED;
3393 } else {
3394 pd = p->phys_offset;
3397 if (is_write) {
3398 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
3399 target_phys_addr_t addr1 = addr;
3400 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
3401 if (p)
3402 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3403 /* XXX: could force cpu_single_env to NULL to avoid
3404 potential bugs */
3405 if (l >= 4 && ((addr1 & 3) == 0)) {
3406 /* 32 bit write access */
3407 val = ldl_p(buf);
3408 io_mem_write[io_index][2](io_mem_opaque[io_index], addr1, val);
3409 l = 4;
3410 } else if (l >= 2 && ((addr1 & 1) == 0)) {
3411 /* 16 bit write access */
3412 val = lduw_p(buf);
3413 io_mem_write[io_index][1](io_mem_opaque[io_index], addr1, val);
3414 l = 2;
3415 } else {
3416 /* 8 bit write access */
3417 val = ldub_p(buf);
3418 io_mem_write[io_index][0](io_mem_opaque[io_index], addr1, val);
3419 l = 1;
3421 } else {
3422 unsigned long addr1;
3423 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
3424 /* RAM case */
3425 ptr = qemu_get_ram_ptr(addr1);
3426 memcpy(ptr, buf, l);
3427 if (!cpu_physical_memory_is_dirty(addr1)) {
3428 /* invalidate code */
3429 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
3430 /* set dirty bit */
3431 phys_ram_dirty[addr1 >> TARGET_PAGE_BITS] |=
3432 (0xff & ~CODE_DIRTY_FLAG);
3434 /* qemu doesn't execute guest code directly, but kvm does,
3435 so flush the instruction caches */
3436 if (kvm_enabled())
3437 flush_icache_range((unsigned long)ptr,
3438 ((unsigned long)ptr)+l);
3440 } else {
3441 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
3442 !(pd & IO_MEM_ROMD)) {
3443 target_phys_addr_t addr1 = addr;
3444 /* I/O case */
3445 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
3446 if (p)
3447 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3448 if (l >= 4 && ((addr1 & 3) == 0)) {
3449 /* 32 bit read access */
3450 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr1);
3451 stl_p(buf, val);
3452 l = 4;
3453 } else if (l >= 2 && ((addr1 & 1) == 0)) {
3454 /* 16 bit read access */
3455 val = io_mem_read[io_index][1](io_mem_opaque[io_index], addr1);
3456 stw_p(buf, val);
3457 l = 2;
3458 } else {
3459 /* 8 bit read access */
3460 val = io_mem_read[io_index][0](io_mem_opaque[io_index], addr1);
3461 stb_p(buf, val);
3462 l = 1;
3464 } else {
3465 /* RAM case */
3466 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
3467 (addr & ~TARGET_PAGE_MASK);
3468 memcpy(buf, ptr, l);
3471 len -= l;
3472 buf += l;
3473 addr += l;
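/* Illustrative sketch (not part of this file): most callers use the
 * cpu_physical_memory_read()/cpu_physical_memory_write() wrappers from
 * cpu-common.h rather than calling cpu_physical_memory_rw() directly,
 * e.g. to fetch a guest descriptor at a hypothetical address desc_addr:
 *
 *     uint8_t desc[16];
 *     cpu_physical_memory_read(desc_addr, desc, sizeof(desc));
 */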
3477 /* used for ROM loading : can write in RAM and ROM */
3478 void cpu_physical_memory_write_rom(target_phys_addr_t addr,
3479 const uint8_t *buf, int len)
3481 int l;
3482 uint8_t *ptr;
3483 target_phys_addr_t page;
3484 unsigned long pd;
3485 PhysPageDesc *p;
3487 while (len > 0) {
3488 page = addr & TARGET_PAGE_MASK;
3489 l = (page + TARGET_PAGE_SIZE) - addr;
3490 if (l > len)
3491 l = len;
3492 p = phys_page_find(page >> TARGET_PAGE_BITS);
3493 if (!p) {
3494 pd = IO_MEM_UNASSIGNED;
3495 } else {
3496 pd = p->phys_offset;
3499 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM &&
3500 (pd & ~TARGET_PAGE_MASK) != IO_MEM_ROM &&
3501 !(pd & IO_MEM_ROMD)) {
3502 /* do nothing */
3503 } else {
3504 unsigned long addr1;
3505 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
3506 /* ROM/RAM case */
3507 ptr = qemu_get_ram_ptr(addr1);
3508 memcpy(ptr, buf, l);
3510 len -= l;
3511 buf += l;
3512 addr += l;
3516 typedef struct {
3517 void *buffer;
3518 target_phys_addr_t addr;
3519 target_phys_addr_t len;
3520 } BounceBuffer;
3522 static BounceBuffer bounce;
3524 typedef struct MapClient {
3525 void *opaque;
3526 void (*callback)(void *opaque);
3527 QLIST_ENTRY(MapClient) link;
3528 } MapClient;
3530 static QLIST_HEAD(map_client_list, MapClient) map_client_list
3531 = QLIST_HEAD_INITIALIZER(map_client_list);
3533 void *cpu_register_map_client(void *opaque, void (*callback)(void *opaque))
3535 MapClient *client = qemu_malloc(sizeof(*client));
3537 client->opaque = opaque;
3538 client->callback = callback;
3539 QLIST_INSERT_HEAD(&map_client_list, client, link);
3540 return client;
3543 void cpu_unregister_map_client(void *_client)
3545 MapClient *client = (MapClient *)_client;
3547 QLIST_REMOVE(client, link);
3548 qemu_free(client);
3551 static void cpu_notify_map_clients(void)
3553 MapClient *client;
3555 while (!QLIST_EMPTY(&map_client_list)) {
3556 client = QLIST_FIRST(&map_client_list);
3557 client->callback(client->opaque);
3558 cpu_unregister_map_client(client);
3562 /* Map a physical memory region into a host virtual address.
3563 * May map a subset of the requested range, given by and returned in *plen.
3564 * May return NULL if resources needed to perform the mapping are exhausted.
3565 * Use only for reads OR writes - not for read-modify-write operations.
3566 * Use cpu_register_map_client() to know when retrying the map operation is
3567 * likely to succeed.
3569 void *cpu_physical_memory_map(target_phys_addr_t addr,
3570 target_phys_addr_t *plen,
3571 int is_write)
3573 target_phys_addr_t len = *plen;
3574 target_phys_addr_t done = 0;
3575 int l;
3576 uint8_t *ret = NULL;
3577 uint8_t *ptr;
3578 target_phys_addr_t page;
3579 unsigned long pd;
3580 PhysPageDesc *p;
3581 unsigned long addr1;
3583 while (len > 0) {
3584 page = addr & TARGET_PAGE_MASK;
3585 l = (page + TARGET_PAGE_SIZE) - addr;
3586 if (l > len)
3587 l = len;
3588 p = phys_page_find(page >> TARGET_PAGE_BITS);
3589 if (!p) {
3590 pd = IO_MEM_UNASSIGNED;
3591 } else {
3592 pd = p->phys_offset;
3595 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
3596 if (done || bounce.buffer) {
3597 break;
3599 bounce.buffer = qemu_memalign(TARGET_PAGE_SIZE, TARGET_PAGE_SIZE);
3600 bounce.addr = addr;
3601 bounce.len = l;
3602 if (!is_write) {
3603 cpu_physical_memory_rw(addr, bounce.buffer, l, 0);
3605 ptr = bounce.buffer;
3606 } else {
3607 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
3608 ptr = qemu_get_ram_ptr(addr1);
3610 if (!done) {
3611 ret = ptr;
3612 } else if (ret + done != ptr) {
3613 break;
3616 len -= l;
3617 addr += l;
3618 done += l;
3620 *plen = done;
3621 return ret;
3624 /* Unmaps a memory region previously mapped by cpu_physical_memory_map().
3625 * Will also mark the memory as dirty if is_write == 1. access_len gives
3626 * the amount of memory that was actually read or written by the caller.
3628 void cpu_physical_memory_unmap(void *buffer, target_phys_addr_t len,
3629 int is_write, target_phys_addr_t access_len)
3631 unsigned long flush_len = (unsigned long)access_len;
3633 if (buffer != bounce.buffer) {
3634 if (is_write) {
3635 ram_addr_t addr1 = qemu_ram_addr_from_host(buffer);
3636 while (access_len) {
3637 unsigned l;
3638 l = TARGET_PAGE_SIZE;
3639 if (l > access_len)
3640 l = access_len;
3641 if (!cpu_physical_memory_is_dirty(addr1)) {
3642 /* invalidate code */
3643 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
3644 /* set dirty bit */
3645 phys_ram_dirty[addr1 >> TARGET_PAGE_BITS] |=
3646 (0xff & ~CODE_DIRTY_FLAG);
3648 addr1 += l;
3649 access_len -= l;
3651 dma_flush_range((unsigned long)buffer,
3652 (unsigned long)buffer + flush_len);
3654 return;
3656 if (is_write) {
3657 cpu_physical_memory_write(bounce.addr, bounce.buffer, access_len);
3659 qemu_vfree(bounce.buffer);
3660 bounce.buffer = NULL;
3661 cpu_notify_map_clients();
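/* Illustrative sketch (not part of this file): the zero-copy DMA pattern
 * built on the two functions above, with dma_addr/dma_len and the device
 * transfer being hypothetical:
 *
 *     target_phys_addr_t len = dma_len;
 *     void *buf = cpu_physical_memory_map(dma_addr, &len, is_write);
 *     if (buf) {
 *         ... transfer up to 'len' bytes through 'buf' ...
 *         cpu_physical_memory_unmap(buf, len, is_write, actual_len);
 *     } else {
 *         cpu_register_map_client(s, retry_cb);  // retry once the bounce
 *                                                // buffer is free again
 *     }
 */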
3664 /* warning: addr must be aligned */
3665 uint32_t ldl_phys(target_phys_addr_t addr)
3667 int io_index;
3668 uint8_t *ptr;
3669 uint32_t val;
3670 unsigned long pd;
3671 PhysPageDesc *p;
3673 p = phys_page_find(addr >> TARGET_PAGE_BITS);
3674 if (!p) {
3675 pd = IO_MEM_UNASSIGNED;
3676 } else {
3677 pd = p->phys_offset;
3680 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
3681 !(pd & IO_MEM_ROMD)) {
3682 /* I/O case */
3683 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
3684 if (p)
3685 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3686 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
3687 } else {
3688 /* RAM case */
3689 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
3690 (addr & ~TARGET_PAGE_MASK);
3691 val = ldl_p(ptr);
3693 return val;
3696 /* warning: addr must be aligned */
3697 uint64_t ldq_phys(target_phys_addr_t addr)
3699 int io_index;
3700 uint8_t *ptr;
3701 uint64_t val;
3702 unsigned long pd;
3703 PhysPageDesc *p;
3705 p = phys_page_find(addr >> TARGET_PAGE_BITS);
3706 if (!p) {
3707 pd = IO_MEM_UNASSIGNED;
3708 } else {
3709 pd = p->phys_offset;
3712 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
3713 !(pd & IO_MEM_ROMD)) {
3714 /* I/O case */
3715 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
3716 if (p)
3717 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3718 #ifdef TARGET_WORDS_BIGENDIAN
3719 val = (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr) << 32;
3720 val |= io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4);
3721 #else
3722 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
3723 val |= (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4) << 32;
3724 #endif
3725 } else {
3726 /* RAM case */
3727 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
3728 (addr & ~TARGET_PAGE_MASK);
3729 val = ldq_p(ptr);
3731 return val;
3734 /* XXX: optimize */
3735 uint32_t ldub_phys(target_phys_addr_t addr)
3737 uint8_t val;
3738 cpu_physical_memory_read(addr, &val, 1);
3739 return val;
3742 /* XXX: optimize */
3743 uint32_t lduw_phys(target_phys_addr_t addr)
3745 uint16_t val;
3746 cpu_physical_memory_read(addr, (uint8_t *)&val, 2);
3747 return tswap16(val);
3750 /* warning: addr must be aligned. The ram page is not masked as dirty
3751 and the code inside is not invalidated. It is useful if the dirty
3752 bits are used to track modified PTEs */
3753 void stl_phys_notdirty(target_phys_addr_t addr, uint32_t val)
3755 int io_index;
3756 uint8_t *ptr;
3757 unsigned long pd;
3758 PhysPageDesc *p;
3760 p = phys_page_find(addr >> TARGET_PAGE_BITS);
3761 if (!p) {
3762 pd = IO_MEM_UNASSIGNED;
3763 } else {
3764 pd = p->phys_offset;
3767 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
3768 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
3769 if (p)
3770 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3771 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
3772 } else {
3773 unsigned long addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
3774 ptr = qemu_get_ram_ptr(addr1);
3775 stl_p(ptr, val);
3777 if (unlikely(in_migration)) {
3778 if (!cpu_physical_memory_is_dirty(addr1)) {
3779 /* invalidate code */
3780 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
3781 /* set dirty bit */
3782 phys_ram_dirty[addr1 >> TARGET_PAGE_BITS] |=
3783 (0xff & ~CODE_DIRTY_FLAG);
3789 void stq_phys_notdirty(target_phys_addr_t addr, uint64_t val)
3791 int io_index;
3792 uint8_t *ptr;
3793 unsigned long pd;
3794 PhysPageDesc *p;
3796 p = phys_page_find(addr >> TARGET_PAGE_BITS);
3797 if (!p) {
3798 pd = IO_MEM_UNASSIGNED;
3799 } else {
3800 pd = p->phys_offset;
3803 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
3804 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
3805 if (p)
3806 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3807 #ifdef TARGET_WORDS_BIGENDIAN
3808 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val >> 32);
3809 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val);
3810 #else
3811 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
3812 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val >> 32);
3813 #endif
3814 } else {
3815 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
3816 (addr & ~TARGET_PAGE_MASK);
3817 stq_p(ptr, val);
3821 /* warning: addr must be aligned */
3822 void stl_phys(target_phys_addr_t addr, uint32_t val)
3824 int io_index;
3825 uint8_t *ptr;
3826 unsigned long pd;
3827 PhysPageDesc *p;
3829 p = phys_page_find(addr >> TARGET_PAGE_BITS);
3830 if (!p) {
3831 pd = IO_MEM_UNASSIGNED;
3832 } else {
3833 pd = p->phys_offset;
3836 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
3837 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
3838 if (p)
3839 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3840 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
3841 } else {
3842 unsigned long addr1;
3843 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
3844 /* RAM case */
3845 ptr = qemu_get_ram_ptr(addr1);
3846 stl_p(ptr, val);
3847 if (!cpu_physical_memory_is_dirty(addr1)) {
3848 /* invalidate code */
3849 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
3850 /* set dirty bit */
3851 phys_ram_dirty[addr1 >> TARGET_PAGE_BITS] |=
3852 (0xff & ~CODE_DIRTY_FLAG);
3857 /* XXX: optimize */
3858 void stb_phys(target_phys_addr_t addr, uint32_t val)
3860 uint8_t v = val;
3861 cpu_physical_memory_write(addr, &v, 1);
3864 /* XXX: optimize */
3865 void stw_phys(target_phys_addr_t addr, uint32_t val)
3867 uint16_t v = tswap16(val);
3868 cpu_physical_memory_write(addr, (const uint8_t *)&v, 2);
3871 /* XXX: optimize */
3872 void stq_phys(target_phys_addr_t addr, uint64_t val)
3874 val = tswap64(val);
3875 cpu_physical_memory_write(addr, (const uint8_t *)&val, 8);
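/* Illustrative sketch (not part of this file): device models typically use
 * these helpers for small, naturally aligned guest fields, e.g. updating a
 * hypothetical ring descriptor (DONE_BIT is made up):
 *
 *     uint32_t status = ldl_phys(desc_addr);
 *     stl_phys(desc_addr, status | DONE_BIT);
 *
 * The load/store variants byte-swap to and from guest endianness as
 * needed. */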
3878 /* virtual memory access for debug (includes writing to ROM) */
3879 int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
3880 uint8_t *buf, int len, int is_write)
3882 int l;
3883 target_phys_addr_t phys_addr;
3884 target_ulong page;
3886 while (len > 0) {
3887 page = addr & TARGET_PAGE_MASK;
3888 phys_addr = cpu_get_phys_page_debug(env, page);
3889 /* if no physical page mapped, return an error */
3890 if (phys_addr == -1)
3891 return -1;
3892 l = (page + TARGET_PAGE_SIZE) - addr;
3893 if (l > len)
3894 l = len;
3895 phys_addr += (addr & ~TARGET_PAGE_MASK);
3896 if (is_write)
3897 cpu_physical_memory_write_rom(phys_addr, buf, l);
3898 else
3899 cpu_physical_memory_rw(phys_addr, buf, l, is_write);
3900 len -= l;
3901 buf += l;
3902 addr += l;
3904 return 0;
3906 #endif
3908 /* in deterministic execution mode, instructions doing device I/Os
3909 must be at the end of the TB */
3910 void cpu_io_recompile(CPUState *env, void *retaddr)
3912 TranslationBlock *tb;
3913 uint32_t n, cflags;
3914 target_ulong pc, cs_base;
3915 uint64_t flags;
3917 tb = tb_find_pc((unsigned long)retaddr);
3918 if (!tb) {
3919 cpu_abort(env, "cpu_io_recompile: could not find TB for pc=%p",
3920 retaddr);
3922 n = env->icount_decr.u16.low + tb->icount;
3923 cpu_restore_state(tb, env, (unsigned long)retaddr, NULL);
3924 /* Calculate how many instructions had been executed before the fault
3925 occurred. */
3926 n = n - env->icount_decr.u16.low;
3927 /* Generate a new TB ending on the I/O insn. */
3928 n++;
3929 /* On MIPS and SH, delay slot instructions can only be restarted if
3930 they were already the first instruction in the TB. If this is not
3931 the first instruction in a TB then re-execute the preceding
3932 branch. */
3933 #if defined(TARGET_MIPS)
3934 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
3935 env->active_tc.PC -= 4;
3936 env->icount_decr.u16.low++;
3937 env->hflags &= ~MIPS_HFLAG_BMASK;
3939 #elif defined(TARGET_SH4)
3940 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
3941 && n > 1) {
3942 env->pc -= 2;
3943 env->icount_decr.u16.low++;
3944 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
3946 #endif
3947 /* This should never happen. */
3948 if (n > CF_COUNT_MASK)
3949 cpu_abort(env, "TB too big during recompile");
3951 cflags = n | CF_LAST_IO;
3952 pc = tb->pc;
3953 cs_base = tb->cs_base;
3954 flags = tb->flags;
3955 tb_phys_invalidate(tb, -1);
3956 /* FIXME: In theory this could raise an exception. In practice
3957 we have already translated the block once so it's probably ok. */
3958 tb_gen_code(env, pc, cs_base, flags, cflags);
3959 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
3960 the first in the TB) then we end up generating a whole new TB and
3961 repeating the fault, which is horribly inefficient.
3962 Better would be to execute just this insn uncached, or generate a
3963 second new TB. */
3964 cpu_resume_from_signal(env, NULL);
3967 #if !defined(CONFIG_USER_ONLY)
3969 void dump_exec_info(FILE *f,
3970 int (*cpu_fprintf)(FILE *f, const char *fmt, ...))
3972 int i, target_code_size, max_target_code_size;
3973 int direct_jmp_count, direct_jmp2_count, cross_page;
3974 TranslationBlock *tb;
3976 target_code_size = 0;
3977 max_target_code_size = 0;
3978 cross_page = 0;
3979 direct_jmp_count = 0;
3980 direct_jmp2_count = 0;
3981 for(i = 0; i < nb_tbs; i++) {
3982 tb = &tbs[i];
3983 target_code_size += tb->size;
3984 if (tb->size > max_target_code_size)
3985 max_target_code_size = tb->size;
3986 if (tb->page_addr[1] != -1)
3987 cross_page++;
3988 if (tb->tb_next_offset[0] != 0xffff) {
3989 direct_jmp_count++;
3990 if (tb->tb_next_offset[1] != 0xffff) {
3991 direct_jmp2_count++;
3995 /* XXX: avoid using doubles ? */
3996 cpu_fprintf(f, "Translation buffer state:\n");
3997 cpu_fprintf(f, "gen code size %ld/%ld\n",
3998 code_gen_ptr - code_gen_buffer, code_gen_buffer_max_size);
3999 cpu_fprintf(f, "TB count %d/%d\n",
4000 nb_tbs, code_gen_max_blocks);
4001 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
4002 nb_tbs ? target_code_size / nb_tbs : 0,
4003 max_target_code_size);
4004 cpu_fprintf(f, "TB avg host size %d bytes (expansion ratio: %0.1f)\n",
4005 nb_tbs ? (code_gen_ptr - code_gen_buffer) / nb_tbs : 0,
4006 target_code_size ? (double) (code_gen_ptr - code_gen_buffer) / target_code_size : 0);
4007 cpu_fprintf(f, "cross page TB count %d (%d%%)\n",
4008 cross_page,
4009 nb_tbs ? (cross_page * 100) / nb_tbs : 0);
4010 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
4011 direct_jmp_count,
4012 nb_tbs ? (direct_jmp_count * 100) / nb_tbs : 0,
4013 direct_jmp2_count,
4014 nb_tbs ? (direct_jmp2_count * 100) / nb_tbs : 0);
4015 cpu_fprintf(f, "\nStatistics:\n");
4016 cpu_fprintf(f, "TB flush count %d\n", tb_flush_count);
4017 cpu_fprintf(f, "TB invalidate count %d\n", tb_phys_invalidate_count);
4018 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
4019 #ifdef CONFIG_PROFILER
4020 tcg_dump_info(f, cpu_fprintf);
4021 #endif
4024 #define MMUSUFFIX _cmmu
4025 #define GETPC() NULL
4026 #define env cpu_single_env
4027 #define SOFTMMU_CODE_ACCESS
4029 #define SHIFT 0
4030 #include "softmmu_template.h"
4032 #define SHIFT 1
4033 #include "softmmu_template.h"
4035 #define SHIFT 2
4036 #include "softmmu_template.h"
4038 #define SHIFT 3
4039 #include "softmmu_template.h"
4041 #undef env
4043 #endif