2 * internal execution defines for qemu
4 * Copyright (c) 2003 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
/* allow the translation results to be inspected - the slowdown should be negligible, so we leave it enabled */
24 /* is_jmp field values */
25 #define DISAS_NEXT 0 /* next instruction can be analyzed */
26 #define DISAS_JUMP 1 /* only pc was modified dynamically */
27 #define DISAS_UPDATE 2 /* cpu state was modified dynamically */
28 #define DISAS_TB_JUMP 3 /* only pc was modified statically */
30 struct TranslationBlock
;
32 /* XXX: make safe guess about sizes */
33 #define MAX_OP_PER_INSTR 32
34 /* A Call op needs up to 6 + 2N parameters (N = number of arguments). */
35 #define MAX_OPC_PARAM 10
36 #define OPC_BUF_SIZE 512
37 #define OPC_MAX_SIZE (OPC_BUF_SIZE - MAX_OP_PER_INSTR)
/* Maximum size a TCG op can expand to.  This is complicated because a
   single op may require several host instructions and register reloads.
   For now take a wild guess at 128 bytes, which should allow at least
   a couple of fixup instructions per argument.  */
43 #define TCG_MAX_OP_SIZE 128
45 #define OPPARAM_BUF_SIZE (OPC_BUF_SIZE * MAX_OPC_PARAM)
47 extern target_ulong gen_opc_pc
[OPC_BUF_SIZE
];
48 extern target_ulong gen_opc_npc
[OPC_BUF_SIZE
];
49 extern uint8_t gen_opc_cc_op
[OPC_BUF_SIZE
];
50 extern uint8_t gen_opc_instr_start
[OPC_BUF_SIZE
];
51 extern target_ulong gen_opc_jump_pc
[2];
52 extern uint32_t gen_opc_hflags
[OPC_BUF_SIZE
];
54 typedef void (GenOpFunc
)(void);
55 typedef void (GenOpFunc1
)(long);
56 typedef void (GenOpFunc2
)(long, long);
57 typedef void (GenOpFunc3
)(long, long, long);
59 #if defined(TARGET_I386)
61 void optimize_flags_init(void);
68 int gen_intermediate_code(CPUState
*env
, struct TranslationBlock
*tb
);
69 int gen_intermediate_code_pc(CPUState
*env
, struct TranslationBlock
*tb
);
70 unsigned long code_gen_max_block_size(void);
71 void cpu_gen_init(void);
72 int cpu_gen_code(CPUState
*env
, struct TranslationBlock
*tb
,
73 int *gen_code_size_ptr
);
74 int cpu_restore_state(struct TranslationBlock
*tb
,
75 CPUState
*env
, unsigned long searched_pc
,
77 int cpu_gen_code_copy(CPUState
*env
, struct TranslationBlock
*tb
,
78 int max_code_size
, int *gen_code_size_ptr
);
79 int cpu_restore_state_copy(struct TranslationBlock
*tb
,
80 CPUState
*env
, unsigned long searched_pc
,
82 void cpu_resume_from_signal(CPUState
*env1
, void *puc
);
83 void cpu_exec_init(CPUState
*env
);
84 int page_unprotect(target_ulong address
, unsigned long pc
, void *puc
);
85 void tb_invalidate_phys_page_range(target_ulong start
, target_ulong end
,
86 int is_cpu_write_access
);
87 void tb_invalidate_page_range(target_ulong start
, target_ulong end
);
88 void tlb_flush_page(CPUState
*env
, target_ulong addr
);
89 void tlb_flush(CPUState
*env
, int flush_global
);
90 int tlb_set_page_exec(CPUState
*env
, target_ulong vaddr
,
91 target_phys_addr_t paddr
, int prot
,
92 int mmu_idx
, int is_softmmu
);
93 static inline int tlb_set_page(CPUState
*env
, target_ulong vaddr
,
94 target_phys_addr_t paddr
, int prot
,
95 int mmu_idx
, int is_softmmu
)
99 return tlb_set_page_exec(env
, vaddr
, paddr
, prot
, mmu_idx
, is_softmmu
);
102 #define CODE_GEN_ALIGN 16 /* must be >= the size of an icache line */
/* Number of index bits, and the resulting entry count (a power of two),
   of the physical-address hash; tb_phys_hash[] is declared with
   CODE_GEN_PHYS_HASH_SIZE entries and tb_phys_hash_func() masks with
   CODE_GEN_PHYS_HASH_SIZE - 1. */
104 #define CODE_GEN_PHYS_HASH_BITS 15
105 #define CODE_GEN_PHYS_HASH_SIZE (1 << CODE_GEN_PHYS_HASH_BITS)
/* maximum total translated code allocated */
109 /* NOTE: the translated code area cannot be too big because on some
110 archs the range of "fast" function calls is limited. Here is a
111 summary of the ranges:
113 i386 : signed 32 bits
116 sparc : signed 32 bits
117 alpha : signed 23 bits
120 #if defined(__alpha__)
121 #define CODE_GEN_BUFFER_SIZE (2 * 1024 * 1024)
122 #elif defined(__ia64)
123 #define CODE_GEN_BUFFER_SIZE (4 * 1024 * 1024) /* range of addl */
124 #elif defined(__powerpc__)
125 #define CODE_GEN_BUFFER_SIZE (6 * 1024 * 1024)
127 /* XXX: make it dynamic on x86 */
128 #define CODE_GEN_BUFFER_SIZE (16 * 1024 * 1024)
131 //#define CODE_GEN_BUFFER_SIZE (128 * 1024)
133 /* estimated block size for TB allocation */
134 /* XXX: use a per code average code fragment size and modulate it
135 according to the host CPU */
136 #if defined(CONFIG_SOFTMMU)
137 #define CODE_GEN_AVG_BLOCK_SIZE 128
139 #define CODE_GEN_AVG_BLOCK_SIZE 64
142 #define CODE_GEN_MAX_BLOCKS (CODE_GEN_BUFFER_SIZE / CODE_GEN_AVG_BLOCK_SIZE)
144 #if defined(__powerpc__) || defined(__x86_64__)
145 #define USE_DIRECT_JUMP
147 #if defined(__i386__) && !defined(_WIN32)
148 #define USE_DIRECT_JUMP
151 typedef struct TranslationBlock
{
152 target_ulong pc
; /* simulated PC corresponding to this block (EIP + CS base) */
153 target_ulong cs_base
; /* CS base for this block */
154 uint64_t flags
; /* flags defining in which context the code was generated */
155 uint16_t size
; /* size of target code for this block (1 <=
156 size <= TARGET_PAGE_SIZE) */
157 uint16_t cflags
; /* compile flags */
158 #define CF_CODE_COPY 0x0001 /* block was generated in code copy mode */
159 #define CF_TB_FP_USED 0x0002 /* fp ops are used in the TB */
160 #define CF_FP_USED 0x0004 /* fp ops are used in the TB or in a chained TB */
161 #define CF_SINGLE_INSN 0x0008 /* compile only a single instruction */
163 uint8_t *tc_ptr
; /* pointer to the translated code */
164 /* next matching tb for physical address. */
165 struct TranslationBlock
*phys_hash_next
;
166 /* first and second physical page containing code. The lower bit
167 of the pointer tells the index in page_next[] */
168 struct TranslationBlock
*page_next
[2];
169 target_ulong page_addr
[2];
171 /* the following data are used to directly call another TB from
172 the code of this one. */
173 uint16_t tb_next_offset
[2]; /* offset of original jump target */
174 #ifdef USE_DIRECT_JUMP
175 uint16_t tb_jmp_offset
[4]; /* offset of jump instruction */
177 unsigned long tb_next
[2]; /* address of jump generated code */
179 /* list of TBs jumping to this one. This is a circular list using
180 the two least significant bits of the pointers to tell what is
181 the next pointer: 0 = jmp_next[0], 1 = jmp_next[1], 2 =
183 struct TranslationBlock
*jmp_next
[2];
184 struct TranslationBlock
*jmp_first
;
187 static inline unsigned int tb_jmp_cache_hash_page(target_ulong pc
)
190 tmp
= pc
^ (pc
>> (TARGET_PAGE_BITS
- TB_JMP_PAGE_BITS
));
191 return (tmp
>> TB_JMP_PAGE_BITS
) & TB_JMP_PAGE_MASK
;
194 static inline unsigned int tb_jmp_cache_hash_func(target_ulong pc
)
197 tmp
= pc
^ (pc
>> (TARGET_PAGE_BITS
- TB_JMP_PAGE_BITS
));
198 return (((tmp
>> TB_JMP_PAGE_BITS
) & TB_JMP_PAGE_MASK
) |
199 (tmp
& TB_JMP_ADDR_MASK
));
202 static inline unsigned int tb_phys_hash_func(unsigned long pc
)
204 return pc
& (CODE_GEN_PHYS_HASH_SIZE
- 1);
207 TranslationBlock
*tb_alloc(target_ulong pc
);
208 void tb_flush(CPUState
*env
);
209 void tb_link_phys(TranslationBlock
*tb
,
210 target_ulong phys_pc
, target_ulong phys_page2
);
212 extern TranslationBlock
*tb_phys_hash
[CODE_GEN_PHYS_HASH_SIZE
];
214 extern uint8_t code_gen_buffer
[CODE_GEN_BUFFER_SIZE
];
215 extern uint8_t *code_gen_ptr
;
217 #if defined(USE_DIRECT_JUMP)
219 #if defined(__powerpc__)
220 static inline void tb_set_jmp_target1(unsigned long jmp_addr
, unsigned long addr
)
224 /* patch the branch destination */
225 ptr
= (uint32_t *)jmp_addr
;
227 val
= (val
& ~0x03fffffc) | ((addr
- jmp_addr
) & 0x03fffffc);
230 asm volatile ("dcbst 0,%0" : : "r"(ptr
) : "memory");
231 asm volatile ("sync" : : : "memory");
232 asm volatile ("icbi 0,%0" : : "r"(ptr
) : "memory");
233 asm volatile ("sync" : : : "memory");
234 asm volatile ("isync" : : : "memory");
236 #elif defined(__i386__) || defined(__x86_64__)
/*
 * Patch the 32-bit relative displacement stored at jmp_addr so that the
 * jump it belongs to lands on addr.
 *
 * jmp_addr: address of the 4-byte displacement field to overwrite.
 * addr:     address the jump should reach.
 *
 * The value stored is addr - (jmp_addr + 4), i.e. the distance from the
 * end of the displacement field to the target, truncated to 32 bits.
 */
static inline void tb_set_jmp_target1(unsigned long jmp_addr, unsigned long addr)
{
    /* patch the branch destination */
    *(uint32_t *)jmp_addr = addr - (jmp_addr + 4);
    /* no need to flush icache explicitly */
}
245 static inline void tb_set_jmp_target(TranslationBlock
*tb
,
246 int n
, unsigned long addr
)
248 unsigned long offset
;
250 offset
= tb
->tb_jmp_offset
[n
];
251 tb_set_jmp_target1((unsigned long)(tb
->tc_ptr
+ offset
), addr
);
252 offset
= tb
->tb_jmp_offset
[n
+ 2];
253 if (offset
!= 0xffff)
254 tb_set_jmp_target1((unsigned long)(tb
->tc_ptr
+ offset
), addr
);
259 /* set the jump target */
260 static inline void tb_set_jmp_target(TranslationBlock
*tb
,
261 int n
, unsigned long addr
)
263 tb
->tb_next
[n
] = addr
;
268 static inline void tb_add_jump(TranslationBlock
*tb
, int n
,
269 TranslationBlock
*tb_next
)
271 /* NOTE: this test is only needed for thread safety */
272 if (!tb
->jmp_next
[n
]) {
273 /* patch the native jump address */
274 tb_set_jmp_target(tb
, n
, (unsigned long)tb_next
->tc_ptr
);
276 /* add in TB jmp circular list */
277 tb
->jmp_next
[n
] = tb_next
->jmp_first
;
278 tb_next
->jmp_first
= (TranslationBlock
*)((long)(tb
) | (n
));
282 TranslationBlock
*tb_find_pc(unsigned long pc_ptr
);
285 #define offsetof(type, field) ((size_t) &((type *)0)->field)
289 #define ASM_DATA_SECTION ".section \".data\"\n"
290 #define ASM_PREVIOUS_SECTION ".section .text\n"
291 #elif defined(__APPLE__)
292 #define ASM_DATA_SECTION ".data\n"
293 #define ASM_PREVIOUS_SECTION ".text\n"
295 #define ASM_DATA_SECTION ".section \".data\"\n"
296 #define ASM_PREVIOUS_SECTION ".previous\n"
299 #define ASM_OP_LABEL_NAME(n, opname) \
300 ASM_NAME(__op_label) #n "." ASM_NAME(opname)
302 extern CPUWriteMemoryFunc
*io_mem_write
[IO_MEM_NB_ENTRIES
][4];
303 extern CPUReadMemoryFunc
*io_mem_read
[IO_MEM_NB_ENTRIES
][4];
304 extern void *io_mem_opaque
[IO_MEM_NB_ENTRIES
];
306 #if defined(__hppa__)
/* HPPA variant: a spinlock is an array of four ints. */
typedef int spinlock_t[4];

/* Unlocked state: all four words set to 1. */
#define SPIN_LOCK_UNLOCKED { 1, 1, 1, 1 }

/* Put the lock back in its unlocked state by setting every word to 1. */
static inline void resetlock(spinlock_t *p)
{
    (*p)[0] = (*p)[1] = (*p)[2] = (*p)[3] = 1;
}
/* Generic variant: a spinlock is a single int. */
typedef int spinlock_t;

/* Unlocked state. */
#define SPIN_LOCK_UNLOCKED 0

/* Put the lock back in its unlocked state. */
static inline void resetlock(spinlock_t *p)
{
    *p = SPIN_LOCK_UNLOCKED;
}
330 #if defined(__powerpc__)
331 static inline int testandset (int *p
)
334 __asm__
__volatile__ (
342 : "r" (p
), "r" (1), "r" (0)
346 #elif defined(__i386__)
347 static inline int testandset (int *p
)
349 long int readval
= 0;
351 __asm__
__volatile__ ("lock; cmpxchgl %2, %0"
352 : "+m" (*p
), "+a" (readval
)
357 #elif defined(__x86_64__)
358 static inline int testandset (int *p
)
360 long int readval
= 0;
362 __asm__
__volatile__ ("lock; cmpxchgl %2, %0"
363 : "+m" (*p
), "+a" (readval
)
368 #elif defined(__s390__)
369 static inline int testandset (int *p
)
373 __asm__
__volatile__ ("0: cs %0,%1,0(%2)\n"
376 : "r" (1), "a" (p
), "0" (*p
)
380 #elif defined(__alpha__)
381 static inline int testandset (int *p
)
386 __asm__
__volatile__ ("0: mov 1,%2\n"
393 : "=r" (ret
), "=m" (*p
), "=r" (one
)
397 #elif defined(__sparc__)
398 static inline int testandset (int *p
)
402 __asm__
__volatile__("ldstub [%1], %0"
407 return (ret
? 1 : 0);
409 #elif defined(__arm__)
410 static inline int testandset (int *spinlock
)
412 register unsigned int ret
;
413 __asm__
__volatile__("swp %0, %1, [%2]"
415 : "0"(1), "r"(spinlock
));
419 #elif defined(__mc68000)
420 static inline int testandset (int *p
)
423 __asm__
__volatile__("tas %1; sne %0"
429 #elif defined(__hppa__)
431 /* Because malloc only guarantees 8-byte alignment for malloc'd data,
432 and GCC only guarantees 8-byte alignment for stack locals, we can't
433 be assured of 16-byte alignment for atomic lock data even if we
434 specify "__attribute ((aligned(16)))" in the type declaration. So,
435 we use a struct containing an array of four ints for the atomic lock
436 type and dynamically select the 16-byte aligned int from the array
437 for the semaphore. */
438 #define __PA_LDCW_ALIGNMENT 16
439 static inline void *ldcw_align (void *p
) {
440 unsigned long a
= (unsigned long)p
;
441 a
= (a
+ __PA_LDCW_ALIGNMENT
- 1) & ~(__PA_LDCW_ALIGNMENT
- 1);
445 static inline int testandset (spinlock_t
*p
)
449 __asm__
__volatile__("ldcw 0(%1),%0"
456 #elif defined(__ia64)
458 #include "ia64intrin.h"
459 static inline int testandset (int *p
)
461 return (int)cmpxchg_acq(p
,0,1);
463 #elif defined(__mips__)
464 static inline int testandset (int *p
)
468 __asm__
__volatile__ (
477 : "=r" (ret
), "+R" (*p
)
484 #error unimplemented CPU support
487 #if defined(CONFIG_USER_ONLY)
488 static inline void spin_lock(spinlock_t
*lock
)
490 while (testandset(lock
));
493 static inline void spin_unlock(spinlock_t
*lock
)
498 static inline int spin_trylock(spinlock_t
*lock
)
500 return !testandset(lock
);
503 static inline void spin_lock(spinlock_t
*lock
)
507 static inline void spin_unlock(spinlock_t
*lock
)
511 static inline int spin_trylock(spinlock_t
*lock
)
517 extern spinlock_t tb_lock
;
519 extern int tb_invalidated_flag
;
521 #if !defined(CONFIG_USER_ONLY)
523 void tlb_fill(target_ulong addr
, int is_write
, int mmu_idx
,
526 #define ACCESS_TYPE (NB_MMU_MODES + 1)
527 #define MEMSUFFIX _code
528 #define env cpu_single_env
531 #include "softmmu_header.h"
534 #include "softmmu_header.h"
537 #include "softmmu_header.h"
540 #include "softmmu_header.h"
548 #if defined(CONFIG_USER_ONLY)
549 static inline target_ulong
get_phys_addr_code(CPUState
*env
, target_ulong addr
)
554 /* NOTE: this function can trigger an exception */
555 /* NOTE2: the returned address is not exactly the physical address: it
556 is the offset relative to phys_ram_base */
557 static inline target_ulong
get_phys_addr_code(CPUState
*env
, target_ulong addr
)
559 int mmu_idx
, index
, pd
;
561 index
= (addr
>> TARGET_PAGE_BITS
) & (CPU_TLB_SIZE
- 1);
562 mmu_idx
= cpu_mmu_index(env
);
563 if (__builtin_expect(env
->tlb_table
[mmu_idx
][index
].addr_code
!=
564 (addr
& TARGET_PAGE_MASK
), 0)) {
567 pd
= env
->tlb_table
[mmu_idx
][index
].addr_code
& ~TARGET_PAGE_MASK
;
568 if (pd
> IO_MEM_ROM
&& !(pd
& IO_MEM_ROMD
)) {
569 #if defined(TARGET_SPARC) || defined(TARGET_MIPS)
570 do_unassigned_access(addr
, 0, 1, 0);
572 cpu_abort(env
, "Trying to execute code outside RAM or ROM at 0x" TARGET_FMT_lx
"\n", addr
);
575 return addr
+ env
->tlb_table
[mmu_idx
][index
].addend
- (unsigned long)phys_ram_base
;
580 #define KQEMU_MODIFY_PAGE_MASK (0xff & ~(VGA_DIRTY_FLAG | CODE_DIRTY_FLAG))
582 int kqemu_init(CPUState
*env
);
583 int kqemu_cpu_exec(CPUState
*env
);
584 void kqemu_flush_page(CPUState
*env
, target_ulong addr
);
585 void kqemu_flush(CPUState
*env
, int global
);
586 void kqemu_set_notdirty(CPUState
*env
, ram_addr_t ram_addr
);
587 void kqemu_modify_page(CPUState
*env
, ram_addr_t ram_addr
);
588 void kqemu_cpu_interrupt(CPUState
*env
);
589 void kqemu_record_dump(void);
591 static inline int kqemu_is_ok(CPUState
*env
)
593 return(env
->kqemu_enabled
&&
594 (env
->cr
[0] & CR0_PE_MASK
) &&
595 !(env
->hflags
& HF_INHIBIT_IRQ_MASK
) &&
596 (env
->eflags
& IF_MASK
) &&
597 !(env
->eflags
& VM_MASK
) &&
598 (env
->kqemu_enabled
== 2 ||
599 ((env
->hflags
& HF_CPL_MASK
) == 3 &&
600 (env
->eflags
& IOPL_MASK
) != IOPL_MASK
)));