1 /* 2 * internal execution defines for qemu 3 * 4 * Copyright (c) 2003 Fabrice Bellard 5 * 6 * This library is free software; you can redistribute it and/or 7 * modify it under the terms of the GNU Lesser General Public 8 * License as published by the Free Software Foundation; either 9 * version 2 of the License, or (at your option) any later version. 10 * 11 * This library is distributed in the hope that it will be useful, 12 * but WITHOUT ANY WARRANTY; without even the implied warranty of 13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14 * Lesser General Public License for more details. 15 * 16 * You should have received a copy of the GNU Lesser General Public 17 * License along with this library; if not, see <http://www.gnu.org/licenses/>. 18 */ 19 20 #ifndef _EXEC_ALL_H_ 21 #define _EXEC_ALL_H_ 22 23 #include "qemu-common.h" 24 25 /* allow to see translation results - the slowdown should be negligible, so we leave it */ 26 #define DEBUG_DISAS 27 28 /* Page tracking code uses ram addresses in system mode, and virtual 29 addresses in userspace mode. Define tb_page_addr_t to be an appropriate 30 type. */ 31 #if defined(CONFIG_USER_ONLY) 32 typedef abi_ulong tb_page_addr_t; 33 #else 34 typedef ram_addr_t tb_page_addr_t; 35 #endif 36 37 /* is_jmp field values */ 38 #define DISAS_NEXT 0 /* next instruction can be analyzed */ 39 #define DISAS_JUMP 1 /* only pc was modified dynamically */ 40 #define DISAS_UPDATE 2 /* cpu state was modified dynamically */ 41 #define DISAS_TB_JUMP 3 /* only pc was modified statically */ 42 43 struct TranslationBlock; 44 typedef struct TranslationBlock TranslationBlock; 45 46 /* XXX: make safe guess about sizes */ 47 #define MAX_OP_PER_INSTR 266 48 49 #if HOST_LONG_BITS == 32 50 #define MAX_OPC_PARAM_PER_ARG 2 51 #else 52 #define MAX_OPC_PARAM_PER_ARG 1 53 #endif 54 #define MAX_OPC_PARAM_IARGS 5 55 #define MAX_OPC_PARAM_OARGS 1 56 #define MAX_OPC_PARAM_ARGS (MAX_OPC_PARAM_IARGS + MAX_OPC_PARAM_OARGS) 57 58 /* A Call op needs up to 4 + 2N parameters on 32-bit archs, 59 * and up to 4 + N parameters on 64-bit archs 60 * (N = number of input arguments + output arguments). */ 61 #define MAX_OPC_PARAM (4 + (MAX_OPC_PARAM_PER_ARG * MAX_OPC_PARAM_ARGS)) 62 #define OPC_BUF_SIZE 640 63 #define OPC_MAX_SIZE (OPC_BUF_SIZE - MAX_OP_PER_INSTR) 64 65 /* Maximum size a TCG op can expand to. This is complicated because a 66 single op may require several host instructions and register reloads. 67 For now take a wild guess at 192 bytes, which should allow at least 68 a couple of fixup instructions per argument. */ 69 #define TCG_MAX_OP_SIZE 192 70 71 #define OPPARAM_BUF_SIZE (OPC_BUF_SIZE * MAX_OPC_PARAM) 72 73 #include "qemu/log.h" 74 75 void gen_intermediate_code(CPUArchState *env, struct TranslationBlock *tb); 76 void gen_intermediate_code_pc(CPUArchState *env, struct TranslationBlock *tb); 77 void restore_state_to_opc(CPUArchState *env, struct TranslationBlock *tb, 78 int pc_pos); 79 80 void cpu_gen_init(void); 81 int cpu_gen_code(CPUArchState *env, struct TranslationBlock *tb, 82 int *gen_code_size_ptr); 83 bool cpu_restore_state(CPUState *cpu, uintptr_t searched_pc); 84 void page_size_init(void); 85 86 void QEMU_NORETURN cpu_resume_from_signal(CPUState *cpu, void *puc); 87 void QEMU_NORETURN cpu_io_recompile(CPUState *cpu, uintptr_t retaddr); 88 TranslationBlock *tb_gen_code(CPUState *cpu, 89 target_ulong pc, target_ulong cs_base, int flags, 90 int cflags); 91 void cpu_exec_init(CPUArchState *env); 92 void QEMU_NORETURN cpu_loop_exit(CPUState *cpu); 93 94 #if !defined(CONFIG_USER_ONLY) 95 bool qemu_in_vcpu_thread(void); 96 void cpu_reload_memory_map(CPUState *cpu); 97 void tcg_cpu_address_space_init(CPUState *cpu, AddressSpace *as); 98 /* cputlb.c */ 99 void tlb_flush_page(CPUState *cpu, target_ulong addr); 100 void tlb_flush(CPUState *cpu, int flush_global); 101 void tlb_set_page(CPUState *cpu, target_ulong vaddr, 102 hwaddr paddr, int prot, 103 int mmu_idx, target_ulong size); 104 void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr, 105 hwaddr paddr, MemTxAttrs attrs, 106 int prot, int mmu_idx, target_ulong size); 107 void tb_invalidate_phys_addr(AddressSpace *as, hwaddr addr); 108 void probe_write(CPUArchState *env, target_ulong addr, int mmu_idx, 109 uintptr_t retaddr); 110 #else 111 static inline void tlb_flush_page(CPUState *cpu, target_ulong addr) 112 { 113 } 114 115 static inline void tlb_flush(CPUState *cpu, int flush_global) 116 { 117 } 118 #endif 119 120 #define CODE_GEN_ALIGN 16 /* must be >= of the size of a icache line */ 121 122 #define CODE_GEN_PHYS_HASH_BITS 15 123 #define CODE_GEN_PHYS_HASH_SIZE (1 << CODE_GEN_PHYS_HASH_BITS) 124 125 /* estimated block size for TB allocation */ 126 /* XXX: use a per code average code fragment size and modulate it 127 according to the host CPU */ 128 #if defined(CONFIG_SOFTMMU) 129 #define CODE_GEN_AVG_BLOCK_SIZE 128 130 #else 131 #define CODE_GEN_AVG_BLOCK_SIZE 64 132 #endif 133 134 #if defined(__arm__) || defined(_ARCH_PPC) \ 135 || defined(__x86_64__) || defined(__i386__) \ 136 || defined(__sparc__) || defined(__aarch64__) \ 137 || defined(__s390x__) || defined(__mips__) \ 138 || defined(CONFIG_TCG_INTERPRETER) 139 #define USE_DIRECT_JUMP 140 #endif 141 142 struct TranslationBlock { 143 target_ulong pc; /* simulated PC corresponding to this block (EIP + CS base) */ 144 target_ulong cs_base; /* CS base for this block */ 145 uint64_t flags; /* flags defining in which context the code was generated */ 146 uint16_t size; /* size of target code for this block (1 <= 147 size <= TARGET_PAGE_SIZE) */ 148 uint16_t icount; 149 uint32_t cflags; /* compile flags */ 150 #define CF_COUNT_MASK 0x7fff 151 #define CF_LAST_IO 0x8000 /* Last insn may be an IO access. */ 152 #define CF_NOCACHE 0x10000 /* To be freed after execution */ 153 #define CF_USE_ICOUNT 0x20000 154 155 void *tc_ptr; /* pointer to the translated code */ 156 /* next matching tb for physical address. */ 157 struct TranslationBlock *phys_hash_next; 158 /* first and second physical page containing code. The lower bit 159 of the pointer tells the index in page_next[] */ 160 struct TranslationBlock *page_next[2]; 161 tb_page_addr_t page_addr[2]; 162 163 /* the following data are used to directly call another TB from 164 the code of this one. */ 165 uint16_t tb_next_offset[2]; /* offset of original jump target */ 166 #ifdef USE_DIRECT_JUMP 167 uint16_t tb_jmp_offset[2]; /* offset of jump instruction */ 168 #else 169 uintptr_t tb_next[2]; /* address of jump generated code */ 170 #endif 171 /* list of TBs jumping to this one. This is a circular list using 172 the two least significant bits of the pointers to tell what is 173 the next pointer: 0 = jmp_next[0], 1 = jmp_next[1], 2 = 174 jmp_first */ 175 struct TranslationBlock *jmp_next[2]; 176 struct TranslationBlock *jmp_first; 177 }; 178 179 #include "exec/spinlock.h" 180 181 typedef struct TBContext TBContext; 182 183 struct TBContext { 184 185 TranslationBlock *tbs; 186 TranslationBlock *tb_phys_hash[CODE_GEN_PHYS_HASH_SIZE]; 187 int nb_tbs; 188 /* any access to the tbs or the page table must use this lock */ 189 spinlock_t tb_lock; 190 191 /* statistics */ 192 int tb_flush_count; 193 int tb_phys_invalidate_count; 194 195 int tb_invalidated_flag; 196 }; 197 198 static inline unsigned int tb_jmp_cache_hash_page(target_ulong pc) 199 { 200 target_ulong tmp; 201 tmp = pc ^ (pc >> (TARGET_PAGE_BITS - TB_JMP_PAGE_BITS)); 202 return (tmp >> (TARGET_PAGE_BITS - TB_JMP_PAGE_BITS)) & TB_JMP_PAGE_MASK; 203 } 204 205 static inline unsigned int tb_jmp_cache_hash_func(target_ulong pc) 206 { 207 target_ulong tmp; 208 tmp = pc ^ (pc >> (TARGET_PAGE_BITS - TB_JMP_PAGE_BITS)); 209 return (((tmp >> (TARGET_PAGE_BITS - TB_JMP_PAGE_BITS)) & TB_JMP_PAGE_MASK) 210 | (tmp & TB_JMP_ADDR_MASK)); 211 } 212 213 static inline unsigned int tb_phys_hash_func(tb_page_addr_t pc) 214 { 215 return (pc >> 2) & (CODE_GEN_PHYS_HASH_SIZE - 1); 216 } 217 218 void tb_free(TranslationBlock *tb); 219 void tb_flush(CPUArchState *env); 220 void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr); 221 222 #if defined(USE_DIRECT_JUMP) 223 224 #if defined(CONFIG_TCG_INTERPRETER) 225 static inline void tb_set_jmp_target1(uintptr_t jmp_addr, uintptr_t addr) 226 { 227 /* patch the branch destination */ 228 *(uint32_t *)jmp_addr = addr - (jmp_addr + 4); 229 /* no need to flush icache explicitly */ 230 } 231 #elif defined(_ARCH_PPC) 232 void ppc_tb_set_jmp_target(uintptr_t jmp_addr, uintptr_t addr); 233 #define tb_set_jmp_target1 ppc_tb_set_jmp_target 234 #elif defined(__i386__) || defined(__x86_64__) 235 static inline void tb_set_jmp_target1(uintptr_t jmp_addr, uintptr_t addr) 236 { 237 /* patch the branch destination */ 238 stl_le_p((void*)jmp_addr, addr - (jmp_addr + 4)); 239 /* no need to flush icache explicitly */ 240 } 241 #elif defined(__s390x__) 242 static inline void tb_set_jmp_target1(uintptr_t jmp_addr, uintptr_t addr) 243 { 244 /* patch the branch destination */ 245 intptr_t disp = addr - (jmp_addr - 2); 246 stl_be_p((void*)jmp_addr, disp / 2); 247 /* no need to flush icache explicitly */ 248 } 249 #elif defined(__aarch64__) 250 void aarch64_tb_set_jmp_target(uintptr_t jmp_addr, uintptr_t addr); 251 #define tb_set_jmp_target1 aarch64_tb_set_jmp_target 252 #elif defined(__arm__) 253 static inline void tb_set_jmp_target1(uintptr_t jmp_addr, uintptr_t addr) 254 { 255 #if !QEMU_GNUC_PREREQ(4, 1) 256 register unsigned long _beg __asm ("a1"); 257 register unsigned long _end __asm ("a2"); 258 register unsigned long _flg __asm ("a3"); 259 #endif 260 261 /* we could use a ldr pc, [pc, #-4] kind of branch and avoid the flush */ 262 *(uint32_t *)jmp_addr = 263 (*(uint32_t *)jmp_addr & ~0xffffff) 264 | (((addr - (jmp_addr + 8)) >> 2) & 0xffffff); 265 266 #if QEMU_GNUC_PREREQ(4, 1) 267 __builtin___clear_cache((char *) jmp_addr, (char *) jmp_addr + 4); 268 #else 269 /* flush icache */ 270 _beg = jmp_addr; 271 _end = jmp_addr + 4; 272 _flg = 0; 273 __asm __volatile__ ("swi 0x9f0002" : : "r" (_beg), "r" (_end), "r" (_flg)); 274 #endif 275 } 276 #elif defined(__sparc__) || defined(__mips__) 277 void tb_set_jmp_target1(uintptr_t jmp_addr, uintptr_t addr); 278 #else 279 #error tb_set_jmp_target1 is missing 280 #endif 281 282 static inline void tb_set_jmp_target(TranslationBlock *tb, 283 int n, uintptr_t addr) 284 { 285 uint16_t offset = tb->tb_jmp_offset[n]; 286 tb_set_jmp_target1((uintptr_t)(tb->tc_ptr + offset), addr); 287 } 288 289 #else 290 291 /* set the jump target */ 292 static inline void tb_set_jmp_target(TranslationBlock *tb, 293 int n, uintptr_t addr) 294 { 295 tb->tb_next[n] = addr; 296 } 297 298 #endif 299 300 static inline void tb_add_jump(TranslationBlock *tb, int n, 301 TranslationBlock *tb_next) 302 { 303 /* NOTE: this test is only needed for thread safety */ 304 if (!tb->jmp_next[n]) { 305 /* patch the native jump address */ 306 tb_set_jmp_target(tb, n, (uintptr_t)tb_next->tc_ptr); 307 308 /* add in TB jmp circular list */ 309 tb->jmp_next[n] = tb_next->jmp_first; 310 tb_next->jmp_first = (TranslationBlock *)((uintptr_t)(tb) | (n)); 311 } 312 } 313 314 /* GETRA is the true target of the return instruction that we'll execute, 315 defined here for simplicity of defining the follow-up macros. */ 316 #if defined(CONFIG_TCG_INTERPRETER) 317 extern uintptr_t tci_tb_ptr; 318 # define GETRA() tci_tb_ptr 319 #else 320 # define GETRA() \ 321 ((uintptr_t)__builtin_extract_return_addr(__builtin_return_address(0))) 322 #endif 323 324 /* The true return address will often point to a host insn that is part of 325 the next translated guest insn. Adjust the address backward to point to 326 the middle of the call insn. Subtracting one would do the job except for 327 several compressed mode architectures (arm, mips) which set the low bit 328 to indicate the compressed mode; subtracting two works around that. It 329 is also the case that there are no host isas that contain a call insn 330 smaller than 4 bytes, so we don't worry about special-casing this. */ 331 #if defined(CONFIG_TCG_INTERPRETER) 332 # define GETPC_ADJ 0 333 #else 334 # define GETPC_ADJ 2 335 #endif 336 337 #define GETPC() (GETRA() - GETPC_ADJ) 338 339 #if !defined(CONFIG_USER_ONLY) 340 341 void phys_mem_set_alloc(void *(*alloc)(size_t, uint64_t *align)); 342 343 struct MemoryRegion *iotlb_to_region(CPUState *cpu, 344 hwaddr index); 345 346 void tlb_fill(CPUState *cpu, target_ulong addr, int is_write, int mmu_idx, 347 uintptr_t retaddr); 348 349 #endif 350 351 #if defined(CONFIG_USER_ONLY) 352 static inline tb_page_addr_t get_page_addr_code(CPUArchState *env1, target_ulong addr) 353 { 354 return addr; 355 } 356 #else 357 /* cputlb.c */ 358 tb_page_addr_t get_page_addr_code(CPUArchState *env1, target_ulong addr); 359 #endif 360 361 /* vl.c */ 362 extern int singlestep; 363 364 /* cpu-exec.c */ 365 extern volatile sig_atomic_t exit_request; 366 367 /** 368 * cpu_can_do_io: 369 * @cpu: The CPU for which to check IO. 370 * 371 * Deterministic execution requires that IO only be performed on the last 372 * instruction of a TB so that interrupts take effect immediately. 373 * 374 * Returns: %true if memory-mapped IO is safe, %false otherwise. 375 */ 376 static inline bool cpu_can_do_io(CPUState *cpu) 377 { 378 if (!use_icount) { 379 return true; 380 } 381 /* If not executing code then assume we are ok. */ 382 if (cpu->current_tb == NULL) { 383 return true; 384 } 385 return cpu->can_do_io != 0; 386 } 387 388 #endif 389