xref: /openbmc/qemu/tcg/tci.c (revision 49bd751497f3b71550b152ef9da0e265a94a64c1)
1 /*
2  * Tiny Code Interpreter for QEMU
3  *
4  * Copyright (c) 2009, 2011, 2016 Stefan Weil
5  *
6  * This program is free software: you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License as published by
8  * the Free Software Foundation, either version 2 of the License, or
9  * (at your option) any later version.
10  *
11  * This program is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  * GNU General Public License for more details.
15  *
16  * You should have received a copy of the GNU General Public License
17  * along with this program.  If not, see <http://www.gnu.org/licenses/>.
18  */
19 
20 #include "qemu/osdep.h"
21 #include "tcg/tcg.h"
22 #include "tcg/helper-info.h"
23 #include "tcg/tcg-ldst.h"
24 #include "disas/dis-asm.h"
25 #include "tcg-has.h"
26 #include <ffi.h>
27 
28 
29 /*
30  * Enable TCI assertions only when debugging TCG (and without NDEBUG defined).
31  * Without assertions, the interpreter runs much faster.
32  */
33 #if defined(CONFIG_DEBUG_TCG)
34 # define tci_assert(cond) assert(cond)
35 #else
36 # define tci_assert(cond) ((void)(cond))
37 #endif
38 
39 __thread uintptr_t tci_tb_ptr;
40 
41 static void tci_write_reg64(tcg_target_ulong *regs, uint32_t high_index,
42                             uint32_t low_index, uint64_t value)
43 {
44     regs[low_index] = (uint32_t)value;
45     regs[high_index] = value >> 32;
46 }
47 
48 /* Create a 64 bit value from two 32 bit values. */
49 static uint64_t tci_uint64(uint32_t high, uint32_t low)
50 {
51     return ((uint64_t)high << 32) + low;
52 }
53 
54 /*
55  * Load sets of arguments all at once.  The naming convention is:
56  *   tci_args_<arguments>
57  * where arguments is a sequence of
58  *
59  *   b = immediate (bit position)
60  *   c = condition (TCGCond)
61  *   i = immediate (uint32_t)
62  *   I = immediate (tcg_target_ulong)
63  *   l = label or pointer
64  *   m = immediate (MemOpIdx)
65  *   n = immediate (call return length)
66  *   r = register
67  *   s = signed ldst offset
68  */
69 
70 static void tci_args_l(uint32_t insn, const void *tb_ptr, void **l0)
71 {
72     int diff = sextract32(insn, 12, 20);
73     *l0 = diff ? (void *)tb_ptr + diff : NULL;
74 }
75 
76 static void tci_args_r(uint32_t insn, TCGReg *r0)
77 {
78     *r0 = extract32(insn, 8, 4);
79 }
80 
81 static void tci_args_nl(uint32_t insn, const void *tb_ptr,
82                         uint8_t *n0, void **l1)
83 {
84     *n0 = extract32(insn, 8, 4);
85     *l1 = sextract32(insn, 12, 20) + (void *)tb_ptr;
86 }
87 
88 static void tci_args_rl(uint32_t insn, const void *tb_ptr,
89                         TCGReg *r0, void **l1)
90 {
91     *r0 = extract32(insn, 8, 4);
92     *l1 = sextract32(insn, 12, 20) + (void *)tb_ptr;
93 }
94 
95 static void tci_args_rr(uint32_t insn, TCGReg *r0, TCGReg *r1)
96 {
97     *r0 = extract32(insn, 8, 4);
98     *r1 = extract32(insn, 12, 4);
99 }
100 
101 static void tci_args_ri(uint32_t insn, TCGReg *r0, tcg_target_ulong *i1)
102 {
103     *r0 = extract32(insn, 8, 4);
104     *i1 = sextract32(insn, 12, 20);
105 }
106 
107 static void tci_args_rrm(uint32_t insn, TCGReg *r0,
108                          TCGReg *r1, MemOpIdx *m2)
109 {
110     *r0 = extract32(insn, 8, 4);
111     *r1 = extract32(insn, 12, 4);
112     *m2 = extract32(insn, 16, 16);
113 }
114 
115 static void tci_args_rrr(uint32_t insn, TCGReg *r0, TCGReg *r1, TCGReg *r2)
116 {
117     *r0 = extract32(insn, 8, 4);
118     *r1 = extract32(insn, 12, 4);
119     *r2 = extract32(insn, 16, 4);
120 }
121 
122 static void tci_args_rrs(uint32_t insn, TCGReg *r0, TCGReg *r1, int32_t *i2)
123 {
124     *r0 = extract32(insn, 8, 4);
125     *r1 = extract32(insn, 12, 4);
126     *i2 = sextract32(insn, 16, 16);
127 }
128 
129 static void tci_args_rrbb(uint32_t insn, TCGReg *r0, TCGReg *r1,
130                           uint8_t *i2, uint8_t *i3)
131 {
132     *r0 = extract32(insn, 8, 4);
133     *r1 = extract32(insn, 12, 4);
134     *i2 = extract32(insn, 16, 6);
135     *i3 = extract32(insn, 22, 6);
136 }
137 
138 static void tci_args_rrrc(uint32_t insn,
139                           TCGReg *r0, TCGReg *r1, TCGReg *r2, TCGCond *c3)
140 {
141     *r0 = extract32(insn, 8, 4);
142     *r1 = extract32(insn, 12, 4);
143     *r2 = extract32(insn, 16, 4);
144     *c3 = extract32(insn, 20, 4);
145 }
146 
147 static void tci_args_rrrbb(uint32_t insn, TCGReg *r0, TCGReg *r1,
148                            TCGReg *r2, uint8_t *i3, uint8_t *i4)
149 {
150     *r0 = extract32(insn, 8, 4);
151     *r1 = extract32(insn, 12, 4);
152     *r2 = extract32(insn, 16, 4);
153     *i3 = extract32(insn, 20, 6);
154     *i4 = extract32(insn, 26, 6);
155 }
156 
157 static void tci_args_rrrr(uint32_t insn,
158                           TCGReg *r0, TCGReg *r1, TCGReg *r2, TCGReg *r3)
159 {
160     *r0 = extract32(insn, 8, 4);
161     *r1 = extract32(insn, 12, 4);
162     *r2 = extract32(insn, 16, 4);
163     *r3 = extract32(insn, 20, 4);
164 }
165 
166 static void tci_args_rrrrrc(uint32_t insn, TCGReg *r0, TCGReg *r1,
167                             TCGReg *r2, TCGReg *r3, TCGReg *r4, TCGCond *c5)
168 {
169     *r0 = extract32(insn, 8, 4);
170     *r1 = extract32(insn, 12, 4);
171     *r2 = extract32(insn, 16, 4);
172     *r3 = extract32(insn, 20, 4);
173     *r4 = extract32(insn, 24, 4);
174     *c5 = extract32(insn, 28, 4);
175 }
176 
177 static void tci_args_rrrrrr(uint32_t insn, TCGReg *r0, TCGReg *r1,
178                             TCGReg *r2, TCGReg *r3, TCGReg *r4, TCGReg *r5)
179 {
180     *r0 = extract32(insn, 8, 4);
181     *r1 = extract32(insn, 12, 4);
182     *r2 = extract32(insn, 16, 4);
183     *r3 = extract32(insn, 20, 4);
184     *r4 = extract32(insn, 24, 4);
185     *r5 = extract32(insn, 28, 4);
186 }
187 
188 static bool tci_compare32(uint32_t u0, uint32_t u1, TCGCond condition)
189 {
190     bool result = false;
191     int32_t i0 = u0;
192     int32_t i1 = u1;
193     switch (condition) {
194     case TCG_COND_EQ:
195         result = (u0 == u1);
196         break;
197     case TCG_COND_NE:
198         result = (u0 != u1);
199         break;
200     case TCG_COND_LT:
201         result = (i0 < i1);
202         break;
203     case TCG_COND_GE:
204         result = (i0 >= i1);
205         break;
206     case TCG_COND_LE:
207         result = (i0 <= i1);
208         break;
209     case TCG_COND_GT:
210         result = (i0 > i1);
211         break;
212     case TCG_COND_LTU:
213         result = (u0 < u1);
214         break;
215     case TCG_COND_GEU:
216         result = (u0 >= u1);
217         break;
218     case TCG_COND_LEU:
219         result = (u0 <= u1);
220         break;
221     case TCG_COND_GTU:
222         result = (u0 > u1);
223         break;
224     case TCG_COND_TSTEQ:
225         result = (u0 & u1) == 0;
226         break;
227     case TCG_COND_TSTNE:
228         result = (u0 & u1) != 0;
229         break;
230     default:
231         g_assert_not_reached();
232     }
233     return result;
234 }
235 
236 static bool tci_compare64(uint64_t u0, uint64_t u1, TCGCond condition)
237 {
238     bool result = false;
239     int64_t i0 = u0;
240     int64_t i1 = u1;
241     switch (condition) {
242     case TCG_COND_EQ:
243         result = (u0 == u1);
244         break;
245     case TCG_COND_NE:
246         result = (u0 != u1);
247         break;
248     case TCG_COND_LT:
249         result = (i0 < i1);
250         break;
251     case TCG_COND_GE:
252         result = (i0 >= i1);
253         break;
254     case TCG_COND_LE:
255         result = (i0 <= i1);
256         break;
257     case TCG_COND_GT:
258         result = (i0 > i1);
259         break;
260     case TCG_COND_LTU:
261         result = (u0 < u1);
262         break;
263     case TCG_COND_GEU:
264         result = (u0 >= u1);
265         break;
266     case TCG_COND_LEU:
267         result = (u0 <= u1);
268         break;
269     case TCG_COND_GTU:
270         result = (u0 > u1);
271         break;
272     case TCG_COND_TSTEQ:
273         result = (u0 & u1) == 0;
274         break;
275     case TCG_COND_TSTNE:
276         result = (u0 & u1) != 0;
277         break;
278     default:
279         g_assert_not_reached();
280     }
281     return result;
282 }
283 
284 static uint64_t tci_qemu_ld(CPUArchState *env, uint64_t taddr,
285                             MemOpIdx oi, const void *tb_ptr)
286 {
287     MemOp mop = get_memop(oi);
288     uintptr_t ra = (uintptr_t)tb_ptr;
289 
290     switch (mop & MO_SSIZE) {
291     case MO_UB:
292         return helper_ldub_mmu(env, taddr, oi, ra);
293     case MO_SB:
294         return helper_ldsb_mmu(env, taddr, oi, ra);
295     case MO_UW:
296         return helper_lduw_mmu(env, taddr, oi, ra);
297     case MO_SW:
298         return helper_ldsw_mmu(env, taddr, oi, ra);
299     case MO_UL:
300         return helper_ldul_mmu(env, taddr, oi, ra);
301     case MO_SL:
302         return helper_ldsl_mmu(env, taddr, oi, ra);
303     case MO_UQ:
304         return helper_ldq_mmu(env, taddr, oi, ra);
305     default:
306         g_assert_not_reached();
307     }
308 }
309 
310 static void tci_qemu_st(CPUArchState *env, uint64_t taddr, uint64_t val,
311                         MemOpIdx oi, const void *tb_ptr)
312 {
313     MemOp mop = get_memop(oi);
314     uintptr_t ra = (uintptr_t)tb_ptr;
315 
316     switch (mop & MO_SIZE) {
317     case MO_UB:
318         helper_stb_mmu(env, taddr, val, oi, ra);
319         break;
320     case MO_UW:
321         helper_stw_mmu(env, taddr, val, oi, ra);
322         break;
323     case MO_UL:
324         helper_stl_mmu(env, taddr, val, oi, ra);
325         break;
326     case MO_UQ:
327         helper_stq_mmu(env, taddr, val, oi, ra);
328         break;
329     default:
330         g_assert_not_reached();
331     }
332 }
333 
334 #if TCG_TARGET_REG_BITS == 64
335 # define CASE_32_64(x) \
336         case glue(glue(INDEX_op_, x), _i64): \
337         case glue(glue(INDEX_op_, x), _i32):
338 # define CASE_64(x) \
339         case glue(glue(INDEX_op_, x), _i64):
340 #else
341 # define CASE_32_64(x) \
342         case glue(glue(INDEX_op_, x), _i32):
343 # define CASE_64(x)
344 #endif
345 
346 /* Interpret pseudo code in tb. */
347 /*
348  * Disable CFI checks.
349  * One possible operation in the pseudo code is a call to binary code.
350  * Therefore, disable CFI checks in the interpreter function
351  */
352 uintptr_t QEMU_DISABLE_CFI tcg_qemu_tb_exec(CPUArchState *env,
353                                             const void *v_tb_ptr)
354 {
355     const uint32_t *tb_ptr = v_tb_ptr;
356     tcg_target_ulong regs[TCG_TARGET_NB_REGS];
357     uint64_t stack[(TCG_STATIC_CALL_ARGS_SIZE + TCG_STATIC_FRAME_SIZE)
358                    / sizeof(uint64_t)];
359 
360     regs[TCG_AREG0] = (tcg_target_ulong)env;
361     regs[TCG_REG_CALL_STACK] = (uintptr_t)stack;
362     tci_assert(tb_ptr);
363 
364     for (;;) {
365         uint32_t insn;
366         TCGOpcode opc;
367         TCGReg r0, r1, r2, r3, r4, r5;
368         tcg_target_ulong t1;
369         TCGCond condition;
370         uint8_t pos, len;
371         uint32_t tmp32;
372         uint64_t tmp64, taddr;
373         uint64_t T1, T2;
374         MemOpIdx oi;
375         int32_t ofs;
376         void *ptr;
377 
378         insn = *tb_ptr++;
379         opc = extract32(insn, 0, 8);
380 
381         switch (opc) {
382         case INDEX_op_call:
383             {
384                 void *call_slots[MAX_CALL_IARGS];
385                 ffi_cif *cif;
386                 void *func;
387                 unsigned i, s, n;
388 
389                 tci_args_nl(insn, tb_ptr, &len, &ptr);
390                 func = ((void **)ptr)[0];
391                 cif = ((void **)ptr)[1];
392 
393                 n = cif->nargs;
394                 for (i = s = 0; i < n; ++i) {
395                     ffi_type *t = cif->arg_types[i];
396                     call_slots[i] = &stack[s];
397                     s += DIV_ROUND_UP(t->size, 8);
398                 }
399 
400                 /* Helper functions may need to access the "return address" */
401                 tci_tb_ptr = (uintptr_t)tb_ptr;
402                 ffi_call(cif, func, stack, call_slots);
403             }
404 
405             switch (len) {
406             case 0: /* void */
407                 break;
408             case 1: /* uint32_t */
409                 /*
410                  * The result winds up "left-aligned" in the stack[0] slot.
411                  * Note that libffi has an odd special case in that it will
412                  * always widen an integral result to ffi_arg.
413                  */
414                 if (sizeof(ffi_arg) == 8) {
415                     regs[TCG_REG_R0] = (uint32_t)stack[0];
416                 } else {
417                     regs[TCG_REG_R0] = *(uint32_t *)stack;
418                 }
419                 break;
420             case 2: /* uint64_t */
421                 /*
422                  * For TCG_TARGET_REG_BITS == 32, the register pair
423                  * must stay in host memory order.
424                  */
425                 memcpy(&regs[TCG_REG_R0], stack, 8);
426                 break;
427             case 3: /* Int128 */
428                 memcpy(&regs[TCG_REG_R0], stack, 16);
429                 break;
430             default:
431                 g_assert_not_reached();
432             }
433             break;
434 
435         case INDEX_op_br:
436             tci_args_l(insn, tb_ptr, &ptr);
437             tb_ptr = ptr;
438             continue;
439         case INDEX_op_setcond_i32:
440             tci_args_rrrc(insn, &r0, &r1, &r2, &condition);
441             regs[r0] = tci_compare32(regs[r1], regs[r2], condition);
442             break;
443         case INDEX_op_movcond_i32:
444             tci_args_rrrrrc(insn, &r0, &r1, &r2, &r3, &r4, &condition);
445             tmp32 = tci_compare32(regs[r1], regs[r2], condition);
446             regs[r0] = regs[tmp32 ? r3 : r4];
447             break;
448 #if TCG_TARGET_REG_BITS == 32
449         case INDEX_op_setcond2_i32:
450             tci_args_rrrrrc(insn, &r0, &r1, &r2, &r3, &r4, &condition);
451             T1 = tci_uint64(regs[r2], regs[r1]);
452             T2 = tci_uint64(regs[r4], regs[r3]);
453             regs[r0] = tci_compare64(T1, T2, condition);
454             break;
455 #elif TCG_TARGET_REG_BITS == 64
456         case INDEX_op_setcond_i64:
457             tci_args_rrrc(insn, &r0, &r1, &r2, &condition);
458             regs[r0] = tci_compare64(regs[r1], regs[r2], condition);
459             break;
460         case INDEX_op_movcond_i64:
461             tci_args_rrrrrc(insn, &r0, &r1, &r2, &r3, &r4, &condition);
462             tmp32 = tci_compare64(regs[r1], regs[r2], condition);
463             regs[r0] = regs[tmp32 ? r3 : r4];
464             break;
465 #endif
466         case INDEX_op_mov:
467             tci_args_rr(insn, &r0, &r1);
468             regs[r0] = regs[r1];
469             break;
470         case INDEX_op_tci_movi:
471             tci_args_ri(insn, &r0, &t1);
472             regs[r0] = t1;
473             break;
474         case INDEX_op_tci_movl:
475             tci_args_rl(insn, tb_ptr, &r0, &ptr);
476             regs[r0] = *(tcg_target_ulong *)ptr;
477             break;
478 
479             /* Load/store operations (32 bit). */
480 
481         CASE_32_64(ld8u)
482             tci_args_rrs(insn, &r0, &r1, &ofs);
483             ptr = (void *)(regs[r1] + ofs);
484             regs[r0] = *(uint8_t *)ptr;
485             break;
486         CASE_32_64(ld8s)
487             tci_args_rrs(insn, &r0, &r1, &ofs);
488             ptr = (void *)(regs[r1] + ofs);
489             regs[r0] = *(int8_t *)ptr;
490             break;
491         CASE_32_64(ld16u)
492             tci_args_rrs(insn, &r0, &r1, &ofs);
493             ptr = (void *)(regs[r1] + ofs);
494             regs[r0] = *(uint16_t *)ptr;
495             break;
496         CASE_32_64(ld16s)
497             tci_args_rrs(insn, &r0, &r1, &ofs);
498             ptr = (void *)(regs[r1] + ofs);
499             regs[r0] = *(int16_t *)ptr;
500             break;
501         case INDEX_op_ld_i32:
502         CASE_64(ld32u)
503             tci_args_rrs(insn, &r0, &r1, &ofs);
504             ptr = (void *)(regs[r1] + ofs);
505             regs[r0] = *(uint32_t *)ptr;
506             break;
507         CASE_32_64(st8)
508             tci_args_rrs(insn, &r0, &r1, &ofs);
509             ptr = (void *)(regs[r1] + ofs);
510             *(uint8_t *)ptr = regs[r0];
511             break;
512         CASE_32_64(st16)
513             tci_args_rrs(insn, &r0, &r1, &ofs);
514             ptr = (void *)(regs[r1] + ofs);
515             *(uint16_t *)ptr = regs[r0];
516             break;
517         case INDEX_op_st_i32:
518         CASE_64(st32)
519             tci_args_rrs(insn, &r0, &r1, &ofs);
520             ptr = (void *)(regs[r1] + ofs);
521             *(uint32_t *)ptr = regs[r0];
522             break;
523 
524             /* Arithmetic operations (mixed 32/64 bit). */
525 
526         case INDEX_op_add:
527             tci_args_rrr(insn, &r0, &r1, &r2);
528             regs[r0] = regs[r1] + regs[r2];
529             break;
530         CASE_32_64(sub)
531             tci_args_rrr(insn, &r0, &r1, &r2);
532             regs[r0] = regs[r1] - regs[r2];
533             break;
534         CASE_32_64(mul)
535             tci_args_rrr(insn, &r0, &r1, &r2);
536             regs[r0] = regs[r1] * regs[r2];
537             break;
538         case INDEX_op_and:
539             tci_args_rrr(insn, &r0, &r1, &r2);
540             regs[r0] = regs[r1] & regs[r2];
541             break;
542         case INDEX_op_or:
543             tci_args_rrr(insn, &r0, &r1, &r2);
544             regs[r0] = regs[r1] | regs[r2];
545             break;
546         CASE_32_64(xor)
547             tci_args_rrr(insn, &r0, &r1, &r2);
548             regs[r0] = regs[r1] ^ regs[r2];
549             break;
550         case INDEX_op_andc:
551             tci_args_rrr(insn, &r0, &r1, &r2);
552             regs[r0] = regs[r1] & ~regs[r2];
553             break;
554 #if TCG_TARGET_HAS_orc_i32 || TCG_TARGET_HAS_orc_i64
555         CASE_32_64(orc)
556             tci_args_rrr(insn, &r0, &r1, &r2);
557             regs[r0] = regs[r1] | ~regs[r2];
558             break;
559 #endif
560 #if TCG_TARGET_HAS_eqv_i32 || TCG_TARGET_HAS_eqv_i64
561         CASE_32_64(eqv)
562             tci_args_rrr(insn, &r0, &r1, &r2);
563             regs[r0] = ~(regs[r1] ^ regs[r2]);
564             break;
565 #endif
566 #if TCG_TARGET_HAS_nand_i32 || TCG_TARGET_HAS_nand_i64
567         CASE_32_64(nand)
568             tci_args_rrr(insn, &r0, &r1, &r2);
569             regs[r0] = ~(regs[r1] & regs[r2]);
570             break;
571 #endif
572 #if TCG_TARGET_HAS_nor_i32 || TCG_TARGET_HAS_nor_i64
573         CASE_32_64(nor)
574             tci_args_rrr(insn, &r0, &r1, &r2);
575             regs[r0] = ~(regs[r1] | regs[r2]);
576             break;
577 #endif
578 
579             /* Arithmetic operations (32 bit). */
580 
581         case INDEX_op_div_i32:
582             tci_args_rrr(insn, &r0, &r1, &r2);
583             regs[r0] = (int32_t)regs[r1] / (int32_t)regs[r2];
584             break;
585         case INDEX_op_divu_i32:
586             tci_args_rrr(insn, &r0, &r1, &r2);
587             regs[r0] = (uint32_t)regs[r1] / (uint32_t)regs[r2];
588             break;
589         case INDEX_op_rem_i32:
590             tci_args_rrr(insn, &r0, &r1, &r2);
591             regs[r0] = (int32_t)regs[r1] % (int32_t)regs[r2];
592             break;
593         case INDEX_op_remu_i32:
594             tci_args_rrr(insn, &r0, &r1, &r2);
595             regs[r0] = (uint32_t)regs[r1] % (uint32_t)regs[r2];
596             break;
597 #if TCG_TARGET_HAS_clz_i32
598         case INDEX_op_clz_i32:
599             tci_args_rrr(insn, &r0, &r1, &r2);
600             tmp32 = regs[r1];
601             regs[r0] = tmp32 ? clz32(tmp32) : regs[r2];
602             break;
603 #endif
604 #if TCG_TARGET_HAS_ctz_i32
605         case INDEX_op_ctz_i32:
606             tci_args_rrr(insn, &r0, &r1, &r2);
607             tmp32 = regs[r1];
608             regs[r0] = tmp32 ? ctz32(tmp32) : regs[r2];
609             break;
610 #endif
611 #if TCG_TARGET_HAS_ctpop_i32
612         case INDEX_op_ctpop_i32:
613             tci_args_rr(insn, &r0, &r1);
614             regs[r0] = ctpop32(regs[r1]);
615             break;
616 #endif
617 
618             /* Shift/rotate operations (32 bit). */
619 
620         case INDEX_op_shl_i32:
621             tci_args_rrr(insn, &r0, &r1, &r2);
622             regs[r0] = (uint32_t)regs[r1] << (regs[r2] & 31);
623             break;
624         case INDEX_op_shr_i32:
625             tci_args_rrr(insn, &r0, &r1, &r2);
626             regs[r0] = (uint32_t)regs[r1] >> (regs[r2] & 31);
627             break;
628         case INDEX_op_sar_i32:
629             tci_args_rrr(insn, &r0, &r1, &r2);
630             regs[r0] = (int32_t)regs[r1] >> (regs[r2] & 31);
631             break;
632 #if TCG_TARGET_HAS_rot_i32
633         case INDEX_op_rotl_i32:
634             tci_args_rrr(insn, &r0, &r1, &r2);
635             regs[r0] = rol32(regs[r1], regs[r2] & 31);
636             break;
637         case INDEX_op_rotr_i32:
638             tci_args_rrr(insn, &r0, &r1, &r2);
639             regs[r0] = ror32(regs[r1], regs[r2] & 31);
640             break;
641 #endif
642         case INDEX_op_deposit_i32:
643             tci_args_rrrbb(insn, &r0, &r1, &r2, &pos, &len);
644             regs[r0] = deposit32(regs[r1], pos, len, regs[r2]);
645             break;
646         case INDEX_op_extract_i32:
647             tci_args_rrbb(insn, &r0, &r1, &pos, &len);
648             regs[r0] = extract32(regs[r1], pos, len);
649             break;
650         case INDEX_op_sextract_i32:
651             tci_args_rrbb(insn, &r0, &r1, &pos, &len);
652             regs[r0] = sextract32(regs[r1], pos, len);
653             break;
654         case INDEX_op_brcond_i32:
655             tci_args_rl(insn, tb_ptr, &r0, &ptr);
656             if ((uint32_t)regs[r0]) {
657                 tb_ptr = ptr;
658             }
659             break;
660 #if TCG_TARGET_REG_BITS == 32 || TCG_TARGET_HAS_add2_i32
661         case INDEX_op_add2_i32:
662             tci_args_rrrrrr(insn, &r0, &r1, &r2, &r3, &r4, &r5);
663             T1 = tci_uint64(regs[r3], regs[r2]);
664             T2 = tci_uint64(regs[r5], regs[r4]);
665             tci_write_reg64(regs, r1, r0, T1 + T2);
666             break;
667 #endif
668 #if TCG_TARGET_REG_BITS == 32 || TCG_TARGET_HAS_sub2_i32
669         case INDEX_op_sub2_i32:
670             tci_args_rrrrrr(insn, &r0, &r1, &r2, &r3, &r4, &r5);
671             T1 = tci_uint64(regs[r3], regs[r2]);
672             T2 = tci_uint64(regs[r5], regs[r4]);
673             tci_write_reg64(regs, r1, r0, T1 - T2);
674             break;
675 #endif
676 #if TCG_TARGET_HAS_mulu2_i32
677         case INDEX_op_mulu2_i32:
678             tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
679             tmp64 = (uint64_t)(uint32_t)regs[r2] * (uint32_t)regs[r3];
680             tci_write_reg64(regs, r1, r0, tmp64);
681             break;
682 #endif
683 #if TCG_TARGET_HAS_muls2_i32
684         case INDEX_op_muls2_i32:
685             tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
686             tmp64 = (int64_t)(int32_t)regs[r2] * (int32_t)regs[r3];
687             tci_write_reg64(regs, r1, r0, tmp64);
688             break;
689 #endif
690 #if TCG_TARGET_HAS_bswap16_i32 || TCG_TARGET_HAS_bswap16_i64
691         CASE_32_64(bswap16)
692             tci_args_rr(insn, &r0, &r1);
693             regs[r0] = bswap16(regs[r1]);
694             break;
695 #endif
696 #if TCG_TARGET_HAS_bswap32_i32 || TCG_TARGET_HAS_bswap32_i64
697         CASE_32_64(bswap32)
698             tci_args_rr(insn, &r0, &r1);
699             regs[r0] = bswap32(regs[r1]);
700             break;
701 #endif
702 #if TCG_TARGET_HAS_not_i32 || TCG_TARGET_HAS_not_i64
703         CASE_32_64(not)
704             tci_args_rr(insn, &r0, &r1);
705             regs[r0] = ~regs[r1];
706             break;
707 #endif
708         CASE_32_64(neg)
709             tci_args_rr(insn, &r0, &r1);
710             regs[r0] = -regs[r1];
711             break;
712 #if TCG_TARGET_REG_BITS == 64
713             /* Load/store operations (64 bit). */
714 
715         case INDEX_op_ld32s_i64:
716             tci_args_rrs(insn, &r0, &r1, &ofs);
717             ptr = (void *)(regs[r1] + ofs);
718             regs[r0] = *(int32_t *)ptr;
719             break;
720         case INDEX_op_ld_i64:
721             tci_args_rrs(insn, &r0, &r1, &ofs);
722             ptr = (void *)(regs[r1] + ofs);
723             regs[r0] = *(uint64_t *)ptr;
724             break;
725         case INDEX_op_st_i64:
726             tci_args_rrs(insn, &r0, &r1, &ofs);
727             ptr = (void *)(regs[r1] + ofs);
728             *(uint64_t *)ptr = regs[r0];
729             break;
730 
731             /* Arithmetic operations (64 bit). */
732 
733         case INDEX_op_div_i64:
734             tci_args_rrr(insn, &r0, &r1, &r2);
735             regs[r0] = (int64_t)regs[r1] / (int64_t)regs[r2];
736             break;
737         case INDEX_op_divu_i64:
738             tci_args_rrr(insn, &r0, &r1, &r2);
739             regs[r0] = (uint64_t)regs[r1] / (uint64_t)regs[r2];
740             break;
741         case INDEX_op_rem_i64:
742             tci_args_rrr(insn, &r0, &r1, &r2);
743             regs[r0] = (int64_t)regs[r1] % (int64_t)regs[r2];
744             break;
745         case INDEX_op_remu_i64:
746             tci_args_rrr(insn, &r0, &r1, &r2);
747             regs[r0] = (uint64_t)regs[r1] % (uint64_t)regs[r2];
748             break;
749 #if TCG_TARGET_HAS_clz_i64
750         case INDEX_op_clz_i64:
751             tci_args_rrr(insn, &r0, &r1, &r2);
752             regs[r0] = regs[r1] ? clz64(regs[r1]) : regs[r2];
753             break;
754 #endif
755 #if TCG_TARGET_HAS_ctz_i64
756         case INDEX_op_ctz_i64:
757             tci_args_rrr(insn, &r0, &r1, &r2);
758             regs[r0] = regs[r1] ? ctz64(regs[r1]) : regs[r2];
759             break;
760 #endif
761 #if TCG_TARGET_HAS_ctpop_i64
762         case INDEX_op_ctpop_i64:
763             tci_args_rr(insn, &r0, &r1);
764             regs[r0] = ctpop64(regs[r1]);
765             break;
766 #endif
767 #if TCG_TARGET_HAS_mulu2_i64
768         case INDEX_op_mulu2_i64:
769             tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
770             mulu64(&regs[r0], &regs[r1], regs[r2], regs[r3]);
771             break;
772 #endif
773 #if TCG_TARGET_HAS_muls2_i64
774         case INDEX_op_muls2_i64:
775             tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
776             muls64(&regs[r0], &regs[r1], regs[r2], regs[r3]);
777             break;
778 #endif
779 #if TCG_TARGET_HAS_add2_i64
780         case INDEX_op_add2_i64:
781             tci_args_rrrrrr(insn, &r0, &r1, &r2, &r3, &r4, &r5);
782             T1 = regs[r2] + regs[r4];
783             T2 = regs[r3] + regs[r5] + (T1 < regs[r2]);
784             regs[r0] = T1;
785             regs[r1] = T2;
786             break;
787 #endif
788 #if TCG_TARGET_HAS_add2_i64
789         case INDEX_op_sub2_i64:
790             tci_args_rrrrrr(insn, &r0, &r1, &r2, &r3, &r4, &r5);
791             T1 = regs[r2] - regs[r4];
792             T2 = regs[r3] - regs[r5] - (regs[r2] < regs[r4]);
793             regs[r0] = T1;
794             regs[r1] = T2;
795             break;
796 #endif
797 
798             /* Shift/rotate operations (64 bit). */
799 
800         case INDEX_op_shl_i64:
801             tci_args_rrr(insn, &r0, &r1, &r2);
802             regs[r0] = regs[r1] << (regs[r2] & 63);
803             break;
804         case INDEX_op_shr_i64:
805             tci_args_rrr(insn, &r0, &r1, &r2);
806             regs[r0] = regs[r1] >> (regs[r2] & 63);
807             break;
808         case INDEX_op_sar_i64:
809             tci_args_rrr(insn, &r0, &r1, &r2);
810             regs[r0] = (int64_t)regs[r1] >> (regs[r2] & 63);
811             break;
812 #if TCG_TARGET_HAS_rot_i64
813         case INDEX_op_rotl_i64:
814             tci_args_rrr(insn, &r0, &r1, &r2);
815             regs[r0] = rol64(regs[r1], regs[r2] & 63);
816             break;
817         case INDEX_op_rotr_i64:
818             tci_args_rrr(insn, &r0, &r1, &r2);
819             regs[r0] = ror64(regs[r1], regs[r2] & 63);
820             break;
821 #endif
822         case INDEX_op_deposit_i64:
823             tci_args_rrrbb(insn, &r0, &r1, &r2, &pos, &len);
824             regs[r0] = deposit64(regs[r1], pos, len, regs[r2]);
825             break;
826         case INDEX_op_extract_i64:
827             tci_args_rrbb(insn, &r0, &r1, &pos, &len);
828             regs[r0] = extract64(regs[r1], pos, len);
829             break;
830         case INDEX_op_sextract_i64:
831             tci_args_rrbb(insn, &r0, &r1, &pos, &len);
832             regs[r0] = sextract64(regs[r1], pos, len);
833             break;
834         case INDEX_op_brcond_i64:
835             tci_args_rl(insn, tb_ptr, &r0, &ptr);
836             if (regs[r0]) {
837                 tb_ptr = ptr;
838             }
839             break;
840         case INDEX_op_ext_i32_i64:
841             tci_args_rr(insn, &r0, &r1);
842             regs[r0] = (int32_t)regs[r1];
843             break;
844         case INDEX_op_extu_i32_i64:
845             tci_args_rr(insn, &r0, &r1);
846             regs[r0] = (uint32_t)regs[r1];
847             break;
848 #if TCG_TARGET_HAS_bswap64_i64
849         case INDEX_op_bswap64_i64:
850             tci_args_rr(insn, &r0, &r1);
851             regs[r0] = bswap64(regs[r1]);
852             break;
853 #endif
854 #endif /* TCG_TARGET_REG_BITS == 64 */
855 
856             /* QEMU specific operations. */
857 
858         case INDEX_op_exit_tb:
859             tci_args_l(insn, tb_ptr, &ptr);
860             return (uintptr_t)ptr;
861 
862         case INDEX_op_goto_tb:
863             tci_args_l(insn, tb_ptr, &ptr);
864             tb_ptr = *(void **)ptr;
865             break;
866 
867         case INDEX_op_goto_ptr:
868             tci_args_r(insn, &r0);
869             ptr = (void *)regs[r0];
870             if (!ptr) {
871                 return 0;
872             }
873             tb_ptr = ptr;
874             break;
875 
876         case INDEX_op_qemu_ld_i32:
877             tci_args_rrm(insn, &r0, &r1, &oi);
878             taddr = regs[r1];
879             regs[r0] = tci_qemu_ld(env, taddr, oi, tb_ptr);
880             break;
881 
882         case INDEX_op_qemu_ld_i64:
883             if (TCG_TARGET_REG_BITS == 64) {
884                 tci_args_rrm(insn, &r0, &r1, &oi);
885                 taddr = regs[r1];
886             } else {
887                 tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
888                 taddr = regs[r2];
889                 oi = regs[r3];
890             }
891             tmp64 = tci_qemu_ld(env, taddr, oi, tb_ptr);
892             if (TCG_TARGET_REG_BITS == 32) {
893                 tci_write_reg64(regs, r1, r0, tmp64);
894             } else {
895                 regs[r0] = tmp64;
896             }
897             break;
898 
899         case INDEX_op_qemu_st_i32:
900             tci_args_rrm(insn, &r0, &r1, &oi);
901             taddr = regs[r1];
902             tci_qemu_st(env, taddr, regs[r0], oi, tb_ptr);
903             break;
904 
905         case INDEX_op_qemu_st_i64:
906             if (TCG_TARGET_REG_BITS == 64) {
907                 tci_args_rrm(insn, &r0, &r1, &oi);
908                 tmp64 = regs[r0];
909                 taddr = regs[r1];
910             } else {
911                 tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
912                 tmp64 = tci_uint64(regs[r1], regs[r0]);
913                 taddr = regs[r2];
914                 oi = regs[r3];
915             }
916             tci_qemu_st(env, taddr, tmp64, oi, tb_ptr);
917             break;
918 
919         case INDEX_op_mb:
920             /* Ensure ordering for all kinds */
921             smp_mb();
922             break;
923         default:
924             g_assert_not_reached();
925         }
926     }
927 }
928 
929 /*
930  * Disassembler that matches the interpreter
931  */
932 
933 static const char *str_r(TCGReg r)
934 {
935     static const char regs[TCG_TARGET_NB_REGS][4] = {
936         "r0", "r1", "r2",  "r3",  "r4",  "r5",  "r6",  "r7",
937         "r8", "r9", "r10", "r11", "r12", "r13", "env", "sp"
938     };
939 
940     QEMU_BUILD_BUG_ON(TCG_AREG0 != TCG_REG_R14);
941     QEMU_BUILD_BUG_ON(TCG_REG_CALL_STACK != TCG_REG_R15);
942 
943     assert((unsigned)r < TCG_TARGET_NB_REGS);
944     return regs[r];
945 }
946 
947 static const char *str_c(TCGCond c)
948 {
949     static const char cond[16][8] = {
950         [TCG_COND_NEVER] = "never",
951         [TCG_COND_ALWAYS] = "always",
952         [TCG_COND_EQ] = "eq",
953         [TCG_COND_NE] = "ne",
954         [TCG_COND_LT] = "lt",
955         [TCG_COND_GE] = "ge",
956         [TCG_COND_LE] = "le",
957         [TCG_COND_GT] = "gt",
958         [TCG_COND_LTU] = "ltu",
959         [TCG_COND_GEU] = "geu",
960         [TCG_COND_LEU] = "leu",
961         [TCG_COND_GTU] = "gtu",
962         [TCG_COND_TSTEQ] = "tsteq",
963         [TCG_COND_TSTNE] = "tstne",
964     };
965 
966     assert((unsigned)c < ARRAY_SIZE(cond));
967     assert(cond[c][0] != 0);
968     return cond[c];
969 }
970 
971 /* Disassemble TCI bytecode. */
972 int print_insn_tci(bfd_vma addr, disassemble_info *info)
973 {
974     const uint32_t *tb_ptr = (const void *)(uintptr_t)addr;
975     const TCGOpDef *def;
976     const char *op_name;
977     uint32_t insn;
978     TCGOpcode op;
979     TCGReg r0, r1, r2, r3, r4, r5;
980     tcg_target_ulong i1;
981     int32_t s2;
982     TCGCond c;
983     MemOpIdx oi;
984     uint8_t pos, len;
985     void *ptr;
986 
987     /* TCI is always the host, so we don't need to load indirect. */
988     insn = *tb_ptr++;
989 
990     info->fprintf_func(info->stream, "%08x  ", insn);
991 
992     op = extract32(insn, 0, 8);
993     def = &tcg_op_defs[op];
994     op_name = def->name;
995 
996     switch (op) {
997     case INDEX_op_br:
998     case INDEX_op_exit_tb:
999     case INDEX_op_goto_tb:
1000         tci_args_l(insn, tb_ptr, &ptr);
1001         info->fprintf_func(info->stream, "%-12s  %p", op_name, ptr);
1002         break;
1003 
1004     case INDEX_op_goto_ptr:
1005         tci_args_r(insn, &r0);
1006         info->fprintf_func(info->stream, "%-12s  %s", op_name, str_r(r0));
1007         break;
1008 
1009     case INDEX_op_call:
1010         tci_args_nl(insn, tb_ptr, &len, &ptr);
1011         info->fprintf_func(info->stream, "%-12s  %d, %p", op_name, len, ptr);
1012         break;
1013 
1014     case INDEX_op_brcond_i32:
1015     case INDEX_op_brcond_i64:
1016         tci_args_rl(insn, tb_ptr, &r0, &ptr);
1017         info->fprintf_func(info->stream, "%-12s  %s, 0, ne, %p",
1018                            op_name, str_r(r0), ptr);
1019         break;
1020 
1021     case INDEX_op_setcond_i32:
1022     case INDEX_op_setcond_i64:
1023         tci_args_rrrc(insn, &r0, &r1, &r2, &c);
1024         info->fprintf_func(info->stream, "%-12s  %s, %s, %s, %s",
1025                            op_name, str_r(r0), str_r(r1), str_r(r2), str_c(c));
1026         break;
1027 
1028     case INDEX_op_tci_movi:
1029         tci_args_ri(insn, &r0, &i1);
1030         info->fprintf_func(info->stream, "%-12s  %s, 0x%" TCG_PRIlx,
1031                            op_name, str_r(r0), i1);
1032         break;
1033 
1034     case INDEX_op_tci_movl:
1035         tci_args_rl(insn, tb_ptr, &r0, &ptr);
1036         info->fprintf_func(info->stream, "%-12s  %s, %p",
1037                            op_name, str_r(r0), ptr);
1038         break;
1039 
1040     case INDEX_op_ld8u_i32:
1041     case INDEX_op_ld8u_i64:
1042     case INDEX_op_ld8s_i32:
1043     case INDEX_op_ld8s_i64:
1044     case INDEX_op_ld16u_i32:
1045     case INDEX_op_ld16u_i64:
1046     case INDEX_op_ld16s_i32:
1047     case INDEX_op_ld16s_i64:
1048     case INDEX_op_ld32u_i64:
1049     case INDEX_op_ld32s_i64:
1050     case INDEX_op_ld_i32:
1051     case INDEX_op_ld_i64:
1052     case INDEX_op_st8_i32:
1053     case INDEX_op_st8_i64:
1054     case INDEX_op_st16_i32:
1055     case INDEX_op_st16_i64:
1056     case INDEX_op_st32_i64:
1057     case INDEX_op_st_i32:
1058     case INDEX_op_st_i64:
1059         tci_args_rrs(insn, &r0, &r1, &s2);
1060         info->fprintf_func(info->stream, "%-12s  %s, %s, %d",
1061                            op_name, str_r(r0), str_r(r1), s2);
1062         break;
1063 
1064     case INDEX_op_mov:
1065     case INDEX_op_ext_i32_i64:
1066     case INDEX_op_extu_i32_i64:
1067     case INDEX_op_bswap16_i32:
1068     case INDEX_op_bswap16_i64:
1069     case INDEX_op_bswap32_i32:
1070     case INDEX_op_bswap32_i64:
1071     case INDEX_op_bswap64_i64:
1072     case INDEX_op_not_i32:
1073     case INDEX_op_not_i64:
1074     case INDEX_op_neg_i32:
1075     case INDEX_op_neg_i64:
1076     case INDEX_op_ctpop_i32:
1077     case INDEX_op_ctpop_i64:
1078         tci_args_rr(insn, &r0, &r1);
1079         info->fprintf_func(info->stream, "%-12s  %s, %s",
1080                            op_name, str_r(r0), str_r(r1));
1081         break;
1082 
1083     case INDEX_op_add:
1084     case INDEX_op_and:
1085     case INDEX_op_andc:
1086     case INDEX_op_or:
1087     case INDEX_op_sub_i32:
1088     case INDEX_op_sub_i64:
1089     case INDEX_op_mul_i32:
1090     case INDEX_op_mul_i64:
1091     case INDEX_op_xor_i32:
1092     case INDEX_op_xor_i64:
1093     case INDEX_op_orc_i32:
1094     case INDEX_op_orc_i64:
1095     case INDEX_op_eqv_i32:
1096     case INDEX_op_eqv_i64:
1097     case INDEX_op_nand_i32:
1098     case INDEX_op_nand_i64:
1099     case INDEX_op_nor_i32:
1100     case INDEX_op_nor_i64:
1101     case INDEX_op_div_i32:
1102     case INDEX_op_div_i64:
1103     case INDEX_op_rem_i32:
1104     case INDEX_op_rem_i64:
1105     case INDEX_op_divu_i32:
1106     case INDEX_op_divu_i64:
1107     case INDEX_op_remu_i32:
1108     case INDEX_op_remu_i64:
1109     case INDEX_op_shl_i32:
1110     case INDEX_op_shl_i64:
1111     case INDEX_op_shr_i32:
1112     case INDEX_op_shr_i64:
1113     case INDEX_op_sar_i32:
1114     case INDEX_op_sar_i64:
1115     case INDEX_op_rotl_i32:
1116     case INDEX_op_rotl_i64:
1117     case INDEX_op_rotr_i32:
1118     case INDEX_op_rotr_i64:
1119     case INDEX_op_clz_i32:
1120     case INDEX_op_clz_i64:
1121     case INDEX_op_ctz_i32:
1122     case INDEX_op_ctz_i64:
1123         tci_args_rrr(insn, &r0, &r1, &r2);
1124         info->fprintf_func(info->stream, "%-12s  %s, %s, %s",
1125                            op_name, str_r(r0), str_r(r1), str_r(r2));
1126         break;
1127 
1128     case INDEX_op_deposit_i32:
1129     case INDEX_op_deposit_i64:
1130         tci_args_rrrbb(insn, &r0, &r1, &r2, &pos, &len);
1131         info->fprintf_func(info->stream, "%-12s  %s, %s, %s, %d, %d",
1132                            op_name, str_r(r0), str_r(r1), str_r(r2), pos, len);
1133         break;
1134 
1135     case INDEX_op_extract_i32:
1136     case INDEX_op_extract_i64:
1137     case INDEX_op_sextract_i32:
1138     case INDEX_op_sextract_i64:
1139         tci_args_rrbb(insn, &r0, &r1, &pos, &len);
1140         info->fprintf_func(info->stream, "%-12s  %s,%s,%d,%d",
1141                            op_name, str_r(r0), str_r(r1), pos, len);
1142         break;
1143 
1144     case INDEX_op_movcond_i32:
1145     case INDEX_op_movcond_i64:
1146     case INDEX_op_setcond2_i32:
1147         tci_args_rrrrrc(insn, &r0, &r1, &r2, &r3, &r4, &c);
1148         info->fprintf_func(info->stream, "%-12s  %s, %s, %s, %s, %s, %s",
1149                            op_name, str_r(r0), str_r(r1), str_r(r2),
1150                            str_r(r3), str_r(r4), str_c(c));
1151         break;
1152 
1153     case INDEX_op_mulu2_i32:
1154     case INDEX_op_mulu2_i64:
1155     case INDEX_op_muls2_i32:
1156     case INDEX_op_muls2_i64:
1157         tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
1158         info->fprintf_func(info->stream, "%-12s  %s, %s, %s, %s",
1159                            op_name, str_r(r0), str_r(r1),
1160                            str_r(r2), str_r(r3));
1161         break;
1162 
1163     case INDEX_op_add2_i32:
1164     case INDEX_op_add2_i64:
1165     case INDEX_op_sub2_i32:
1166     case INDEX_op_sub2_i64:
1167         tci_args_rrrrrr(insn, &r0, &r1, &r2, &r3, &r4, &r5);
1168         info->fprintf_func(info->stream, "%-12s  %s, %s, %s, %s, %s, %s",
1169                            op_name, str_r(r0), str_r(r1), str_r(r2),
1170                            str_r(r3), str_r(r4), str_r(r5));
1171         break;
1172 
1173     case INDEX_op_qemu_ld_i64:
1174     case INDEX_op_qemu_st_i64:
1175         if (TCG_TARGET_REG_BITS == 32) {
1176             tci_args_rrrr(insn, &r0, &r1, &r2, &r3);
1177             info->fprintf_func(info->stream, "%-12s  %s, %s, %s, %s",
1178                                op_name, str_r(r0), str_r(r1),
1179                                str_r(r2), str_r(r3));
1180             break;
1181         }
1182         /* fall through */
1183     case INDEX_op_qemu_ld_i32:
1184     case INDEX_op_qemu_st_i32:
1185         tci_args_rrm(insn, &r0, &r1, &oi);
1186         info->fprintf_func(info->stream, "%-12s  %s, %s, %x",
1187                            op_name, str_r(r0), str_r(r1), oi);
1188         break;
1189 
1190     case 0:
1191         /* tcg_out_nop_fill uses zeros */
1192         if (insn == 0) {
1193             info->fprintf_func(info->stream, "align");
1194             break;
1195         }
1196         /* fall through */
1197 
1198     default:
1199         info->fprintf_func(info->stream, "illegal opcode %d", op);
1200         break;
1201     }
1202 
1203     return sizeof(insn);
1204 }
1205