xref: /openbmc/qemu/target/hexagon/gen_tcg.h (revision 5c4b11e827e3cd64a6790b6158c75ed876e6f6e9)
1 /*
2  *  Copyright(c) 2019-2023 Qualcomm Innovation Center, Inc. All Rights Reserved.
3  *
4  *  This program is free software; you can redistribute it and/or modify
5  *  it under the terms of the GNU General Public License as published by
6  *  the Free Software Foundation; either version 2 of the License, or
7  *  (at your option) any later version.
8  *
9  *  This program is distributed in the hope that it will be useful,
10  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
11  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12  *  GNU General Public License for more details.
13  *
14  *  You should have received a copy of the GNU General Public License
15  *  along with this program; if not, see <http://www.gnu.org/licenses/>.
16  */
17 
18 #ifndef HEXAGON_GEN_TCG_H
19 #define HEXAGON_GEN_TCG_H
20 
21 /*
22  * Here is a primer to understand the tag names for load/store instructions
23  *
24  * Data types
25  *      b        signed byte                       r0 = memb(r2+#0)
26  *     ub        unsigned byte                     r0 = memub(r2+#0)
27  *      h        signed half word (16 bits)        r0 = memh(r2+#0)
28  *     uh        unsigned half word                r0 = memuh(r2+#0)
29  *      i        integer (32 bits)                 r0 = memw(r2+#0)
30  *      d        double word (64 bits)             r1:0 = memd(r2+#0)
31  *
32  * Addressing modes
33  *     _io       indirect with offset              r0 = memw(r1+#4)
34  *     _ur       absolute with register offset     r0 = memw(r1<<#4+##variable)
35  *     _rr       indirect with register offset     r0 = memw(r1+r4<<#2)
36  *     gp        global pointer relative           r0 = memw(gp+#200)
37  *     _sp       stack pointer relative            r0 = memw(r29+#12)
38  *     _ap       absolute set                      r0 = memw(r1=##variable)
39  *     _pr       post increment register           r0 = memw(r1++m1)
40  *     _pbr      post increment bit reverse        r0 = memw(r1++m1:brev)
41  *     _pi       post increment immediate          r0 = memb(r1++#1)
42  *     _pci      post increment circular immediate r0 = memw(r1++#4:circ(m0))
43  *     _pcr      post increment circular register  r0 = memw(r1++I:circ(m0))
44  */
45 
46 /* Macros for complex addressing modes */
47 #define GET_EA_ap \
48     do { \
49         fEA_IMM(UiV); \
50         tcg_gen_movi_tl(ReV, UiV); \
51     } while (0)
52 #define GET_EA_pr \
53     do { \
54         fEA_REG(RxV); \
55         fPM_M(RxV, MuV); \
56     } while (0)
57 #define GET_EA_pbr \
58     do { \
59         gen_helper_fbrev(EA, RxV); \
60         tcg_gen_add_tl(RxV, RxV, MuV); \
61     } while (0)
62 #define GET_EA_pi \
63     do { \
64         fEA_REG(RxV); \
65         fPM_I(RxV, siV); \
66     } while (0)
67 #define GET_EA_pci \
68     do { \
69         TCGv tcgv_siV = tcg_constant_tl(siV); \
70         tcg_gen_mov_tl(EA, RxV); \
71         gen_helper_fcircadd(RxV, RxV, tcgv_siV, MuV, \
72                             hex_gpr[HEX_REG_CS0 + MuN]); \
73     } while (0)
74 #define GET_EA_pcr(SHIFT) \
75     do { \
76         TCGv ireg = tcg_temp_new(); \
77         tcg_gen_mov_tl(EA, RxV); \
78         gen_read_ireg(ireg, MuV, (SHIFT)); \
79         gen_helper_fcircadd(RxV, RxV, ireg, MuV, hex_gpr[HEX_REG_CS0 + MuN]); \
80     } while (0)
81 
82 /* Instructions with multiple definitions */
83 #define fGEN_TCG_LOAD_AP(RES, SIZE, SIGN) \
84     do { \
85         fMUST_IMMEXT(UiV); \
86         fEA_IMM(UiV); \
87         fLOAD(1, SIZE, SIGN, EA, RES); \
88         tcg_gen_movi_tl(ReV, UiV); \
89     } while (0)
90 
91 #define fGEN_TCG_L4_loadrub_ap(SHORTCODE) \
92     fGEN_TCG_LOAD_AP(RdV, 1, u)
93 #define fGEN_TCG_L4_loadrb_ap(SHORTCODE) \
94     fGEN_TCG_LOAD_AP(RdV, 1, s)
95 #define fGEN_TCG_L4_loadruh_ap(SHORTCODE) \
96     fGEN_TCG_LOAD_AP(RdV, 2, u)
97 #define fGEN_TCG_L4_loadrh_ap(SHORTCODE) \
98     fGEN_TCG_LOAD_AP(RdV, 2, s)
99 #define fGEN_TCG_L4_loadri_ap(SHORTCODE) \
100     fGEN_TCG_LOAD_AP(RdV, 4, u)
101 #define fGEN_TCG_L4_loadrd_ap(SHORTCODE) \
102     fGEN_TCG_LOAD_AP(RddV, 8, u)
103 
104 #define fGEN_TCG_L2_loadrub_pci(SHORTCODE)    SHORTCODE
105 #define fGEN_TCG_L2_loadrb_pci(SHORTCODE)     SHORTCODE
106 #define fGEN_TCG_L2_loadruh_pci(SHORTCODE)    SHORTCODE
107 #define fGEN_TCG_L2_loadrh_pci(SHORTCODE)     SHORTCODE
108 #define fGEN_TCG_L2_loadri_pci(SHORTCODE)     SHORTCODE
109 #define fGEN_TCG_L2_loadrd_pci(SHORTCODE)     SHORTCODE
110 
111 #define fGEN_TCG_LOAD_pcr(SHIFT, LOAD) \
112     do { \
113         TCGv ireg = tcg_temp_new(); \
114         tcg_gen_mov_tl(EA, RxV); \
115         gen_read_ireg(ireg, MuV, SHIFT); \
116         gen_helper_fcircadd(RxV, RxV, ireg, MuV, hex_gpr[HEX_REG_CS0 + MuN]); \
117         LOAD; \
118     } while (0)
119 
120 #define fGEN_TCG_L2_loadrub_pcr(SHORTCODE) \
121       fGEN_TCG_LOAD_pcr(0, fLOAD(1, 1, u, EA, RdV))
122 #define fGEN_TCG_L2_loadrb_pcr(SHORTCODE) \
123       fGEN_TCG_LOAD_pcr(0, fLOAD(1, 1, s, EA, RdV))
124 #define fGEN_TCG_L2_loadruh_pcr(SHORTCODE) \
125       fGEN_TCG_LOAD_pcr(1, fLOAD(1, 2, u, EA, RdV))
126 #define fGEN_TCG_L2_loadrh_pcr(SHORTCODE) \
127       fGEN_TCG_LOAD_pcr(1, fLOAD(1, 2, s, EA, RdV))
128 #define fGEN_TCG_L2_loadri_pcr(SHORTCODE) \
129       fGEN_TCG_LOAD_pcr(2, fLOAD(1, 4, u, EA, RdV))
130 #define fGEN_TCG_L2_loadrd_pcr(SHORTCODE) \
131       fGEN_TCG_LOAD_pcr(3, fLOAD(1, 8, u, EA, RddV))
132 
133 #define fGEN_TCG_L2_loadrub_pr(SHORTCODE)      SHORTCODE
134 #define fGEN_TCG_L2_loadrub_pbr(SHORTCODE)     SHORTCODE
135 #define fGEN_TCG_L2_loadrub_pi(SHORTCODE)      SHORTCODE
136 #define fGEN_TCG_L2_loadrb_pr(SHORTCODE)       SHORTCODE
137 #define fGEN_TCG_L2_loadrb_pbr(SHORTCODE)      SHORTCODE
138 #define fGEN_TCG_L2_loadrb_pi(SHORTCODE)       SHORTCODE
139 #define fGEN_TCG_L2_loadruh_pr(SHORTCODE)      SHORTCODE
140 #define fGEN_TCG_L2_loadruh_pbr(SHORTCODE)     SHORTCODE
141 #define fGEN_TCG_L2_loadruh_pi(SHORTCODE)      SHORTCODE
142 #define fGEN_TCG_L2_loadrh_pr(SHORTCODE)       SHORTCODE
143 #define fGEN_TCG_L2_loadrh_pbr(SHORTCODE)      SHORTCODE
144 #define fGEN_TCG_L2_loadrh_pi(SHORTCODE)       SHORTCODE
145 #define fGEN_TCG_L2_loadri_pr(SHORTCODE)       SHORTCODE
146 #define fGEN_TCG_L2_loadri_pbr(SHORTCODE)      SHORTCODE
147 #define fGEN_TCG_L2_loadri_pi(SHORTCODE)       SHORTCODE
148 #define fGEN_TCG_L2_loadrd_pr(SHORTCODE)       SHORTCODE
149 #define fGEN_TCG_L2_loadrd_pbr(SHORTCODE)      SHORTCODE
150 #define fGEN_TCG_L2_loadrd_pi(SHORTCODE)       SHORTCODE
151 
152 /*
153  * These instructions load 2 bytes and places them in
154  * two halves of the destination register.
155  * The GET_EA macro determines the addressing mode.
156  * The SIGN argument determines whether to zero-extend or
157  * sign-extend.
158  */
159 #define fGEN_TCG_loadbXw2(GET_EA, SIGN) \
160     do { \
161         TCGv tmp = tcg_temp_new(); \
162         TCGv byte = tcg_temp_new(); \
163         GET_EA; \
164         fLOAD(1, 2, u, EA, tmp); \
165         tcg_gen_movi_tl(RdV, 0); \
166         for (int i = 0; i < 2; i++) { \
167             gen_set_half(i, RdV, gen_get_byte(byte, i, tmp, (SIGN))); \
168         } \
169     } while (0)
170 
171 #define fGEN_TCG_L2_loadbzw2_io(SHORTCODE) \
172     fGEN_TCG_loadbXw2(fEA_RI(RsV, siV), false)
173 #define fGEN_TCG_L4_loadbzw2_ur(SHORTCODE) \
174     fGEN_TCG_loadbXw2(fEA_IRs(UiV, RtV, uiV), false)
175 #define fGEN_TCG_L2_loadbsw2_io(SHORTCODE) \
176     fGEN_TCG_loadbXw2(fEA_RI(RsV, siV), true)
177 #define fGEN_TCG_L4_loadbsw2_ur(SHORTCODE) \
178     fGEN_TCG_loadbXw2(fEA_IRs(UiV, RtV, uiV), true)
179 #define fGEN_TCG_L4_loadbzw2_ap(SHORTCODE) \
180     fGEN_TCG_loadbXw2(GET_EA_ap, false)
181 #define fGEN_TCG_L2_loadbzw2_pr(SHORTCODE) \
182     fGEN_TCG_loadbXw2(GET_EA_pr, false)
183 #define fGEN_TCG_L2_loadbzw2_pbr(SHORTCODE) \
184     fGEN_TCG_loadbXw2(GET_EA_pbr, false)
185 #define fGEN_TCG_L2_loadbzw2_pi(SHORTCODE) \
186     fGEN_TCG_loadbXw2(GET_EA_pi, false)
187 #define fGEN_TCG_L4_loadbsw2_ap(SHORTCODE) \
188     fGEN_TCG_loadbXw2(GET_EA_ap, true)
189 #define fGEN_TCG_L2_loadbsw2_pr(SHORTCODE) \
190     fGEN_TCG_loadbXw2(GET_EA_pr, true)
191 #define fGEN_TCG_L2_loadbsw2_pbr(SHORTCODE) \
192     fGEN_TCG_loadbXw2(GET_EA_pbr, true)
193 #define fGEN_TCG_L2_loadbsw2_pi(SHORTCODE) \
194     fGEN_TCG_loadbXw2(GET_EA_pi, true)
195 #define fGEN_TCG_L2_loadbzw2_pci(SHORTCODE) \
196     fGEN_TCG_loadbXw2(GET_EA_pci, false)
197 #define fGEN_TCG_L2_loadbsw2_pci(SHORTCODE) \
198     fGEN_TCG_loadbXw2(GET_EA_pci, true)
199 #define fGEN_TCG_L2_loadbzw2_pcr(SHORTCODE) \
200     fGEN_TCG_loadbXw2(GET_EA_pcr(1), false)
201 #define fGEN_TCG_L2_loadbsw2_pcr(SHORTCODE) \
202     fGEN_TCG_loadbXw2(GET_EA_pcr(1), true)
203 
204 /*
205  * These instructions load 4 bytes and places them in
206  * four halves of the destination register pair.
207  * The GET_EA macro determines the addressing mode.
208  * The SIGN argument determines whether to zero-extend or
209  * sign-extend.
210  */
211 #define fGEN_TCG_loadbXw4(GET_EA, SIGN) \
212     do { \
213         TCGv tmp = tcg_temp_new(); \
214         TCGv byte = tcg_temp_new(); \
215         GET_EA; \
216         fLOAD(1, 4, u, EA, tmp);  \
217         tcg_gen_movi_i64(RddV, 0); \
218         for (int i = 0; i < 4; i++) { \
219             gen_set_half_i64(i, RddV, gen_get_byte(byte, i, tmp, (SIGN)));  \
220         }  \
221     } while (0)
222 
223 #define fGEN_TCG_L2_loadbzw4_io(SHORTCODE) \
224     fGEN_TCG_loadbXw4(fEA_RI(RsV, siV), false)
225 #define fGEN_TCG_L4_loadbzw4_ur(SHORTCODE) \
226     fGEN_TCG_loadbXw4(fEA_IRs(UiV, RtV, uiV), false)
227 #define fGEN_TCG_L2_loadbsw4_io(SHORTCODE) \
228     fGEN_TCG_loadbXw4(fEA_RI(RsV, siV), true)
229 #define fGEN_TCG_L4_loadbsw4_ur(SHORTCODE) \
230     fGEN_TCG_loadbXw4(fEA_IRs(UiV, RtV, uiV), true)
231 #define fGEN_TCG_L2_loadbzw4_pci(SHORTCODE) \
232     fGEN_TCG_loadbXw4(GET_EA_pci, false)
233 #define fGEN_TCG_L2_loadbsw4_pci(SHORTCODE) \
234     fGEN_TCG_loadbXw4(GET_EA_pci, true)
235 #define fGEN_TCG_L2_loadbzw4_pcr(SHORTCODE) \
236     fGEN_TCG_loadbXw4(GET_EA_pcr(2), false)
237 #define fGEN_TCG_L2_loadbsw4_pcr(SHORTCODE) \
238     fGEN_TCG_loadbXw4(GET_EA_pcr(2), true)
239 #define fGEN_TCG_L4_loadbzw4_ap(SHORTCODE) \
240     fGEN_TCG_loadbXw4(GET_EA_ap, false)
241 #define fGEN_TCG_L2_loadbzw4_pr(SHORTCODE) \
242     fGEN_TCG_loadbXw4(GET_EA_pr, false)
243 #define fGEN_TCG_L2_loadbzw4_pbr(SHORTCODE) \
244     fGEN_TCG_loadbXw4(GET_EA_pbr, false)
245 #define fGEN_TCG_L2_loadbzw4_pi(SHORTCODE) \
246     fGEN_TCG_loadbXw4(GET_EA_pi, false)
247 #define fGEN_TCG_L4_loadbsw4_ap(SHORTCODE) \
248     fGEN_TCG_loadbXw4(GET_EA_ap, true)
249 #define fGEN_TCG_L2_loadbsw4_pr(SHORTCODE) \
250     fGEN_TCG_loadbXw4(GET_EA_pr, true)
251 #define fGEN_TCG_L2_loadbsw4_pbr(SHORTCODE) \
252     fGEN_TCG_loadbXw4(GET_EA_pbr, true)
253 #define fGEN_TCG_L2_loadbsw4_pi(SHORTCODE) \
254     fGEN_TCG_loadbXw4(GET_EA_pi, true)
255 
256 /*
257  * These instructions load a half word, shift the destination right by 16 bits
258  * and place the loaded value in the high half word of the destination pair.
259  * The GET_EA macro determines the addressing mode.
260  */
261 #define fGEN_TCG_loadalignh(GET_EA) \
262     do { \
263         TCGv tmp = tcg_temp_new(); \
264         TCGv_i64 tmp_i64 = tcg_temp_new_i64(); \
265         GET_EA;  \
266         fLOAD(1, 2, u, EA, tmp);  \
267         tcg_gen_extu_i32_i64(tmp_i64, tmp); \
268         tcg_gen_shri_i64(RyyV, RyyV, 16); \
269         tcg_gen_deposit_i64(RyyV, RyyV, tmp_i64, 48, 16); \
270     } while (0)
271 
272 #define fGEN_TCG_L4_loadalignh_ur(SHORTCODE) \
273     fGEN_TCG_loadalignh(fEA_IRs(UiV, RtV, uiV))
274 #define fGEN_TCG_L2_loadalignh_io(SHORTCODE) \
275     fGEN_TCG_loadalignh(fEA_RI(RsV, siV))
276 #define fGEN_TCG_L2_loadalignh_pci(SHORTCODE) \
277     fGEN_TCG_loadalignh(GET_EA_pci)
278 #define fGEN_TCG_L2_loadalignh_pcr(SHORTCODE) \
279     fGEN_TCG_loadalignh(GET_EA_pcr(1))
280 #define fGEN_TCG_L4_loadalignh_ap(SHORTCODE) \
281     fGEN_TCG_loadalignh(GET_EA_ap)
282 #define fGEN_TCG_L2_loadalignh_pr(SHORTCODE) \
283     fGEN_TCG_loadalignh(GET_EA_pr)
284 #define fGEN_TCG_L2_loadalignh_pbr(SHORTCODE) \
285     fGEN_TCG_loadalignh(GET_EA_pbr)
286 #define fGEN_TCG_L2_loadalignh_pi(SHORTCODE) \
287     fGEN_TCG_loadalignh(GET_EA_pi)
288 
289 /* Same as above, but loads a byte instead of half word */
290 #define fGEN_TCG_loadalignb(GET_EA) \
291     do { \
292         TCGv tmp = tcg_temp_new(); \
293         TCGv_i64 tmp_i64 = tcg_temp_new_i64(); \
294         GET_EA;  \
295         fLOAD(1, 1, u, EA, tmp);  \
296         tcg_gen_extu_i32_i64(tmp_i64, tmp); \
297         tcg_gen_shri_i64(RyyV, RyyV, 8); \
298         tcg_gen_deposit_i64(RyyV, RyyV, tmp_i64, 56, 8); \
299     } while (0)
300 
301 #define fGEN_TCG_L2_loadalignb_io(SHORTCODE) \
302     fGEN_TCG_loadalignb(fEA_RI(RsV, siV))
303 #define fGEN_TCG_L4_loadalignb_ur(SHORTCODE) \
304     fGEN_TCG_loadalignb(fEA_IRs(UiV, RtV, uiV))
305 #define fGEN_TCG_L2_loadalignb_pci(SHORTCODE) \
306     fGEN_TCG_loadalignb(GET_EA_pci)
307 #define fGEN_TCG_L2_loadalignb_pcr(SHORTCODE) \
308     fGEN_TCG_loadalignb(GET_EA_pcr(0))
309 #define fGEN_TCG_L4_loadalignb_ap(SHORTCODE) \
310     fGEN_TCG_loadalignb(GET_EA_ap)
311 #define fGEN_TCG_L2_loadalignb_pr(SHORTCODE) \
312     fGEN_TCG_loadalignb(GET_EA_pr)
313 #define fGEN_TCG_L2_loadalignb_pbr(SHORTCODE) \
314     fGEN_TCG_loadalignb(GET_EA_pbr)
315 #define fGEN_TCG_L2_loadalignb_pi(SHORTCODE) \
316     fGEN_TCG_loadalignb(GET_EA_pi)
317 
318 /*
319  * Predicated loads
320  * Here is a primer to understand the tag names
321  *
322  * Predicate used
323  *      t        true "old" value                  if (p0) r0 = memb(r2+#0)
324  *      f        false "old" value                 if (!p0) r0 = memb(r2+#0)
325  *      tnew     true "new" value                  if (p0.new) r0 = memb(r2+#0)
326  *      fnew     false "new" value                 if (!p0.new) r0 = memb(r2+#0)
327  */
328 #define fGEN_TCG_PRED_LOAD(GET_EA, PRED, SIZE, SIGN) \
329     do { \
330         TCGv LSB = tcg_temp_new(); \
331         TCGLabel *label = gen_new_label(); \
332         tcg_gen_movi_tl(EA, 0); \
333         PRED;  \
334         CHECK_NOSHUF_PRED(GET_EA, SIZE, LSB); \
335         tcg_gen_brcondi_tl(TCG_COND_EQ, LSB, 0, label); \
336         fLOAD(1, SIZE, SIGN, EA, RdV); \
337         gen_set_label(label); \
338     } while (0)
339 
340 #define fGEN_TCG_L2_ploadrubt_pi(SHORTCODE) \
341     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLD(PtV), 1, u)
342 #define fGEN_TCG_L2_ploadrubf_pi(SHORTCODE) \
343     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLDNOT(PtV), 1, u)
344 #define fGEN_TCG_L2_ploadrubtnew_pi(SHORTCODE) \
345     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEW(PtN), 1, u)
346 #define fGEN_TCG_L2_ploadrubfnew_pi(SHORTCODE) \
347     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEWNOT(PtN), 1, u)
348 #define fGEN_TCG_L2_ploadrbt_pi(SHORTCODE) \
349     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLD(PtV), 1, s)
350 #define fGEN_TCG_L2_ploadrbf_pi(SHORTCODE) \
351     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLDNOT(PtV), 1, s)
352 #define fGEN_TCG_L2_ploadrbtnew_pi(SHORTCODE) \
353     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEW(PtN), 1, s)
354 #define fGEN_TCG_L2_ploadrbfnew_pi(SHORTCODE) \
355     fGEN_TCG_PRED_LOAD({ fEA_REG(RxV); fPM_I(RxV, siV); }, \
356                        fLSBNEWNOT(PtN), 1, s)
357 
358 #define fGEN_TCG_L2_ploadruht_pi(SHORTCODE) \
359     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLD(PtV), 2, u)
360 #define fGEN_TCG_L2_ploadruhf_pi(SHORTCODE) \
361     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLDNOT(PtV), 2, u)
362 #define fGEN_TCG_L2_ploadruhtnew_pi(SHORTCODE) \
363     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEW(PtN), 2, u)
364 #define fGEN_TCG_L2_ploadruhfnew_pi(SHORTCODE) \
365     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEWNOT(PtN), 2, u)
366 #define fGEN_TCG_L2_ploadrht_pi(SHORTCODE) \
367     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLD(PtV), 2, s)
368 #define fGEN_TCG_L2_ploadrhf_pi(SHORTCODE) \
369     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLDNOT(PtV), 2, s)
370 #define fGEN_TCG_L2_ploadrhtnew_pi(SHORTCODE) \
371     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEW(PtN), 2, s)
372 #define fGEN_TCG_L2_ploadrhfnew_pi(SHORTCODE) \
373     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEWNOT(PtN), 2, s)
374 
375 #define fGEN_TCG_L2_ploadrit_pi(SHORTCODE) \
376     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLD(PtV), 4, u)
377 #define fGEN_TCG_L2_ploadrif_pi(SHORTCODE) \
378     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBOLDNOT(PtV), 4, u)
379 #define fGEN_TCG_L2_ploadritnew_pi(SHORTCODE) \
380     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEW(PtN), 4, u)
381 #define fGEN_TCG_L2_ploadrifnew_pi(SHORTCODE) \
382     fGEN_TCG_PRED_LOAD(GET_EA_pi, fLSBNEWNOT(PtN), 4, u)
383 
384 /* Predicated loads into a register pair */
385 #define fGEN_TCG_PRED_LOAD_PAIR(GET_EA, PRED) \
386     do { \
387         TCGv LSB = tcg_temp_new(); \
388         TCGLabel *label = gen_new_label(); \
389         tcg_gen_movi_tl(EA, 0); \
390         PRED;  \
391         CHECK_NOSHUF_PRED(GET_EA, 8, LSB); \
392         tcg_gen_brcondi_tl(TCG_COND_EQ, LSB, 0, label); \
393         fLOAD(1, 8, u, EA, RddV); \
394         gen_set_label(label); \
395     } while (0)
396 
397 #define fGEN_TCG_L2_ploadrdt_pi(SHORTCODE) \
398     fGEN_TCG_PRED_LOAD_PAIR(GET_EA_pi, fLSBOLD(PtV))
399 #define fGEN_TCG_L2_ploadrdf_pi(SHORTCODE) \
400     fGEN_TCG_PRED_LOAD_PAIR(GET_EA_pi, fLSBOLDNOT(PtV))
401 #define fGEN_TCG_L2_ploadrdtnew_pi(SHORTCODE) \
402     fGEN_TCG_PRED_LOAD_PAIR(GET_EA_pi, fLSBNEW(PtN))
403 #define fGEN_TCG_L2_ploadrdfnew_pi(SHORTCODE) \
404     fGEN_TCG_PRED_LOAD_PAIR(GET_EA_pi, fLSBNEWNOT(PtN))
405 
406 /* load-locked and store-locked */
407 #define fGEN_TCG_L2_loadw_locked(SHORTCODE) \
408     SHORTCODE
409 #define fGEN_TCG_L4_loadd_locked(SHORTCODE) \
410     SHORTCODE
411 #define fGEN_TCG_S2_storew_locked(SHORTCODE) \
412     SHORTCODE
413 #define fGEN_TCG_S4_stored_locked(SHORTCODE) \
414     SHORTCODE
415 
416 #define fGEN_TCG_STORE(SHORTCODE) \
417     do { \
418         TCGv HALF G_GNUC_UNUSED = tcg_temp_new(); \
419         TCGv BYTE G_GNUC_UNUSED = tcg_temp_new(); \
420         SHORTCODE; \
421     } while (0)
422 
423 #define fGEN_TCG_STORE_pcr(SHIFT, STORE) \
424     do { \
425         TCGv ireg = tcg_temp_new(); \
426         TCGv HALF G_GNUC_UNUSED = tcg_temp_new(); \
427         TCGv BYTE G_GNUC_UNUSED = tcg_temp_new(); \
428         tcg_gen_mov_tl(EA, RxV); \
429         gen_read_ireg(ireg, MuV, SHIFT); \
430         gen_helper_fcircadd(RxV, RxV, ireg, MuV, hex_gpr[HEX_REG_CS0 + MuN]); \
431         STORE; \
432     } while (0)
433 
434 #define fGEN_TCG_S2_storerb_pbr(SHORTCODE) \
435     fGEN_TCG_STORE(SHORTCODE)
436 #define fGEN_TCG_S2_storerb_pci(SHORTCODE) \
437     fGEN_TCG_STORE(SHORTCODE)
438 #define fGEN_TCG_S2_storerb_pcr(SHORTCODE) \
439     fGEN_TCG_STORE_pcr(0, fSTORE(1, 1, EA, fGETBYTE(0, RtV)))
440 
441 #define fGEN_TCG_S2_storerh_pbr(SHORTCODE) \
442     fGEN_TCG_STORE(SHORTCODE)
443 #define fGEN_TCG_S2_storerh_pci(SHORTCODE) \
444     fGEN_TCG_STORE(SHORTCODE)
445 #define fGEN_TCG_S2_storerh_pcr(SHORTCODE) \
446     fGEN_TCG_STORE_pcr(1, fSTORE(1, 2, EA, fGETHALF(0, RtV)))
447 
448 #define fGEN_TCG_S2_storerf_pbr(SHORTCODE) \
449     fGEN_TCG_STORE(SHORTCODE)
450 #define fGEN_TCG_S2_storerf_pci(SHORTCODE) \
451     fGEN_TCG_STORE(SHORTCODE)
452 #define fGEN_TCG_S2_storerf_pcr(SHORTCODE) \
453     fGEN_TCG_STORE_pcr(1, fSTORE(1, 2, EA, fGETHALF(1, RtV)))
454 
455 #define fGEN_TCG_S2_storeri_pbr(SHORTCODE) \
456     fGEN_TCG_STORE(SHORTCODE)
457 #define fGEN_TCG_S2_storeri_pci(SHORTCODE) \
458     fGEN_TCG_STORE(SHORTCODE)
459 #define fGEN_TCG_S2_storeri_pcr(SHORTCODE) \
460     fGEN_TCG_STORE_pcr(2, fSTORE(1, 4, EA, RtV))
461 
462 #define fGEN_TCG_S2_storerd_pbr(SHORTCODE) \
463     fGEN_TCG_STORE(SHORTCODE)
464 #define fGEN_TCG_S2_storerd_pci(SHORTCODE) \
465     fGEN_TCG_STORE(SHORTCODE)
466 #define fGEN_TCG_S2_storerd_pcr(SHORTCODE) \
467     fGEN_TCG_STORE_pcr(3, fSTORE(1, 8, EA, RttV))
468 
469 #define fGEN_TCG_S2_storerbnew_pbr(SHORTCODE) \
470     fGEN_TCG_STORE(SHORTCODE)
471 #define fGEN_TCG_S2_storerbnew_pci(SHORTCODE) \
472     fGEN_TCG_STORE(SHORTCODE)
473 #define fGEN_TCG_S2_storerbnew_pcr(SHORTCODE) \
474     fGEN_TCG_STORE_pcr(0, fSTORE(1, 1, EA, fGETBYTE(0, NtN)))
475 
476 #define fGEN_TCG_S2_storerhnew_pbr(SHORTCODE) \
477     fGEN_TCG_STORE(SHORTCODE)
478 #define fGEN_TCG_S2_storerhnew_pci(SHORTCODE) \
479     fGEN_TCG_STORE(SHORTCODE)
480 #define fGEN_TCG_S2_storerhnew_pcr(SHORTCODE) \
481     fGEN_TCG_STORE_pcr(1, fSTORE(1, 2, EA, fGETHALF(0, NtN)))
482 
483 #define fGEN_TCG_S2_storerinew_pbr(SHORTCODE) \
484     fGEN_TCG_STORE(SHORTCODE)
485 #define fGEN_TCG_S2_storerinew_pci(SHORTCODE) \
486     fGEN_TCG_STORE(SHORTCODE)
487 #define fGEN_TCG_S2_storerinew_pcr(SHORTCODE) \
488     fGEN_TCG_STORE_pcr(2, fSTORE(1, 4, EA, NtN))
489 
490 /* dczeroa clears the 32 byte cache line at the address given */
491 #define fGEN_TCG_Y2_dczeroa(SHORTCODE) SHORTCODE
492 
493 /* In linux-user mode, these are not modelled, suppress compiler warning */
494 #define fGEN_TCG_Y2_dcinva(SHORTCODE) \
495     do { RsV = RsV; } while (0)
496 #define fGEN_TCG_Y2_dccleaninva(SHORTCODE) \
497     do { RsV = RsV; } while (0)
498 #define fGEN_TCG_Y2_dccleana(SHORTCODE) \
499     do { RsV = RsV; } while (0)
500 #define fGEN_TCG_Y2_icinva(SHORTCODE) \
501     do { RsV = RsV; } while (0)
502 
503 /*
504  * allocframe(#uiV)
505  *     RxV == r29
506  */
507 #define fGEN_TCG_S2_allocframe(SHORTCODE) \
508     gen_allocframe(ctx, RxV, uiV)
509 
510 /* sub-instruction version (no RxV, so handle it manually) */
511 #define fGEN_TCG_SS2_allocframe(SHORTCODE) \
512     do { \
513         TCGv r29 = tcg_temp_new(); \
514         tcg_gen_mov_tl(r29, hex_gpr[HEX_REG_SP]); \
515         gen_allocframe(ctx, r29, uiV); \
516         gen_log_reg_write(ctx, HEX_REG_SP, r29); \
517     } while (0)
518 
519 /*
520  * Rdd32 = deallocframe(Rs32):raw
521  *     RddV == r31:30
522  *     RsV  == r30
523  */
524 #define fGEN_TCG_L2_deallocframe(SHORTCODE) \
525     gen_deallocframe(ctx, RddV, RsV)
526 
527 /* sub-instruction version (no RddV/RsV, so handle it manually) */
528 #define fGEN_TCG_SL2_deallocframe(SHORTCODE) \
529     do { \
530         TCGv_i64 r31_30 = tcg_temp_new_i64(); \
531         gen_deallocframe(ctx, r31_30, hex_gpr[HEX_REG_FP]); \
532         gen_log_reg_write_pair(ctx, HEX_REG_FP, r31_30); \
533     } while (0)
534 
535 /*
536  * dealloc_return
537  * Assembler mapped to
538  * r31:30 = dealloc_return(r30):raw
539  */
540 #define fGEN_TCG_L4_return(SHORTCODE) \
541     gen_return(ctx, RddV, RsV)
542 
543 /*
544  * sub-instruction version (no RddV, so handle it manually)
545  */
546 #define fGEN_TCG_SL2_return(SHORTCODE) \
547     do { \
548         TCGv_i64 RddV = get_result_gpr_pair(ctx, HEX_REG_FP); \
549         gen_return(ctx, RddV, hex_gpr[HEX_REG_FP]); \
550         gen_log_reg_write_pair(ctx, HEX_REG_FP, RddV); \
551     } while (0)
552 
553 /*
554  * Conditional returns follow this naming convention
555  *     _t                 predicate true
556  *     _f                 predicate false
557  *     _tnew_pt           predicate.new true predict taken
558  *     _fnew_pt           predicate.new false predict taken
559  *     _tnew_pnt          predicate.new true predict not taken
560  *     _fnew_pnt          predicate.new false predict not taken
561  * Predictions are not modelled in QEMU
562  *
563  * Example:
564  *     if (p1) r31:30 = dealloc_return(r30):raw
565  */
566 #define fGEN_TCG_L4_return_t(SHORTCODE) \
567     gen_cond_return(ctx, RddV, RsV, PvV, TCG_COND_EQ);
568 #define fGEN_TCG_L4_return_f(SHORTCODE) \
569     gen_cond_return(ctx, RddV, RsV, PvV, TCG_COND_NE)
570 #define fGEN_TCG_L4_return_tnew_pt(SHORTCODE) \
571     gen_cond_return(ctx, RddV, RsV, PvN, TCG_COND_EQ)
572 #define fGEN_TCG_L4_return_fnew_pt(SHORTCODE) \
573     gen_cond_return(ctx, RddV, RsV, PvN, TCG_COND_NE)
574 #define fGEN_TCG_L4_return_tnew_pnt(SHORTCODE) \
575     gen_cond_return(ctx, RddV, RsV, PvN, TCG_COND_EQ)
576 #define fGEN_TCG_L4_return_fnew_pnt(SHORTCODE) \
577     gen_cond_return(ctx, RddV, RsV, PvN, TCG_COND_NE)
578 
579 #define fGEN_TCG_SL2_return_t(SHORTCODE) \
580     gen_cond_return_subinsn(ctx, TCG_COND_EQ, hex_pred[0])
581 #define fGEN_TCG_SL2_return_f(SHORTCODE) \
582     gen_cond_return_subinsn(ctx, TCG_COND_NE, hex_pred[0])
583 #define fGEN_TCG_SL2_return_tnew(SHORTCODE) \
584     gen_cond_return_subinsn(ctx, TCG_COND_EQ, hex_new_pred_value[0])
585 #define fGEN_TCG_SL2_return_fnew(SHORTCODE) \
586     gen_cond_return_subinsn(ctx, TCG_COND_NE, hex_new_pred_value[0])
587 
588 /*
589  * Mathematical operations with more than one definition require
590  * special handling
591  */
592 #define fGEN_TCG_A5_ACS(SHORTCODE) \
593     do { \
594         gen_helper_vacsh_pred(PeV, cpu_env, RxxV, RssV, RttV); \
595         gen_helper_vacsh_val(RxxV, cpu_env, RxxV, RssV, RttV); \
596     } while (0)
597 
598 /*
599  * Approximate reciprocal
600  * r3,p1 = sfrecipa(r0, r1)
601  *
602  * The helper packs the 2 32-bit results into a 64-bit value,
603  * so unpack them into the proper results.
604  */
605 #define fGEN_TCG_F2_sfrecipa(SHORTCODE) \
606     do { \
607         TCGv_i64 tmp = tcg_temp_new_i64(); \
608         gen_helper_sfrecipa(tmp, cpu_env, RsV, RtV);  \
609         tcg_gen_extrh_i64_i32(RdV, tmp); \
610         tcg_gen_extrl_i64_i32(PeV, tmp); \
611     } while (0)
612 
613 /*
614  * Approximation of the reciprocal square root
615  * r1,p0 = sfinvsqrta(r0)
616  *
617  * The helper packs the 2 32-bit results into a 64-bit value,
618  * so unpack them into the proper results.
619  */
620 #define fGEN_TCG_F2_sfinvsqrta(SHORTCODE) \
621     do { \
622         TCGv_i64 tmp = tcg_temp_new_i64(); \
623         gen_helper_sfinvsqrta(tmp, cpu_env, RsV); \
624         tcg_gen_extrh_i64_i32(RdV, tmp); \
625         tcg_gen_extrl_i64_i32(PeV, tmp); \
626     } while (0)
627 
628 /*
629  * Add or subtract with carry.
630  * Predicate register is used as an extra input and output.
631  * r5:4 = add(r1:0, r3:2, p1):carry
632  */
633 #define fGEN_TCG_A4_addp_c(SHORTCODE) \
634     do { \
635         TCGv_i64 carry = tcg_temp_new_i64(); \
636         TCGv_i64 zero = tcg_constant_i64(0); \
637         tcg_gen_extu_i32_i64(carry, PxV); \
638         tcg_gen_andi_i64(carry, carry, 1); \
639         tcg_gen_add2_i64(RddV, carry, RssV, zero, carry, zero); \
640         tcg_gen_add2_i64(RddV, carry, RddV, carry, RttV, zero); \
641         tcg_gen_extrl_i64_i32(PxV, carry); \
642         gen_8bitsof(PxV, PxV); \
643     } while (0)
644 
645 /* r5:4 = sub(r1:0, r3:2, p1):carry */
646 #define fGEN_TCG_A4_subp_c(SHORTCODE) \
647     do { \
648         TCGv_i64 carry = tcg_temp_new_i64(); \
649         TCGv_i64 zero = tcg_constant_i64(0); \
650         TCGv_i64 not_RttV = tcg_temp_new_i64(); \
651         tcg_gen_extu_i32_i64(carry, PxV); \
652         tcg_gen_andi_i64(carry, carry, 1); \
653         tcg_gen_not_i64(not_RttV, RttV); \
654         tcg_gen_add2_i64(RddV, carry, RssV, zero, carry, zero); \
655         tcg_gen_add2_i64(RddV, carry, RddV, carry, not_RttV, zero); \
656         tcg_gen_extrl_i64_i32(PxV, carry); \
657         gen_8bitsof(PxV, PxV); \
658     } while (0)
659 
660 /*
661  * Compare each of the 8 unsigned bytes
662  * The minimum is placed in each byte of the destination.
663  * Each bit of the predicate is set true if the bit from the first operand
664  * is greater than the bit from the second operand.
665  * r5:4,p1 = vminub(r1:0, r3:2)
666  */
667 #define fGEN_TCG_A6_vminub_RdP(SHORTCODE) \
668     do { \
669         TCGv left = tcg_temp_new(); \
670         TCGv right = tcg_temp_new(); \
671         TCGv tmp = tcg_temp_new(); \
672         tcg_gen_movi_tl(PeV, 0); \
673         tcg_gen_movi_i64(RddV, 0); \
674         for (int i = 0; i < 8; i++) { \
675             gen_get_byte_i64(left, i, RttV, false); \
676             gen_get_byte_i64(right, i, RssV, false); \
677             tcg_gen_setcond_tl(TCG_COND_GT, tmp, left, right); \
678             tcg_gen_deposit_tl(PeV, PeV, tmp, i, 1); \
679             tcg_gen_umin_tl(tmp, left, right); \
680             gen_set_byte_i64(i, RddV, tmp); \
681         } \
682     } while (0)
683 
684 #define fGEN_TCG_J2_call(SHORTCODE) \
685     gen_call(ctx, riV)
686 #define fGEN_TCG_J2_callr(SHORTCODE) \
687     gen_callr(ctx, RsV)
688 #define fGEN_TCG_J2_callrh(SHORTCODE) \
689     gen_callr(ctx, RsV)
690 
691 #define fGEN_TCG_J2_callt(SHORTCODE) \
692     gen_cond_call(ctx, PuV, TCG_COND_EQ, riV)
693 #define fGEN_TCG_J2_callf(SHORTCODE) \
694     gen_cond_call(ctx, PuV, TCG_COND_NE, riV)
695 #define fGEN_TCG_J2_callrt(SHORTCODE) \
696     gen_cond_callr(ctx, TCG_COND_EQ, PuV, RsV)
697 #define fGEN_TCG_J2_callrf(SHORTCODE) \
698     gen_cond_callr(ctx, TCG_COND_NE, PuV, RsV)
699 
700 #define fGEN_TCG_J2_loop0r(SHORTCODE) \
701     gen_loop0r(ctx, RsV, riV)
702 #define fGEN_TCG_J2_loop1r(SHORTCODE) \
703     gen_loop1r(ctx, RsV, riV)
704 #define fGEN_TCG_J2_loop0i(SHORTCODE) \
705     gen_loop0i(ctx, UiV, riV)
706 #define fGEN_TCG_J2_loop1i(SHORTCODE) \
707     gen_loop1i(ctx, UiV, riV)
708 #define fGEN_TCG_J2_ploop1sr(SHORTCODE) \
709     gen_ploopNsr(ctx, 1, RsV, riV)
710 #define fGEN_TCG_J2_ploop1si(SHORTCODE) \
711     gen_ploopNsi(ctx, 1, UiV, riV)
712 #define fGEN_TCG_J2_ploop2sr(SHORTCODE) \
713     gen_ploopNsr(ctx, 2, RsV, riV)
714 #define fGEN_TCG_J2_ploop2si(SHORTCODE) \
715     gen_ploopNsi(ctx, 2, UiV, riV)
716 #define fGEN_TCG_J2_ploop3sr(SHORTCODE) \
717     gen_ploopNsr(ctx, 3, RsV, riV)
718 #define fGEN_TCG_J2_ploop3si(SHORTCODE) \
719     gen_ploopNsi(ctx, 3, UiV, riV)
720 
721 #define fGEN_TCG_J2_endloop0(SHORTCODE) \
722     gen_endloop0(ctx)
723 #define fGEN_TCG_J2_endloop1(SHORTCODE) \
724     gen_endloop1(ctx)
725 #define fGEN_TCG_J2_endloop01(SHORTCODE) \
726     gen_endloop01(ctx)
727 
728 /*
729  * Compound compare and jump instructions
730  * Here is a primer to understand the tag names
731  *
732  * Comparison
733  *      cmpeqi   compare equal to an immediate
734  *      cmpgti   compare greater than an immediate
735  *      cmpgtiu  compare greater than an unsigned immediate
736  *      cmpeqn1  compare equal to negative 1
737  *      cmpgtn1  compare greater than negative 1
738  *      cmpeq    compare equal (two registers)
739  *      cmpgtu   compare greater than unsigned (two registers)
740  *      tstbit0  test bit zero
741  *
742  * Condition
743  *      tp0      p0 is true     p0 = cmp.eq(r0,#5); if (p0.new) jump:nt address
744  *      fp0      p0 is false    p0 = cmp.eq(r0,#5); if (!p0.new) jump:nt address
745  *      tp1      p1 is true     p1 = cmp.eq(r0,#5); if (p1.new) jump:nt address
746  *      fp1      p1 is false    p1 = cmp.eq(r0,#5); if (!p1.new) jump:nt address
747  *
748  * Prediction (not modelled in qemu)
749  *      _nt      not taken
750  *      _t       taken
751  */
752 #define fGEN_TCG_J4_cmpeq_tp0_jump_t(SHORTCODE) \
753     gen_cmpnd_cmp_jmp_t(ctx, 0, TCG_COND_EQ, RsV, RtV, riV)
754 #define fGEN_TCG_J4_cmpeq_tp0_jump_nt(SHORTCODE) \
755     gen_cmpnd_cmp_jmp_t(ctx, 0, TCG_COND_EQ, RsV, RtV, riV)
756 #define fGEN_TCG_J4_cmpeq_fp0_jump_t(SHORTCODE) \
757     gen_cmpnd_cmp_jmp_f(ctx, 0, TCG_COND_EQ, RsV, RtV, riV)
758 #define fGEN_TCG_J4_cmpeq_fp0_jump_nt(SHORTCODE) \
759     gen_cmpnd_cmp_jmp_f(ctx, 0, TCG_COND_EQ, RsV, RtV, riV)
760 #define fGEN_TCG_J4_cmpeq_tp1_jump_t(SHORTCODE) \
761     gen_cmpnd_cmp_jmp_t(ctx, 1, TCG_COND_EQ, RsV, RtV, riV)
762 #define fGEN_TCG_J4_cmpeq_tp1_jump_nt(SHORTCODE) \
763     gen_cmpnd_cmp_jmp_t(ctx, 1, TCG_COND_EQ, RsV, RtV, riV)
764 #define fGEN_TCG_J4_cmpeq_fp1_jump_t(SHORTCODE) \
765     gen_cmpnd_cmp_jmp_f(ctx, 1, TCG_COND_EQ, RsV, RtV, riV)
766 #define fGEN_TCG_J4_cmpeq_fp1_jump_nt(SHORTCODE) \
767     gen_cmpnd_cmp_jmp_f(ctx, 1, TCG_COND_EQ, RsV, RtV, riV)
768 
769 #define fGEN_TCG_J4_cmpgt_tp0_jump_t(SHORTCODE) \
770     gen_cmpnd_cmp_jmp_t(ctx, 0, TCG_COND_GT, RsV, RtV, riV)
771 #define fGEN_TCG_J4_cmpgt_tp0_jump_nt(SHORTCODE) \
772     gen_cmpnd_cmp_jmp_t(ctx, 0, TCG_COND_GT, RsV, RtV, riV)
773 #define fGEN_TCG_J4_cmpgt_fp0_jump_t(SHORTCODE) \
774     gen_cmpnd_cmp_jmp_f(ctx, 0, TCG_COND_GT, RsV, RtV, riV)
775 #define fGEN_TCG_J4_cmpgt_fp0_jump_nt(SHORTCODE) \
776     gen_cmpnd_cmp_jmp_f(ctx, 0, TCG_COND_GT, RsV, RtV, riV)
777 #define fGEN_TCG_J4_cmpgt_tp1_jump_t(SHORTCODE) \
778     gen_cmpnd_cmp_jmp_t(ctx, 1, TCG_COND_GT, RsV, RtV, riV)
779 #define fGEN_TCG_J4_cmpgt_tp1_jump_nt(SHORTCODE) \
780     gen_cmpnd_cmp_jmp_t(ctx, 1, TCG_COND_GT, RsV, RtV, riV)
781 #define fGEN_TCG_J4_cmpgt_fp1_jump_t(SHORTCODE) \
782     gen_cmpnd_cmp_jmp_f(ctx, 1, TCG_COND_GT, RsV, RtV, riV)
783 #define fGEN_TCG_J4_cmpgt_fp1_jump_nt(SHORTCODE) \
784     gen_cmpnd_cmp_jmp_f(ctx, 1, TCG_COND_GT, RsV, RtV, riV)
785 
786 #define fGEN_TCG_J4_cmpgtu_tp0_jump_t(SHORTCODE) \
787     gen_cmpnd_cmp_jmp_t(ctx, 0, TCG_COND_GTU, RsV, RtV, riV)
788 #define fGEN_TCG_J4_cmpgtu_tp0_jump_nt(SHORTCODE) \
789     gen_cmpnd_cmp_jmp_t(ctx, 0, TCG_COND_GTU, RsV, RtV, riV)
790 #define fGEN_TCG_J4_cmpgtu_fp0_jump_t(SHORTCODE) \
791     gen_cmpnd_cmp_jmp_f(ctx, 0, TCG_COND_GTU, RsV, RtV, riV)
792 #define fGEN_TCG_J4_cmpgtu_fp0_jump_nt(SHORTCODE) \
793     gen_cmpnd_cmp_jmp_f(ctx, 0, TCG_COND_GTU, RsV, RtV, riV)
794 #define fGEN_TCG_J4_cmpgtu_tp1_jump_t(SHORTCODE) \
795     gen_cmpnd_cmp_jmp_t(ctx, 1, TCG_COND_GTU, RsV, RtV, riV)
796 #define fGEN_TCG_J4_cmpgtu_tp1_jump_nt(SHORTCODE) \
797     gen_cmpnd_cmp_jmp_t(ctx, 1, TCG_COND_GTU, RsV, RtV, riV)
798 #define fGEN_TCG_J4_cmpgtu_fp1_jump_t(SHORTCODE) \
799     gen_cmpnd_cmp_jmp_f(ctx, 1, TCG_COND_GTU, RsV, RtV, riV)
800 #define fGEN_TCG_J4_cmpgtu_fp1_jump_nt(SHORTCODE) \
801     gen_cmpnd_cmp_jmp_f(ctx, 1, TCG_COND_GTU, RsV, RtV, riV)
802 
803 #define fGEN_TCG_J4_cmpeqi_tp0_jump_t(SHORTCODE) \
804     gen_cmpnd_cmpi_jmp_t(ctx, 0, TCG_COND_EQ, RsV, UiV, riV)
805 #define fGEN_TCG_J4_cmpeqi_tp0_jump_nt(SHORTCODE) \
806     gen_cmpnd_cmpi_jmp_t(ctx, 0, TCG_COND_EQ, RsV, UiV, riV)
807 #define fGEN_TCG_J4_cmpeqi_fp0_jump_t(SHORTCODE) \
808     gen_cmpnd_cmpi_jmp_f(ctx, 0, TCG_COND_EQ, RsV, UiV, riV)
809 #define fGEN_TCG_J4_cmpeqi_fp0_jump_nt(SHORTCODE) \
810     gen_cmpnd_cmpi_jmp_f(ctx, 0, TCG_COND_EQ, RsV, UiV, riV)
811 #define fGEN_TCG_J4_cmpeqi_tp1_jump_t(SHORTCODE) \
812     gen_cmpnd_cmpi_jmp_t(ctx, 1, TCG_COND_EQ, RsV, UiV, riV)
813 #define fGEN_TCG_J4_cmpeqi_tp1_jump_nt(SHORTCODE) \
814     gen_cmpnd_cmpi_jmp_t(ctx, 1, TCG_COND_EQ, RsV, UiV, riV)
815 #define fGEN_TCG_J4_cmpeqi_fp1_jump_t(SHORTCODE) \
816     gen_cmpnd_cmpi_jmp_f(ctx, 1, TCG_COND_EQ, RsV, UiV, riV)
817 #define fGEN_TCG_J4_cmpeqi_fp1_jump_nt(SHORTCODE) \
818     gen_cmpnd_cmpi_jmp_f(ctx, 1, TCG_COND_EQ, RsV, UiV, riV)
819 
820 #define fGEN_TCG_J4_cmpgti_tp0_jump_t(SHORTCODE) \
821     gen_cmpnd_cmpi_jmp_t(ctx, 0, TCG_COND_GT, RsV, UiV, riV)
822 #define fGEN_TCG_J4_cmpgti_tp0_jump_nt(SHORTCODE) \
823     gen_cmpnd_cmpi_jmp_t(ctx, 0, TCG_COND_GT, RsV, UiV, riV)
824 #define fGEN_TCG_J4_cmpgti_fp0_jump_t(SHORTCODE) \
825     gen_cmpnd_cmpi_jmp_f(ctx, 0, TCG_COND_GT, RsV, UiV, riV)
826 #define fGEN_TCG_J4_cmpgti_fp0_jump_nt(SHORTCODE) \
827     gen_cmpnd_cmpi_jmp_f(ctx, 0, TCG_COND_GT, RsV, UiV, riV)
828 #define fGEN_TCG_J4_cmpgti_tp1_jump_t(SHORTCODE) \
829     gen_cmpnd_cmpi_jmp_t(ctx, 1, TCG_COND_GT, RsV, UiV, riV)
830 #define fGEN_TCG_J4_cmpgti_tp1_jump_nt(SHORTCODE) \
831     gen_cmpnd_cmpi_jmp_t(ctx, 1, TCG_COND_GT, RsV, UiV, riV)
832 #define fGEN_TCG_J4_cmpgti_fp1_jump_t(SHORTCODE) \
833     gen_cmpnd_cmpi_jmp_f(ctx, 1, TCG_COND_GT, RsV, UiV, riV)
834 #define fGEN_TCG_J4_cmpgti_fp1_jump_nt(SHORTCODE) \
835     gen_cmpnd_cmpi_jmp_f(ctx, 1, TCG_COND_GT, RsV, UiV, riV)
836 
837 #define fGEN_TCG_J4_cmpgtui_tp0_jump_t(SHORTCODE) \
838     gen_cmpnd_cmpi_jmp_t(ctx, 0, TCG_COND_GTU, RsV, UiV, riV)
839 #define fGEN_TCG_J4_cmpgtui_tp0_jump_nt(SHORTCODE) \
840     gen_cmpnd_cmpi_jmp_t(ctx, 0, TCG_COND_GTU, RsV, UiV, riV)
841 #define fGEN_TCG_J4_cmpgtui_fp0_jump_t(SHORTCODE) \
842     gen_cmpnd_cmpi_jmp_f(ctx, 0, TCG_COND_GTU, RsV, UiV, riV)
843 #define fGEN_TCG_J4_cmpgtui_fp0_jump_nt(SHORTCODE) \
844     gen_cmpnd_cmpi_jmp_f(ctx, 0, TCG_COND_GTU, RsV, UiV, riV)
845 #define fGEN_TCG_J4_cmpgtui_tp1_jump_t(SHORTCODE) \
846     gen_cmpnd_cmpi_jmp_t(ctx, 1, TCG_COND_GTU, RsV, UiV, riV)
847 #define fGEN_TCG_J4_cmpgtui_tp1_jump_nt(SHORTCODE) \
848     gen_cmpnd_cmpi_jmp_t(ctx, 1, TCG_COND_GTU, RsV, UiV, riV)
849 #define fGEN_TCG_J4_cmpgtui_fp1_jump_t(SHORTCODE) \
850     gen_cmpnd_cmpi_jmp_f(ctx, 1, TCG_COND_GTU, RsV, UiV, riV)
851 #define fGEN_TCG_J4_cmpgtui_fp1_jump_nt(SHORTCODE) \
852     gen_cmpnd_cmpi_jmp_f(ctx, 1, TCG_COND_GTU, RsV, UiV, riV)
853 
854 #define fGEN_TCG_J4_cmpeqn1_tp0_jump_t(SHORTCODE) \
855     gen_cmpnd_cmp_n1_jmp_t(ctx, 0, TCG_COND_EQ, RsV, riV)
856 #define fGEN_TCG_J4_cmpeqn1_tp0_jump_nt(SHORTCODE) \
857     gen_cmpnd_cmp_n1_jmp_t(ctx, 0, TCG_COND_EQ, RsV, riV)
858 #define fGEN_TCG_J4_cmpeqn1_fp0_jump_t(SHORTCODE) \
859     gen_cmpnd_cmp_n1_jmp_f(ctx, 0, TCG_COND_EQ, RsV, riV)
860 #define fGEN_TCG_J4_cmpeqn1_fp0_jump_nt(SHORTCODE) \
861     gen_cmpnd_cmp_n1_jmp_f(ctx, 0, TCG_COND_EQ, RsV, riV)
862 #define fGEN_TCG_J4_cmpeqn1_tp1_jump_t(SHORTCODE) \
863     gen_cmpnd_cmp_n1_jmp_t(ctx, 1, TCG_COND_EQ, RsV, riV)
864 #define fGEN_TCG_J4_cmpeqn1_tp1_jump_nt(SHORTCODE) \
865     gen_cmpnd_cmp_n1_jmp_t(ctx, 1, TCG_COND_EQ, RsV, riV)
866 #define fGEN_TCG_J4_cmpeqn1_fp1_jump_t(SHORTCODE) \
867     gen_cmpnd_cmp_n1_jmp_f(ctx, 1, TCG_COND_EQ, RsV, riV)
868 #define fGEN_TCG_J4_cmpeqn1_fp1_jump_nt(SHORTCODE) \
869     gen_cmpnd_cmp_n1_jmp_f(ctx, 1, TCG_COND_EQ, RsV, riV)
870 
871 #define fGEN_TCG_J4_cmpgtn1_tp0_jump_t(SHORTCODE) \
872     gen_cmpnd_cmp_n1_jmp_t(ctx, 0, TCG_COND_GT, RsV, riV)
873 #define fGEN_TCG_J4_cmpgtn1_tp0_jump_nt(SHORTCODE) \
874     gen_cmpnd_cmp_n1_jmp_t(ctx, 0, TCG_COND_GT, RsV, riV)
875 #define fGEN_TCG_J4_cmpgtn1_fp0_jump_t(SHORTCODE) \
876     gen_cmpnd_cmp_n1_jmp_f(ctx, 0, TCG_COND_GT, RsV, riV)
877 #define fGEN_TCG_J4_cmpgtn1_fp0_jump_nt(SHORTCODE) \
878     gen_cmpnd_cmp_n1_jmp_f(ctx, 0, TCG_COND_GT, RsV, riV)
879 #define fGEN_TCG_J4_cmpgtn1_tp1_jump_t(SHORTCODE) \
880     gen_cmpnd_cmp_n1_jmp_t(ctx, 1, TCG_COND_GT, RsV, riV)
881 #define fGEN_TCG_J4_cmpgtn1_tp1_jump_nt(SHORTCODE) \
882     gen_cmpnd_cmp_n1_jmp_t(ctx, 1, TCG_COND_GT, RsV, riV)
883 #define fGEN_TCG_J4_cmpgtn1_fp1_jump_t(SHORTCODE) \
884     gen_cmpnd_cmp_n1_jmp_f(ctx, 1, TCG_COND_GT, RsV, riV)
885 #define fGEN_TCG_J4_cmpgtn1_fp1_jump_nt(SHORTCODE) \
886     gen_cmpnd_cmp_n1_jmp_f(ctx, 1, TCG_COND_GT, RsV, riV)
887 
888 #define fGEN_TCG_J4_tstbit0_tp0_jump_nt(SHORTCODE) \
889     gen_cmpnd_tstbit0_jmp(ctx, 0, RsV, TCG_COND_EQ, riV)
890 #define fGEN_TCG_J4_tstbit0_tp0_jump_t(SHORTCODE) \
891     gen_cmpnd_tstbit0_jmp(ctx, 0, RsV, TCG_COND_EQ, riV)
892 #define fGEN_TCG_J4_tstbit0_fp0_jump_nt(SHORTCODE) \
893     gen_cmpnd_tstbit0_jmp(ctx, 0, RsV, TCG_COND_NE, riV)
894 #define fGEN_TCG_J4_tstbit0_fp0_jump_t(SHORTCODE) \
895     gen_cmpnd_tstbit0_jmp(ctx, 0, RsV, TCG_COND_NE, riV)
896 #define fGEN_TCG_J4_tstbit0_tp1_jump_nt(SHORTCODE) \
897     gen_cmpnd_tstbit0_jmp(ctx, 1, RsV, TCG_COND_EQ, riV)
898 #define fGEN_TCG_J4_tstbit0_tp1_jump_t(SHORTCODE) \
899     gen_cmpnd_tstbit0_jmp(ctx, 1, RsV, TCG_COND_EQ, riV)
900 #define fGEN_TCG_J4_tstbit0_fp1_jump_nt(SHORTCODE) \
901     gen_cmpnd_tstbit0_jmp(ctx, 1, RsV, TCG_COND_NE, riV)
902 #define fGEN_TCG_J4_tstbit0_fp1_jump_t(SHORTCODE) \
903     gen_cmpnd_tstbit0_jmp(ctx, 1, RsV, TCG_COND_NE, riV)
904 
905 #define fGEN_TCG_J2_jump(SHORTCODE) \
906     gen_jump(ctx, riV)
907 #define fGEN_TCG_J2_jumpr(SHORTCODE) \
908     gen_jumpr(ctx, RsV)
909 #define fGEN_TCG_J2_jumprh(SHORTCODE) \
910     gen_jumpr(ctx, RsV)
911 #define fGEN_TCG_J4_jumpseti(SHORTCODE) \
912     do { \
913         tcg_gen_movi_tl(RdV, UiV); \
914         gen_jump(ctx, riV); \
915     } while (0)
916 
917 #define fGEN_TCG_cond_jumpt(COND) \
918     do { \
919         TCGv LSB = tcg_temp_new(); \
920         COND; \
921         gen_cond_jump(ctx, TCG_COND_EQ, LSB, riV); \
922     } while (0)
923 #define fGEN_TCG_cond_jumpf(COND) \
924     do { \
925         TCGv LSB = tcg_temp_new(); \
926         COND; \
927         gen_cond_jump(ctx, TCG_COND_NE, LSB, riV); \
928     } while (0)
929 
930 #define fGEN_TCG_J2_jumpt(SHORTCODE) \
931     fGEN_TCG_cond_jumpt(fLSBOLD(PuV))
932 #define fGEN_TCG_J2_jumptpt(SHORTCODE) \
933     fGEN_TCG_cond_jumpt(fLSBOLD(PuV))
934 #define fGEN_TCG_J2_jumpf(SHORTCODE) \
935     fGEN_TCG_cond_jumpf(fLSBOLD(PuV))
936 #define fGEN_TCG_J2_jumpfpt(SHORTCODE) \
937     fGEN_TCG_cond_jumpf(fLSBOLD(PuV))
938 #define fGEN_TCG_J2_jumptnew(SHORTCODE) \
939     gen_cond_jump(ctx, TCG_COND_EQ, PuN, riV)
940 #define fGEN_TCG_J2_jumptnewpt(SHORTCODE) \
941     gen_cond_jump(ctx, TCG_COND_EQ, PuN, riV)
942 #define fGEN_TCG_J2_jumpfnewpt(SHORTCODE) \
943     fGEN_TCG_cond_jumpf(fLSBNEW(PuN))
944 #define fGEN_TCG_J2_jumpfnew(SHORTCODE) \
945     fGEN_TCG_cond_jumpf(fLSBNEW(PuN))
946 #define fGEN_TCG_J2_jumprz(SHORTCODE) \
947     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_NE, LSB, RsV, 0))
948 #define fGEN_TCG_J2_jumprzpt(SHORTCODE) \
949     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_NE, LSB, RsV, 0))
950 #define fGEN_TCG_J2_jumprnz(SHORTCODE) \
951     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_EQ, LSB, RsV, 0))
952 #define fGEN_TCG_J2_jumprnzpt(SHORTCODE) \
953     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_EQ, LSB, RsV, 0))
954 #define fGEN_TCG_J2_jumprgtez(SHORTCODE) \
955     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_GE, LSB, RsV, 0))
956 #define fGEN_TCG_J2_jumprgtezpt(SHORTCODE) \
957     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_GE, LSB, RsV, 0))
958 #define fGEN_TCG_J2_jumprltez(SHORTCODE) \
959     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_LE, LSB, RsV, 0))
960 #define fGEN_TCG_J2_jumprltezpt(SHORTCODE) \
961     fGEN_TCG_cond_jumpt(tcg_gen_setcondi_tl(TCG_COND_LE, LSB, RsV, 0))
962 
963 #define fGEN_TCG_cond_jumprt(COND) \
964     do { \
965         TCGv LSB = tcg_temp_new(); \
966         COND; \
967         gen_cond_jumpr(ctx, RsV, TCG_COND_EQ, LSB); \
968     } while (0)
969 #define fGEN_TCG_cond_jumprf(COND) \
970     do { \
971         TCGv LSB = tcg_temp_new(); \
972         COND; \
973         gen_cond_jumpr(ctx, RsV, TCG_COND_NE, LSB); \
974     } while (0)
975 
976 #define fGEN_TCG_J2_jumprt(SHORTCODE) \
977     fGEN_TCG_cond_jumprt(fLSBOLD(PuV))
978 #define fGEN_TCG_J2_jumprtpt(SHORTCODE) \
979     fGEN_TCG_cond_jumprt(fLSBOLD(PuV))
980 #define fGEN_TCG_J2_jumprf(SHORTCODE) \
981     fGEN_TCG_cond_jumprf(fLSBOLD(PuV))
982 #define fGEN_TCG_J2_jumprfpt(SHORTCODE) \
983     fGEN_TCG_cond_jumprf(fLSBOLD(PuV))
984 #define fGEN_TCG_J2_jumprtnew(SHORTCODE) \
985     fGEN_TCG_cond_jumprt(fLSBNEW(PuN))
986 #define fGEN_TCG_J2_jumprtnewpt(SHORTCODE) \
987     fGEN_TCG_cond_jumprt(fLSBNEW(PuN))
988 #define fGEN_TCG_J2_jumprfnew(SHORTCODE) \
989     fGEN_TCG_cond_jumprf(fLSBNEW(PuN))
990 #define fGEN_TCG_J2_jumprfnewpt(SHORTCODE) \
991     fGEN_TCG_cond_jumprf(fLSBNEW(PuN))
992 
993 /*
994  * New value compare & jump instructions
995  * if ([!]COND(r0.new, r1) jump:t address
996  * if ([!]COND(r0.new, #7) jump:t address
997  */
998 #define fGEN_TCG_J4_cmpgt_t_jumpnv_t(SHORTCODE) \
999     gen_cmp_jumpnv(ctx, TCG_COND_GT, NsN, RtV, riV)
1000 #define fGEN_TCG_J4_cmpgt_t_jumpnv_nt(SHORTCODE) \
1001     gen_cmp_jumpnv(ctx, TCG_COND_GT, NsN, RtV, riV)
1002 #define fGEN_TCG_J4_cmpgt_f_jumpnv_t(SHORTCODE) \
1003     gen_cmp_jumpnv(ctx, TCG_COND_LE, NsN, RtV, riV)
1004 #define fGEN_TCG_J4_cmpgt_f_jumpnv_nt(SHORTCODE) \
1005     gen_cmp_jumpnv(ctx, TCG_COND_LE, NsN, RtV, riV)
1006 
1007 #define fGEN_TCG_J4_cmpeq_t_jumpnv_t(SHORTCODE) \
1008     gen_cmp_jumpnv(ctx, TCG_COND_EQ, NsN, RtV, riV)
1009 #define fGEN_TCG_J4_cmpeq_t_jumpnv_nt(SHORTCODE) \
1010     gen_cmp_jumpnv(ctx, TCG_COND_EQ, NsN, RtV, riV)
1011 #define fGEN_TCG_J4_cmpeq_f_jumpnv_t(SHORTCODE) \
1012     gen_cmp_jumpnv(ctx, TCG_COND_NE, NsN, RtV, riV)
1013 #define fGEN_TCG_J4_cmpeq_f_jumpnv_nt(SHORTCODE) \
1014     gen_cmp_jumpnv(ctx, TCG_COND_NE, NsN, RtV, riV)
1015 
1016 #define fGEN_TCG_J4_cmplt_t_jumpnv_t(SHORTCODE) \
1017     gen_cmp_jumpnv(ctx, TCG_COND_LT, NsN, RtV, riV)
1018 #define fGEN_TCG_J4_cmplt_t_jumpnv_nt(SHORTCODE) \
1019     gen_cmp_jumpnv(ctx, TCG_COND_LT, NsN, RtV, riV)
1020 #define fGEN_TCG_J4_cmplt_f_jumpnv_t(SHORTCODE) \
1021     gen_cmp_jumpnv(ctx, TCG_COND_GE, NsN, RtV, riV)
1022 #define fGEN_TCG_J4_cmplt_f_jumpnv_nt(SHORTCODE) \
1023     gen_cmp_jumpnv(ctx, TCG_COND_GE, NsN, RtV, riV)
1024 
1025 #define fGEN_TCG_J4_cmpeqi_t_jumpnv_t(SHORTCODE) \
1026     gen_cmpi_jumpnv(ctx, TCG_COND_EQ, NsN, UiV, riV)
1027 #define fGEN_TCG_J4_cmpeqi_t_jumpnv_nt(SHORTCODE) \
1028     gen_cmpi_jumpnv(ctx, TCG_COND_EQ, NsN, UiV, riV)
1029 #define fGEN_TCG_J4_cmpeqi_f_jumpnv_t(SHORTCODE) \
1030     gen_cmpi_jumpnv(ctx, TCG_COND_NE, NsN, UiV, riV)
1031 #define fGEN_TCG_J4_cmpeqi_f_jumpnv_nt(SHORTCODE) \
1032     gen_cmpi_jumpnv(ctx, TCG_COND_NE, NsN, UiV, riV)
1033 
1034 #define fGEN_TCG_J4_cmpgti_t_jumpnv_t(SHORTCODE) \
1035     gen_cmpi_jumpnv(ctx, TCG_COND_GT, NsN, UiV, riV)
1036 #define fGEN_TCG_J4_cmpgti_t_jumpnv_nt(SHORTCODE) \
1037     gen_cmpi_jumpnv(ctx, TCG_COND_GT, NsN, UiV, riV)
1038 #define fGEN_TCG_J4_cmpgti_f_jumpnv_t(SHORTCODE) \
1039     gen_cmpi_jumpnv(ctx, TCG_COND_LE, NsN, UiV, riV)
1040 #define fGEN_TCG_J4_cmpgti_f_jumpnv_nt(SHORTCODE) \
1041     gen_cmpi_jumpnv(ctx, TCG_COND_LE, NsN, UiV, riV)
1042 
1043 #define fGEN_TCG_J4_cmpltu_t_jumpnv_t(SHORTCODE) \
1044     gen_cmp_jumpnv(ctx, TCG_COND_LTU, NsN, RtV, riV)
1045 #define fGEN_TCG_J4_cmpltu_t_jumpnv_nt(SHORTCODE) \
1046     gen_cmp_jumpnv(ctx, TCG_COND_LTU, NsN, RtV, riV)
1047 #define fGEN_TCG_J4_cmpltu_f_jumpnv_t(SHORTCODE) \
1048     gen_cmp_jumpnv(ctx, TCG_COND_GEU, NsN, RtV, riV)
1049 #define fGEN_TCG_J4_cmpltu_f_jumpnv_nt(SHORTCODE) \
1050     gen_cmp_jumpnv(ctx, TCG_COND_GEU, NsN, RtV, riV)
1051 
1052 #define fGEN_TCG_J4_cmpgtui_t_jumpnv_t(SHORTCODE) \
1053     gen_cmpi_jumpnv(ctx, TCG_COND_GTU, NsN, UiV, riV)
1054 #define fGEN_TCG_J4_cmpgtui_t_jumpnv_nt(SHORTCODE) \
1055     gen_cmpi_jumpnv(ctx, TCG_COND_GTU, NsN, UiV, riV)
1056 #define fGEN_TCG_J4_cmpgtui_f_jumpnv_t(SHORTCODE) \
1057     gen_cmpi_jumpnv(ctx, TCG_COND_LEU, NsN, UiV, riV)
1058 #define fGEN_TCG_J4_cmpgtui_f_jumpnv_nt(SHORTCODE) \
1059     gen_cmpi_jumpnv(ctx, TCG_COND_LEU, NsN, UiV, riV)
1060 
1061 #define fGEN_TCG_J4_cmpgtu_t_jumpnv_t(SHORTCODE) \
1062     gen_cmp_jumpnv(ctx, TCG_COND_GTU, NsN, RtV, riV)
1063 #define fGEN_TCG_J4_cmpgtu_t_jumpnv_nt(SHORTCODE) \
1064     gen_cmp_jumpnv(ctx, TCG_COND_GTU, NsN, RtV, riV)
1065 #define fGEN_TCG_J4_cmpgtu_f_jumpnv_t(SHORTCODE) \
1066     gen_cmp_jumpnv(ctx, TCG_COND_LEU, NsN, RtV, riV)
1067 #define fGEN_TCG_J4_cmpgtu_f_jumpnv_nt(SHORTCODE) \
1068     gen_cmp_jumpnv(ctx, TCG_COND_LEU, NsN, RtV, riV)
1069 
1070 #define fGEN_TCG_J4_cmpeqn1_t_jumpnv_t(SHORTCODE) \
1071     gen_cmpi_jumpnv(ctx, TCG_COND_EQ, NsN, -1, riV)
1072 #define fGEN_TCG_J4_cmpeqn1_t_jumpnv_nt(SHORTCODE) \
1073     gen_cmpi_jumpnv(ctx, TCG_COND_EQ, NsN, -1, riV)
1074 #define fGEN_TCG_J4_cmpeqn1_f_jumpnv_t(SHORTCODE) \
1075     gen_cmpi_jumpnv(ctx, TCG_COND_NE, NsN, -1, riV)
1076 #define fGEN_TCG_J4_cmpeqn1_f_jumpnv_nt(SHORTCODE) \
1077     gen_cmpi_jumpnv(ctx, TCG_COND_NE, NsN, -1, riV)
1078 
1079 #define fGEN_TCG_J4_cmpgtn1_t_jumpnv_t(SHORTCODE) \
1080     gen_cmpi_jumpnv(ctx, TCG_COND_GT, NsN, -1, riV)
1081 #define fGEN_TCG_J4_cmpgtn1_t_jumpnv_nt(SHORTCODE) \
1082     gen_cmpi_jumpnv(ctx, TCG_COND_GT, NsN, -1, riV)
1083 #define fGEN_TCG_J4_cmpgtn1_f_jumpnv_t(SHORTCODE) \
1084     gen_cmpi_jumpnv(ctx, TCG_COND_LE, NsN, -1, riV)
1085 #define fGEN_TCG_J4_cmpgtn1_f_jumpnv_nt(SHORTCODE) \
1086     gen_cmpi_jumpnv(ctx, TCG_COND_LE, NsN, -1, riV)
1087 
1088 #define fGEN_TCG_J4_tstbit0_t_jumpnv_t(SHORTCODE) \
1089     gen_testbit0_jumpnv(ctx, NsN, TCG_COND_EQ, riV)
1090 #define fGEN_TCG_J4_tstbit0_t_jumpnv_nt(SHORTCODE) \
1091     gen_testbit0_jumpnv(ctx, NsN, TCG_COND_EQ, riV)
1092 #define fGEN_TCG_J4_tstbit0_f_jumpnv_t(SHORTCODE) \
1093     gen_testbit0_jumpnv(ctx, NsN, TCG_COND_NE, riV)
1094 #define fGEN_TCG_J4_tstbit0_f_jumpnv_nt(SHORTCODE) \
1095     gen_testbit0_jumpnv(ctx, NsN, TCG_COND_NE, riV)
1096 
1097 /* r0 = r1 ; jump address */
1098 #define fGEN_TCG_J4_jumpsetr(SHORTCODE) \
1099     do { \
1100         tcg_gen_mov_tl(RdV, RsV); \
1101         gen_jump(ctx, riV); \
1102     } while (0)
1103 
1104 /* if (p0.new) r0 = #0 */
1105 #define fGEN_TCG_SA1_clrtnew(SHORTCODE) \
1106     do { \
1107         tcg_gen_movcond_tl(TCG_COND_EQ, RdV, \
1108                            hex_new_pred_value[0], tcg_constant_tl(0), \
1109                            RdV, tcg_constant_tl(0)); \
1110     } while (0)
1111 
1112 /* if (!p0.new) r0 = #0 */
1113 #define fGEN_TCG_SA1_clrfnew(SHORTCODE) \
1114     do { \
1115         tcg_gen_movcond_tl(TCG_COND_NE, RdV, \
1116                            hex_new_pred_value[0], tcg_constant_tl(0), \
1117                            RdV, tcg_constant_tl(0)); \
1118     } while (0)
1119 
1120 #define fGEN_TCG_J2_pause(SHORTCODE) \
1121     do { \
1122         uiV = uiV; \
1123         tcg_gen_movi_tl(hex_gpr[HEX_REG_PC], ctx->next_PC); \
1124     } while (0)
1125 
1126 /* r0 = asr(r1, r2):sat */
1127 #define fGEN_TCG_S2_asr_r_r_sat(SHORTCODE) \
1128     gen_asr_r_r_sat(ctx, RdV, RsV, RtV)
1129 
1130 /* r0 = asl(r1, r2):sat */
1131 #define fGEN_TCG_S2_asl_r_r_sat(SHORTCODE) \
1132     gen_asl_r_r_sat(ctx, RdV, RsV, RtV)
1133 
1134 #define fGEN_TCG_SL2_jumpr31(SHORTCODE) \
1135     gen_jumpr(ctx, hex_gpr[HEX_REG_LR])
1136 
1137 #define fGEN_TCG_SL2_jumpr31_t(SHORTCODE) \
1138     gen_cond_jumpr31(ctx, TCG_COND_EQ, hex_pred[0])
1139 #define fGEN_TCG_SL2_jumpr31_f(SHORTCODE) \
1140     gen_cond_jumpr31(ctx, TCG_COND_NE, hex_pred[0])
1141 
1142 #define fGEN_TCG_SL2_jumpr31_tnew(SHORTCODE) \
1143     gen_cond_jumpr31(ctx, TCG_COND_EQ, hex_new_pred_value[0])
1144 #define fGEN_TCG_SL2_jumpr31_fnew(SHORTCODE) \
1145     gen_cond_jumpr31(ctx, TCG_COND_NE, hex_new_pred_value[0])
1146 
1147 /* Count trailing zeros/ones */
1148 #define fGEN_TCG_S2_ct0(SHORTCODE) \
1149     do { \
1150         tcg_gen_ctzi_tl(RdV, RsV, 32); \
1151     } while (0)
1152 #define fGEN_TCG_S2_ct1(SHORTCODE) \
1153     do { \
1154         tcg_gen_not_tl(RdV, RsV); \
1155         tcg_gen_ctzi_tl(RdV, RdV, 32); \
1156     } while (0)
1157 #define fGEN_TCG_S2_ct0p(SHORTCODE) \
1158     do { \
1159         TCGv_i64 tmp = tcg_temp_new_i64(); \
1160         tcg_gen_ctzi_i64(tmp, RssV, 64); \
1161         tcg_gen_extrl_i64_i32(RdV, tmp); \
1162     } while (0)
1163 #define fGEN_TCG_S2_ct1p(SHORTCODE) \
1164     do { \
1165         TCGv_i64 tmp = tcg_temp_new_i64(); \
1166         tcg_gen_not_i64(tmp, RssV); \
1167         tcg_gen_ctzi_i64(tmp, tmp, 64); \
1168         tcg_gen_extrl_i64_i32(RdV, tmp); \
1169     } while (0)
1170 
1171 /* Floating point */
1172 #define fGEN_TCG_F2_conv_sf2df(SHORTCODE) \
1173     gen_helper_conv_sf2df(RddV, cpu_env, RsV)
1174 #define fGEN_TCG_F2_conv_df2sf(SHORTCODE) \
1175     gen_helper_conv_df2sf(RdV, cpu_env, RssV)
1176 #define fGEN_TCG_F2_conv_uw2sf(SHORTCODE) \
1177     gen_helper_conv_uw2sf(RdV, cpu_env, RsV)
1178 #define fGEN_TCG_F2_conv_uw2df(SHORTCODE) \
1179     gen_helper_conv_uw2df(RddV, cpu_env, RsV)
1180 #define fGEN_TCG_F2_conv_w2sf(SHORTCODE) \
1181     gen_helper_conv_w2sf(RdV, cpu_env, RsV)
1182 #define fGEN_TCG_F2_conv_w2df(SHORTCODE) \
1183     gen_helper_conv_w2df(RddV, cpu_env, RsV)
1184 #define fGEN_TCG_F2_conv_ud2sf(SHORTCODE) \
1185     gen_helper_conv_ud2sf(RdV, cpu_env, RssV)
1186 #define fGEN_TCG_F2_conv_ud2df(SHORTCODE) \
1187     gen_helper_conv_ud2df(RddV, cpu_env, RssV)
1188 #define fGEN_TCG_F2_conv_d2sf(SHORTCODE) \
1189     gen_helper_conv_d2sf(RdV, cpu_env, RssV)
1190 #define fGEN_TCG_F2_conv_d2df(SHORTCODE) \
1191     gen_helper_conv_d2df(RddV, cpu_env, RssV)
1192 #define fGEN_TCG_F2_conv_sf2uw(SHORTCODE) \
1193     gen_helper_conv_sf2uw(RdV, cpu_env, RsV)
1194 #define fGEN_TCG_F2_conv_sf2w(SHORTCODE) \
1195     gen_helper_conv_sf2w(RdV, cpu_env, RsV)
1196 #define fGEN_TCG_F2_conv_sf2ud(SHORTCODE) \
1197     gen_helper_conv_sf2ud(RddV, cpu_env, RsV)
1198 #define fGEN_TCG_F2_conv_sf2d(SHORTCODE) \
1199     gen_helper_conv_sf2d(RddV, cpu_env, RsV)
1200 #define fGEN_TCG_F2_conv_df2uw(SHORTCODE) \
1201     gen_helper_conv_df2uw(RdV, cpu_env, RssV)
1202 #define fGEN_TCG_F2_conv_df2w(SHORTCODE) \
1203     gen_helper_conv_df2w(RdV, cpu_env, RssV)
1204 #define fGEN_TCG_F2_conv_df2ud(SHORTCODE) \
1205     gen_helper_conv_df2ud(RddV, cpu_env, RssV)
1206 #define fGEN_TCG_F2_conv_df2d(SHORTCODE) \
1207     gen_helper_conv_df2d(RddV, cpu_env, RssV)
1208 #define fGEN_TCG_F2_conv_sf2uw_chop(SHORTCODE) \
1209     gen_helper_conv_sf2uw_chop(RdV, cpu_env, RsV)
1210 #define fGEN_TCG_F2_conv_sf2w_chop(SHORTCODE) \
1211     gen_helper_conv_sf2w_chop(RdV, cpu_env, RsV)
1212 #define fGEN_TCG_F2_conv_sf2ud_chop(SHORTCODE) \
1213     gen_helper_conv_sf2ud_chop(RddV, cpu_env, RsV)
1214 #define fGEN_TCG_F2_conv_sf2d_chop(SHORTCODE) \
1215     gen_helper_conv_sf2d_chop(RddV, cpu_env, RsV)
1216 #define fGEN_TCG_F2_conv_df2uw_chop(SHORTCODE) \
1217     gen_helper_conv_df2uw_chop(RdV, cpu_env, RssV)
1218 #define fGEN_TCG_F2_conv_df2w_chop(SHORTCODE) \
1219     gen_helper_conv_df2w_chop(RdV, cpu_env, RssV)
1220 #define fGEN_TCG_F2_conv_df2ud_chop(SHORTCODE) \
1221     gen_helper_conv_df2ud_chop(RddV, cpu_env, RssV)
1222 #define fGEN_TCG_F2_conv_df2d_chop(SHORTCODE) \
1223     gen_helper_conv_df2d_chop(RddV, cpu_env, RssV)
1224 #define fGEN_TCG_F2_sfadd(SHORTCODE) \
1225     gen_helper_sfadd(RdV, cpu_env, RsV, RtV)
1226 #define fGEN_TCG_F2_sfsub(SHORTCODE) \
1227     gen_helper_sfsub(RdV, cpu_env, RsV, RtV)
1228 #define fGEN_TCG_F2_sfcmpeq(SHORTCODE) \
1229     gen_helper_sfcmpeq(PdV, cpu_env, RsV, RtV)
1230 #define fGEN_TCG_F2_sfcmpgt(SHORTCODE) \
1231     gen_helper_sfcmpgt(PdV, cpu_env, RsV, RtV)
1232 #define fGEN_TCG_F2_sfcmpge(SHORTCODE) \
1233     gen_helper_sfcmpge(PdV, cpu_env, RsV, RtV)
1234 #define fGEN_TCG_F2_sfcmpuo(SHORTCODE) \
1235     gen_helper_sfcmpuo(PdV, cpu_env, RsV, RtV)
1236 #define fGEN_TCG_F2_sfmax(SHORTCODE) \
1237     gen_helper_sfmax(RdV, cpu_env, RsV, RtV)
1238 #define fGEN_TCG_F2_sfmin(SHORTCODE) \
1239     gen_helper_sfmin(RdV, cpu_env, RsV, RtV)
1240 #define fGEN_TCG_F2_sfclass(SHORTCODE) \
1241     do { \
1242         TCGv imm = tcg_constant_tl(uiV); \
1243         gen_helper_sfclass(PdV, cpu_env, RsV, imm); \
1244     } while (0)
1245 #define fGEN_TCG_F2_sffixupn(SHORTCODE) \
1246     gen_helper_sffixupn(RdV, cpu_env, RsV, RtV)
1247 #define fGEN_TCG_F2_sffixupd(SHORTCODE) \
1248     gen_helper_sffixupd(RdV, cpu_env, RsV, RtV)
1249 #define fGEN_TCG_F2_sffixupr(SHORTCODE) \
1250     gen_helper_sffixupr(RdV, cpu_env, RsV)
1251 #define fGEN_TCG_F2_dfadd(SHORTCODE) \
1252     gen_helper_dfadd(RddV, cpu_env, RssV, RttV)
1253 #define fGEN_TCG_F2_dfsub(SHORTCODE) \
1254     gen_helper_dfsub(RddV, cpu_env, RssV, RttV)
1255 #define fGEN_TCG_F2_dfmax(SHORTCODE) \
1256     gen_helper_dfmax(RddV, cpu_env, RssV, RttV)
1257 #define fGEN_TCG_F2_dfmin(SHORTCODE) \
1258     gen_helper_dfmin(RddV, cpu_env, RssV, RttV)
1259 #define fGEN_TCG_F2_dfcmpeq(SHORTCODE) \
1260     gen_helper_dfcmpeq(PdV, cpu_env, RssV, RttV)
1261 #define fGEN_TCG_F2_dfcmpgt(SHORTCODE) \
1262     gen_helper_dfcmpgt(PdV, cpu_env, RssV, RttV)
1263 #define fGEN_TCG_F2_dfcmpge(SHORTCODE) \
1264     gen_helper_dfcmpge(PdV, cpu_env, RssV, RttV)
1265 #define fGEN_TCG_F2_dfcmpuo(SHORTCODE) \
1266     gen_helper_dfcmpuo(PdV, cpu_env, RssV, RttV)
1267 #define fGEN_TCG_F2_dfclass(SHORTCODE) \
1268     do { \
1269         TCGv imm = tcg_constant_tl(uiV); \
1270         gen_helper_dfclass(PdV, cpu_env, RssV, imm); \
1271     } while (0)
1272 #define fGEN_TCG_F2_sfmpy(SHORTCODE) \
1273     gen_helper_sfmpy(RdV, cpu_env, RsV, RtV)
1274 #define fGEN_TCG_F2_sffma(SHORTCODE) \
1275     gen_helper_sffma(RxV, cpu_env, RxV, RsV, RtV)
1276 #define fGEN_TCG_F2_sffma_sc(SHORTCODE) \
1277     gen_helper_sffma_sc(RxV, cpu_env, RxV, RsV, RtV, PuV)
1278 #define fGEN_TCG_F2_sffms(SHORTCODE) \
1279     gen_helper_sffms(RxV, cpu_env, RxV, RsV, RtV)
1280 #define fGEN_TCG_F2_sffma_lib(SHORTCODE) \
1281     gen_helper_sffma_lib(RxV, cpu_env, RxV, RsV, RtV)
1282 #define fGEN_TCG_F2_sffms_lib(SHORTCODE) \
1283     gen_helper_sffms_lib(RxV, cpu_env, RxV, RsV, RtV)
1284 
1285 #define fGEN_TCG_F2_dfmpyfix(SHORTCODE) \
1286     gen_helper_dfmpyfix(RddV, cpu_env, RssV, RttV)
1287 #define fGEN_TCG_F2_dfmpyhh(SHORTCODE) \
1288     gen_helper_dfmpyhh(RxxV, cpu_env, RxxV, RssV, RttV)
1289 
1290 /* Nothing to do for these in qemu, need to suppress compiler warnings */
1291 #define fGEN_TCG_Y4_l2fetch(SHORTCODE) \
1292     do { \
1293         RsV = RsV; \
1294         RtV = RtV; \
1295     } while (0)
1296 #define fGEN_TCG_Y5_l2fetch(SHORTCODE) \
1297     do { \
1298         RsV = RsV; \
1299     } while (0)
1300 #define fGEN_TCG_Y2_isync(SHORTCODE) \
1301     do { } while (0)
1302 #define fGEN_TCG_Y2_barrier(SHORTCODE) \
1303     do { } while (0)
1304 #define fGEN_TCG_Y2_syncht(SHORTCODE) \
1305     do { } while (0)
1306 #define fGEN_TCG_Y2_dcfetchbo(SHORTCODE) \
1307     do { \
1308         RsV = RsV; \
1309         uiV = uiV; \
1310     } while (0)
1311 
1312 #define fGEN_TCG_L2_loadw_aq(SHORTCODE)                 SHORTCODE
1313 #define fGEN_TCG_L4_loadd_aq(SHORTCODE)                 SHORTCODE
1314 
1315 /* Nothing to do for these in qemu, need to suppress compiler warnings */
1316 #define fGEN_TCG_R6_release_at_vi(SHORTCODE) \
1317     do { \
1318         RsV = RsV; \
1319     } while (0)
1320 #define fGEN_TCG_R6_release_st_vi(SHORTCODE) \
1321     do { \
1322         RsV = RsV; \
1323     } while (0)
1324 
1325 #define fGEN_TCG_S2_storew_rl_at_vi(SHORTCODE)          SHORTCODE
1326 #define fGEN_TCG_S4_stored_rl_at_vi(SHORTCODE)          SHORTCODE
1327 #define fGEN_TCG_S2_storew_rl_st_vi(SHORTCODE)          SHORTCODE
1328 #define fGEN_TCG_S4_stored_rl_st_vi(SHORTCODE)          SHORTCODE
1329 
1330 #define fGEN_TCG_J2_trap0(SHORTCODE) \
1331     do { \
1332         uiV = uiV; \
1333         tcg_gen_movi_tl(hex_gpr[HEX_REG_PC], ctx->pkt->pc); \
1334         TCGv excp = tcg_constant_tl(HEX_EXCP_TRAP0); \
1335         gen_helper_raise_exception(cpu_env, excp); \
1336     } while (0)
1337 #endif
1338