xref: /openbmc/qemu/target/ppc/int_helper.c (revision 26c964f85159c78f6ecf132de8f2f0093d3f2e89)
/*
 *  PowerPC integer and vector emulation helpers for QEMU.
 *
 *  Copyright (c) 2003-2007 Jocelyn Mayer
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
19db725815SMarkus Armbruster 
20fcf5ef2aSThomas Huth #include "qemu/osdep.h"
21fcf5ef2aSThomas Huth #include "cpu.h"
22fcf5ef2aSThomas Huth #include "internal.h"
23fcf5ef2aSThomas Huth #include "qemu/host-utils.h"
24db725815SMarkus Armbruster #include "qemu/main-loop.h"
258a05fd9aSRichard Henderson #include "qemu/log.h"
26fcf5ef2aSThomas Huth #include "exec/helper-proto.h"
27fcf5ef2aSThomas Huth #include "crypto/aes.h"
2824f91e81SAlex Bennée #include "fpu/softfloat.h"
293f74b632SRichard Henderson #include "qapi/error.h"
303f74b632SRichard Henderson #include "qemu/guest-random.h"
311015fcabSMatheus Ferst #include "tcg/tcg-gvec-desc.h"
32fcf5ef2aSThomas Huth 
33fcf5ef2aSThomas Huth #include "helper_regs.h"
34fcf5ef2aSThomas Huth /*****************************************************************************/
35fcf5ef2aSThomas Huth /* Fixed point operations helpers */
36fcf5ef2aSThomas Huth 
37f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov)
38f32899deSNikunj A Dadhania {
39f32899deSNikunj A Dadhania     if (unlikely(ov)) {
40af721a31SVíctor Colombo         env->so = env->ov = env->ov32 = 1;
41f32899deSNikunj A Dadhania     } else {
42af721a31SVíctor Colombo         env->ov = env->ov32 = 0;
43f32899deSNikunj A Dadhania     }
44f32899deSNikunj A Dadhania }
45f32899deSNikunj A Dadhania 
46fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb,
47fcf5ef2aSThomas Huth                            uint32_t oe)
48fcf5ef2aSThomas Huth {
49fcf5ef2aSThomas Huth     uint64_t rt = 0;
50fcf5ef2aSThomas Huth     int overflow = 0;
51fcf5ef2aSThomas Huth 
52fcf5ef2aSThomas Huth     uint64_t dividend = (uint64_t)ra << 32;
53fcf5ef2aSThomas Huth     uint64_t divisor = (uint32_t)rb;
54fcf5ef2aSThomas Huth 
55fcf5ef2aSThomas Huth     if (unlikely(divisor == 0)) {
56fcf5ef2aSThomas Huth         overflow = 1;
57fcf5ef2aSThomas Huth     } else {
58fcf5ef2aSThomas Huth         rt = dividend / divisor;
59fcf5ef2aSThomas Huth         overflow = rt > UINT32_MAX;
60fcf5ef2aSThomas Huth     }
61fcf5ef2aSThomas Huth 
62fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
63fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
64fcf5ef2aSThomas Huth     }
65fcf5ef2aSThomas Huth 
66fcf5ef2aSThomas Huth     if (oe) {
67f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
68fcf5ef2aSThomas Huth     }
69fcf5ef2aSThomas Huth 
70fcf5ef2aSThomas Huth     return (target_ulong)rt;
71fcf5ef2aSThomas Huth }
72fcf5ef2aSThomas Huth 
73fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb,
74fcf5ef2aSThomas Huth                           uint32_t oe)
75fcf5ef2aSThomas Huth {
76fcf5ef2aSThomas Huth     int64_t rt = 0;
77fcf5ef2aSThomas Huth     int overflow = 0;
78fcf5ef2aSThomas Huth 
79fcf5ef2aSThomas Huth     int64_t dividend = (int64_t)ra << 32;
80fcf5ef2aSThomas Huth     int64_t divisor = (int64_t)((int32_t)rb);
81fcf5ef2aSThomas Huth 
82fcf5ef2aSThomas Huth     if (unlikely((divisor == 0) ||
83fcf5ef2aSThomas Huth                  ((divisor == -1ull) && (dividend == INT64_MIN)))) {
84fcf5ef2aSThomas Huth         overflow = 1;
85fcf5ef2aSThomas Huth     } else {
86fcf5ef2aSThomas Huth         rt = dividend / divisor;
87fcf5ef2aSThomas Huth         overflow = rt != (int32_t)rt;
88fcf5ef2aSThomas Huth     }
89fcf5ef2aSThomas Huth 
90fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
91fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
92fcf5ef2aSThomas Huth     }
93fcf5ef2aSThomas Huth 
94fcf5ef2aSThomas Huth     if (oe) {
95f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
96fcf5ef2aSThomas Huth     }
97fcf5ef2aSThomas Huth 
98fcf5ef2aSThomas Huth     return (target_ulong)rt;
99fcf5ef2aSThomas Huth }
100fcf5ef2aSThomas Huth 
101fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
102fcf5ef2aSThomas Huth 
103fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe)
104fcf5ef2aSThomas Huth {
105fcf5ef2aSThomas Huth     uint64_t rt = 0;
106fcf5ef2aSThomas Huth     int overflow = 0;
107fcf5ef2aSThomas Huth 
1089276a31cSLuis Pires     if (unlikely(rb == 0 || ra >= rb)) {
1099276a31cSLuis Pires         overflow = 1;
110fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1119276a31cSLuis Pires     } else {
1129276a31cSLuis Pires         divu128(&rt, &ra, rb);
113fcf5ef2aSThomas Huth     }
114fcf5ef2aSThomas Huth 
115fcf5ef2aSThomas Huth     if (oe) {
116f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
117fcf5ef2aSThomas Huth     }
118fcf5ef2aSThomas Huth 
119fcf5ef2aSThomas Huth     return rt;
120fcf5ef2aSThomas Huth }
121fcf5ef2aSThomas Huth 
122fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe)
123fcf5ef2aSThomas Huth {
12440f3e79aSLuis Pires     uint64_t rt = 0;
125fcf5ef2aSThomas Huth     int64_t ra = (int64_t)rau;
126fcf5ef2aSThomas Huth     int64_t rb = (int64_t)rbu;
1279276a31cSLuis Pires     int overflow = 0;
128fcf5ef2aSThomas Huth 
1299276a31cSLuis Pires     if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) {
1309276a31cSLuis Pires         overflow = 1;
131fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1329276a31cSLuis Pires     } else {
1339276a31cSLuis Pires         divs128(&rt, &ra, rb);
134fcf5ef2aSThomas Huth     }
135fcf5ef2aSThomas Huth 
136fcf5ef2aSThomas Huth     if (oe) {
137f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
138fcf5ef2aSThomas Huth     }
139fcf5ef2aSThomas Huth 
140fcf5ef2aSThomas Huth     return rt;
141fcf5ef2aSThomas Huth }
142fcf5ef2aSThomas Huth 
143fcf5ef2aSThomas Huth #endif
144fcf5ef2aSThomas Huth 
145fcf5ef2aSThomas Huth 
146fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
147fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */
148fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff))
149fcf5ef2aSThomas Huth 
150b6cb41b2SDavid Gibson /*
151b6cb41b2SDavid Gibson  * subtract 1 from each byte, and with inverse, check if MSB is set at each
152fcf5ef2aSThomas Huth  * byte.
153fcf5ef2aSThomas Huth  * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80
154fcf5ef2aSThomas Huth  *      (0xFF & 0xFF) & 0x80 = 0x80 (zero found)
155fcf5ef2aSThomas Huth  */
156fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80))
157fcf5ef2aSThomas Huth 
158fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */
159fcf5ef2aSThomas Huth #define hasvalue(x, n)  (haszero((x) ^ pattern(n)))
160fcf5ef2aSThomas Huth 
161fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb)
162fcf5ef2aSThomas Huth {
163efa73196SNikunj A Dadhania     return hasvalue(rb, ra) ? CRF_GT : 0;
164fcf5ef2aSThomas Huth }
165fcf5ef2aSThomas Huth 
166fcf5ef2aSThomas Huth #undef pattern
167fcf5ef2aSThomas Huth #undef haszero
168fcf5ef2aSThomas Huth #undef hasvalue
169fcf5ef2aSThomas Huth 
170b6cb41b2SDavid Gibson /*
1713f74b632SRichard Henderson  * Return a random number.
172fcf5ef2aSThomas Huth  */
1733f74b632SRichard Henderson uint64_t helper_darn32(void)
174fcf5ef2aSThomas Huth {
1753f74b632SRichard Henderson     Error *err = NULL;
1763f74b632SRichard Henderson     uint32_t ret;
1773f74b632SRichard Henderson 
1783f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1793f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1803f74b632SRichard Henderson                       error_get_pretty(err));
1813f74b632SRichard Henderson         error_free(err);
182fcf5ef2aSThomas Huth         return -1;
183fcf5ef2aSThomas Huth     }
184fcf5ef2aSThomas Huth 
1853f74b632SRichard Henderson     return ret;
1863f74b632SRichard Henderson }
1873f74b632SRichard Henderson 
1883f74b632SRichard Henderson uint64_t helper_darn64(void)
189fcf5ef2aSThomas Huth {
1903f74b632SRichard Henderson     Error *err = NULL;
1913f74b632SRichard Henderson     uint64_t ret;
1923f74b632SRichard Henderson 
1933f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1943f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1953f74b632SRichard Henderson                       error_get_pretty(err));
1963f74b632SRichard Henderson         error_free(err);
197fcf5ef2aSThomas Huth         return -1;
198fcf5ef2aSThomas Huth     }
199fcf5ef2aSThomas Huth 
2003f74b632SRichard Henderson     return ret;
2013f74b632SRichard Henderson }
202fcf5ef2aSThomas Huth 
/*
 * bpermd: each of the eight bytes of 'rs' is a bit selector into 'rb'
 * (via PPC_BIT). Byte k of 'rs' (counting from the least significant byte)
 * drives bit k of the result; selectors >= 64 contribute a zero bit.
 */
uint64_t helper_bpermd(uint64_t rs, uint64_t rb)
{
    uint64_t result = 0;
    int k;

    for (k = 0; k < 8; k++, rs >>= 8) {
        const int sel = rs & 0xFF;

        if (sel >= 64) {
            continue;
        }
        if (rb & PPC_BIT(sel)) {
            result |= 1 << k;
        }
    }
    return result;
}
218fcf5ef2aSThomas Huth 
219fcf5ef2aSThomas Huth #endif
220fcf5ef2aSThomas Huth 
221fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb)
222fcf5ef2aSThomas Huth {
223fcf5ef2aSThomas Huth     target_ulong mask = 0xff;
224fcf5ef2aSThomas Huth     target_ulong ra = 0;
225fcf5ef2aSThomas Huth     int i;
226fcf5ef2aSThomas Huth 
227fcf5ef2aSThomas Huth     for (i = 0; i < sizeof(target_ulong); i++) {
228fcf5ef2aSThomas Huth         if ((rs & mask) == (rb & mask)) {
229fcf5ef2aSThomas Huth             ra |= mask;
230fcf5ef2aSThomas Huth         }
231fcf5ef2aSThomas Huth         mask <<= 8;
232fcf5ef2aSThomas Huth     }
233fcf5ef2aSThomas Huth     return ra;
234fcf5ef2aSThomas Huth }
235fcf5ef2aSThomas Huth 
236fcf5ef2aSThomas Huth /* shift right arithmetic helper */
237fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value,
238fcf5ef2aSThomas Huth                          target_ulong shift)
239fcf5ef2aSThomas Huth {
240fcf5ef2aSThomas Huth     int32_t ret;
241fcf5ef2aSThomas Huth 
242fcf5ef2aSThomas Huth     if (likely(!(shift & 0x20))) {
243fcf5ef2aSThomas Huth         if (likely((uint32_t)shift != 0)) {
244fcf5ef2aSThomas Huth             shift &= 0x1f;
245fcf5ef2aSThomas Huth             ret = (int32_t)value >> shift;
246fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) {
247af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
248fcf5ef2aSThomas Huth             } else {
249af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
250fcf5ef2aSThomas Huth             }
251fcf5ef2aSThomas Huth         } else {
252fcf5ef2aSThomas Huth             ret = (int32_t)value;
253af1c259fSSandipan Das             env->ca32 = env->ca = 0;
254fcf5ef2aSThomas Huth         }
255fcf5ef2aSThomas Huth     } else {
256fcf5ef2aSThomas Huth         ret = (int32_t)value >> 31;
257af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
258fcf5ef2aSThomas Huth     }
259fcf5ef2aSThomas Huth     return (target_long)ret;
260fcf5ef2aSThomas Huth }
261fcf5ef2aSThomas Huth 
262fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
263fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value,
264fcf5ef2aSThomas Huth                          target_ulong shift)
265fcf5ef2aSThomas Huth {
266fcf5ef2aSThomas Huth     int64_t ret;
267fcf5ef2aSThomas Huth 
268fcf5ef2aSThomas Huth     if (likely(!(shift & 0x40))) {
269fcf5ef2aSThomas Huth         if (likely((uint64_t)shift != 0)) {
270fcf5ef2aSThomas Huth             shift &= 0x3f;
271fcf5ef2aSThomas Huth             ret = (int64_t)value >> shift;
272fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) {
273af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
274fcf5ef2aSThomas Huth             } else {
275af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
276fcf5ef2aSThomas Huth             }
277fcf5ef2aSThomas Huth         } else {
278fcf5ef2aSThomas Huth             ret = (int64_t)value;
279af1c259fSSandipan Das             env->ca32 = env->ca = 0;
280fcf5ef2aSThomas Huth         }
281fcf5ef2aSThomas Huth     } else {
282fcf5ef2aSThomas Huth         ret = (int64_t)value >> 63;
283af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
284fcf5ef2aSThomas Huth     }
285fcf5ef2aSThomas Huth     return ret;
286fcf5ef2aSThomas Huth }
287fcf5ef2aSThomas Huth #endif
288fcf5ef2aSThomas Huth 
289fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
290fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
291fcf5ef2aSThomas Huth {
29279770002SRichard Henderson     /* Note that we don't fold past bytes */
293fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
294fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
295fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
296fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
297fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
298fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
299fcf5ef2aSThomas Huth     return val;
300fcf5ef2aSThomas Huth }
301fcf5ef2aSThomas Huth 
302fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val)
303fcf5ef2aSThomas Huth {
30479770002SRichard Henderson     /* Note that we don't fold past words.  */
305fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
306fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
307fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
308fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
309fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
310fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
311fcf5ef2aSThomas Huth     val = (val & 0x00ff00ff00ff00ffULL) + ((val >>  8) &
312fcf5ef2aSThomas Huth                                            0x00ff00ff00ff00ffULL);
313fcf5ef2aSThomas Huth     val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) &
314fcf5ef2aSThomas Huth                                            0x0000ffff0000ffffULL);
315fcf5ef2aSThomas Huth     return val;
316fcf5ef2aSThomas Huth }
317fcf5ef2aSThomas Huth #else
318fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
319fcf5ef2aSThomas Huth {
32079770002SRichard Henderson     /* Note that we don't fold past bytes */
321fcf5ef2aSThomas Huth     val = (val & 0x55555555) + ((val >>  1) & 0x55555555);
322fcf5ef2aSThomas Huth     val = (val & 0x33333333) + ((val >>  2) & 0x33333333);
323fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f) + ((val >>  4) & 0x0f0f0f0f);
324fcf5ef2aSThomas Huth     return val;
325fcf5ef2aSThomas Huth }
326fcf5ef2aSThomas Huth #endif
327fcf5ef2aSThomas Huth 
/*
 * cfuged: centrifuge doubleword. The bits of 'src' whose 'mask' bit is 1 are
 * gathered on the right (least significant side) of the result and the bits
 * whose 'mask' bit is 0 on the left, each group keeping its relative order.
 */
uint64_t helper_CFUGED(uint64_t src, uint64_t mask)
{
    /*
     * Instead of processing the mask bit-by-bit from the most significant to
     * the least significant bit, as described in PowerISA, we'll handle it in
     * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use
     * ctz or cto, we negate the mask at the end of the loop.
     *
     * All temporaries are 64 bits wide to match the operands, independent of
     * the width of target_ulong.
     */
    uint64_t m, left = 0, right = 0;
    unsigned int n, i = 64;
    bool bit = false; /* tracks if we are processing zeros or ones */

    if (mask == 0 || mask == UINT64_MAX) {
        return src;
    }

    /* Processes the mask in blocks, from LSB to MSB */
    while (i) {
        /* Find how many bits we should take */
        n = ctz64(mask);
        if (n > i) {
            n = i;
        }

        /*
         * Extracts 'n' trailing bits of src and put them on the leading 'n'
         * bits of 'right' or 'left', pushing down the previously extracted
         * values.
         *
         * 'n' is at most 63 here (the all-zeros/all-ones masks were rejected
         * above), and the shift is unsigned so n == 63 does not touch a sign
         * bit.
         */
        m = (1ULL << n) - 1;
        if (bit) {
            right = ror64(right | (src & m), n);
        } else {
            left = ror64(left | (src & m), n);
        }

        /*
         * Discards the processed bits from 'src' and 'mask'. Note that we are
         * removing 'n' trailing zeros from 'mask', but the logical shift will
         * add 'n' leading zeros back, so the population count of 'mask' is kept
         * the same.
         */
        src >>= n;
        mask >>= n;
        i -= n;
        bit = !bit;
        mask = ~mask;
    }

    /*
     * At the end, right was ror'ed ctpop(mask) times. To put it back in place,
     * we'll shift it more 64-ctpop(mask) times.
     */
    if (bit) {
        n = ctpop64(mask);
    } else {
        n = 64 - ctpop64(mask);
    }

    return left | (right >> n);
}
38989ccd7dcSMatheus Ferst 
/*
 * pdepd: parallel bits deposit. Successive low-order bits of 'src' are
 * placed, in order, at the positions of the set bits of 'mask' (lowest set
 * bit first); all other result bits are zero.
 */
uint64_t helper_PDEPD(uint64_t src, uint64_t mask)
{
    uint64_t result = 0;

    if (mask == -1) {
        return src;
    }

    /* Each pass consumes one src bit and the lowest remaining mask bit */
    while (mask != 0) {
        const uint64_t lowest = mask & -mask;

        if (src & 1) {
            result |= lowest;
        }
        src >>= 1;
        mask &= mask - 1;
    }

    return result;
}
4078bdb7606SMatheus Ferst 
/*
 * pextd: parallel bits extract. The bits of 'src' found at the positions of
 * the set bits of 'mask' are packed, in order, into the low-order bits of
 * the result (lowest set mask bit first); all other result bits are zero.
 */
uint64_t helper_PEXTD(uint64_t src, uint64_t mask)
{
    uint64_t result = 0;
    uint64_t out = 1;

    if (mask == -1) {
        return src;
    }

    /* Each pass tests the lowest remaining mask bit and fills one output bit */
    while (mask != 0) {
        const uint64_t lowest = mask & -mask;

        if (src & lowest) {
            result |= out;
        }
        out <<= 1;
        mask &= mask - 1;
    }

    return result;
}
42521ba6e58SMatheus Ferst 
426fcf5ef2aSThomas Huth /*****************************************************************************/
427fcf5ef2aSThomas Huth /* Altivec extension helpers */
/*
 * Iterate 'index' over every slot of r->element. On big-endian hosts the
 * index ascends from 0; on little-endian hosts it descends from the last
 * slot, so 'index' must be a signed variable. A pointer named 'r' must be in
 * scope at the point of use.
 */
#if !HOST_BIG_ENDIAN
#define VECTOR_FOR_INORDER_I(index, element)                    \
    for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--)
#else
#define VECTOR_FOR_INORDER_I(index, element)                    \
    for (index = 0; index < ARRAY_SIZE(r->element); index++)
#endif
435fcf5ef2aSThomas Huth 
436fcf5ef2aSThomas Huth /* Saturating arithmetic helpers.  */
/*
 * SATCVT generates cvt<from><to>(): clamp 'x' into [min, max], convert it to
 * 'to_type', and store 1 in *sat when clamping occurred. *sat is never
 * cleared, so a caller can accumulate saturation across several conversions.
 */
#define SATCVT(from, to, from_type, to_type, min, max)          \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x < (from_type)min) {                               \
            *sat = 1;                                           \
            return min;                                         \
        }                                                       \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }
/* SATCVTU is the unsigned-source variant: only the upper bound is checked. */
#define SATCVTU(from, to, from_type, to_type, min, max)         \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }
/* signed -> narrower signed */
SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX)
SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX)
SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX)

/* unsigned -> narrower unsigned */
SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX)
SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX)
SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX)
/* signed -> narrower unsigned */
SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX)
SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX)
SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX)
#undef SATCVT
#undef SATCVTU
478fcf5ef2aSThomas Huth 
479dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr)
480fcf5ef2aSThomas Huth {
481c19940dbSBruno Larsen (billionai)     ppc_store_vscr(env, vscr);
482fcf5ef2aSThomas Huth }
483fcf5ef2aSThomas Huth 
484cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env)
485cc2b90d7SRichard Henderson {
486c19940dbSBruno Larsen (billionai)     return ppc_get_vscr(env);
487cc2b90d7SRichard Henderson }
488cc2b90d7SRichard Henderson 
4896175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env)
4906175f5a0SRichard Henderson {
4919b5b74daSRichard Henderson     /* The choice of non-zero value is arbitrary.  */
4929b5b74daSRichard Henderson     env->vscr_sat.u32[0] = 1;
4936175f5a0SRichard Henderson }
4946175f5a0SRichard Henderson 
495fcf5ef2aSThomas Huth /* vprtybq */
496d57fbd8fSLucas Mateus Castro (alqotel) void helper_VPRTYBQ(ppc_avr_t *r, ppc_avr_t *b, uint32_t v)
497fcf5ef2aSThomas Huth {
498fcf5ef2aSThomas Huth     uint64_t res = b->u64[0] ^ b->u64[1];
499fcf5ef2aSThomas Huth     res ^= res >> 32;
500fcf5ef2aSThomas Huth     res ^= res >> 16;
501fcf5ef2aSThomas Huth     res ^= res >> 8;
5023c385a93SMark Cave-Ayland     r->VsrD(1) = res & 1;
5033c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
504fcf5ef2aSThomas Huth }
505fcf5ef2aSThomas Huth 
506fcf5ef2aSThomas Huth #define VARITHFP(suffix, func)                                          \
507fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
508fcf5ef2aSThomas Huth                           ppc_avr_t *b)                                 \
509fcf5ef2aSThomas Huth     {                                                                   \
510fcf5ef2aSThomas Huth         int i;                                                          \
511fcf5ef2aSThomas Huth                                                                         \
51205ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
51305ee3e8aSMark Cave-Ayland             r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status);   \
514fcf5ef2aSThomas Huth         }                                                               \
515fcf5ef2aSThomas Huth     }
516fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add)
517fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub)
518fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min)
519fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max)
520fcf5ef2aSThomas Huth #undef VARITHFP
521fcf5ef2aSThomas Huth 
522fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type)                                       \
523fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
524fcf5ef2aSThomas Huth                            ppc_avr_t *b, ppc_avr_t *c)                  \
525fcf5ef2aSThomas Huth     {                                                                   \
526fcf5ef2aSThomas Huth         int i;                                                          \
52705ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
52805ee3e8aSMark Cave-Ayland             r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \
529fcf5ef2aSThomas Huth                                        type, &env->vec_status);         \
530fcf5ef2aSThomas Huth         }                                                               \
531fcf5ef2aSThomas Huth     }
532fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0);
533fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c);
534fcf5ef2aSThomas Huth #undef VARITHFPFMA
535fcf5ef2aSThomas Huth 
536fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element)                          \
537fcf5ef2aSThomas Huth     {                                                                   \
538fcf5ef2aSThomas Huth         type result = (type)a->element[i] op (type)b->element[i];       \
539fcf5ef2aSThomas Huth         r->element[i] = cvt(result, &sat);                              \
540fcf5ef2aSThomas Huth     }
541fcf5ef2aSThomas Huth 
542fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element)                    \
543fb11ae7dSRichard Henderson     void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat,              \
544fb11ae7dSRichard Henderson                         ppc_avr_t *a, ppc_avr_t *b, uint32_t desc)      \
545fcf5ef2aSThomas Huth     {                                                                   \
546fcf5ef2aSThomas Huth         int sat = 0;                                                    \
547fcf5ef2aSThomas Huth         int i;                                                          \
548fcf5ef2aSThomas Huth                                                                         \
549fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
550fcf5ef2aSThomas Huth             VARITHSAT_CASE(optype, op, cvt, element);                   \
551fcf5ef2aSThomas Huth         }                                                               \
552fcf5ef2aSThomas Huth         if (sat) {                                                      \
553fb11ae7dSRichard Henderson             vscr_sat->u32[0] = 1;                                       \
554fcf5ef2aSThomas Huth         }                                                               \
555fcf5ef2aSThomas Huth     }
556fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt)          \
557fcf5ef2aSThomas Huth     VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element)      \
558fcf5ef2aSThomas Huth     VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element)
559fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt)        \
560fcf5ef2aSThomas Huth     VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element)      \
561fcf5ef2aSThomas Huth     VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element)
562fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb)
563fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh)
564fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw)
565fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub)
566fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh)
567fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw)
568fcf5ef2aSThomas Huth #undef VARITHSAT_CASE
569fcf5ef2aSThomas Huth #undef VARITHSAT_DO
570fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED
571fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED
572fcf5ef2aSThomas Huth 
573c85929b2SLucas Mateus Castro (alqotel) #define VAVG(name, element, etype)                                          \
574c85929b2SLucas Mateus Castro (alqotel)     void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t v)\
575fcf5ef2aSThomas Huth     {                                                                       \
576fcf5ef2aSThomas Huth         int i;                                                              \
577fcf5ef2aSThomas Huth                                                                             \
578fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                      \
579fcf5ef2aSThomas Huth             etype x = (etype)a->element[i] + (etype)b->element[i] + 1;      \
580fcf5ef2aSThomas Huth             r->element[i] = x >> 1;                                         \
581fcf5ef2aSThomas Huth         }                                                                   \
582fcf5ef2aSThomas Huth     }
583fcf5ef2aSThomas Huth 
584c85929b2SLucas Mateus Castro (alqotel) VAVG(VAVGSB, s8, int16_t)
585c85929b2SLucas Mateus Castro (alqotel) VAVG(VAVGUB, u8, uint16_t)
586c85929b2SLucas Mateus Castro (alqotel) VAVG(VAVGSH, s16, int32_t)
587c85929b2SLucas Mateus Castro (alqotel) VAVG(VAVGUH, u16, uint32_t)
588c85929b2SLucas Mateus Castro (alqotel) VAVG(VAVGSW, s32, int64_t)
589c85929b2SLucas Mateus Castro (alqotel) VAVG(VAVGUW, u32, uint64_t)
590fcf5ef2aSThomas Huth #undef VAVG
591fcf5ef2aSThomas Huth 
592*26c964f8SLucas Mateus Castro (alqotel) #define VABSDU(name, element)                                           \
593*26c964f8SLucas Mateus Castro (alqotel) void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t v)\
594fcf5ef2aSThomas Huth {                                                                       \
595fcf5ef2aSThomas Huth     int i;                                                              \
596fcf5ef2aSThomas Huth                                                                         \
597fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                      \
598fcf5ef2aSThomas Huth         r->element[i] = (a->element[i] > b->element[i]) ?               \
599fcf5ef2aSThomas Huth             (a->element[i] - b->element[i]) :                           \
600fcf5ef2aSThomas Huth             (b->element[i] - a->element[i]);                            \
601fcf5ef2aSThomas Huth     }                                                                   \
602fcf5ef2aSThomas Huth }
603fcf5ef2aSThomas Huth 
604b6cb41b2SDavid Gibson /*
605b6cb41b2SDavid Gibson  * VABSDU - Vector absolute difference unsigned
606fcf5ef2aSThomas Huth  *   name    - instruction mnemonic suffix (b: byte, h: halfword, w: word)
607fcf5ef2aSThomas Huth  *   element - element type to access from vector
608fcf5ef2aSThomas Huth  */
609*26c964f8SLucas Mateus Castro (alqotel) VABSDU(VABSDUB, u8)
610*26c964f8SLucas Mateus Castro (alqotel) VABSDU(VABSDUH, u16)
611*26c964f8SLucas Mateus Castro (alqotel) VABSDU(VABSDUW, u32)
612fcf5ef2aSThomas Huth #undef VABSDU
613fcf5ef2aSThomas Huth 
614fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element)                                       \
615fcf5ef2aSThomas Huth     void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r,             \
616fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
617fcf5ef2aSThomas Huth     {                                                                   \
618fcf5ef2aSThomas Huth         int i;                                                          \
619fcf5ef2aSThomas Huth                                                                         \
62005ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
621fcf5ef2aSThomas Huth             float32 t = cvt(b->element[i], &env->vec_status);           \
62205ee3e8aSMark Cave-Ayland             r->f32[i] = float32_scalbn(t, -uim, &env->vec_status);      \
623fcf5ef2aSThomas Huth         }                                                               \
624fcf5ef2aSThomas Huth     }
625fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32)
626fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32)
627fcf5ef2aSThomas Huth #undef VCF
628fcf5ef2aSThomas Huth 
629eb936dc0SMatheus Ferst #define VCMPNEZ(NAME, ELEM) \
630eb936dc0SMatheus Ferst void helper_##NAME(ppc_vsr_t *t, ppc_vsr_t *a, ppc_vsr_t *b, uint32_t desc) \
631fcf5ef2aSThomas Huth {                                                                           \
632eb936dc0SMatheus Ferst     for (int i = 0; i < ARRAY_SIZE(t->ELEM); i++) {                         \
633eb936dc0SMatheus Ferst         t->ELEM[i] = ((a->ELEM[i] == 0) || (b->ELEM[i] == 0) ||             \
634eb936dc0SMatheus Ferst                       (a->ELEM[i] != b->ELEM[i])) ? -1 : 0;                 \
635fcf5ef2aSThomas Huth     }                                                                       \
636fcf5ef2aSThomas Huth }
637eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZB, u8)
638eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZH, u16)
639eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZW, u32)
640eb936dc0SMatheus Ferst #undef VCMPNEZ
641fcf5ef2aSThomas Huth 
642fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record)                       \
643fcf5ef2aSThomas Huth     void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r,            \
644fcf5ef2aSThomas Huth                              ppc_avr_t *a, ppc_avr_t *b)                \
645fcf5ef2aSThomas Huth     {                                                                   \
646fcf5ef2aSThomas Huth         uint32_t ones = (uint32_t)-1;                                   \
647fcf5ef2aSThomas Huth         uint32_t all = ones;                                            \
648fcf5ef2aSThomas Huth         uint32_t none = 0;                                              \
649fcf5ef2aSThomas Huth         int i;                                                          \
650fcf5ef2aSThomas Huth                                                                         \
65105ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
652fcf5ef2aSThomas Huth             uint32_t result;                                            \
65371bfd65cSRichard Henderson             FloatRelation rel =                                         \
65471bfd65cSRichard Henderson                 float32_compare_quiet(a->f32[i], b->f32[i],             \
655fcf5ef2aSThomas Huth                                       &env->vec_status);                \
656fcf5ef2aSThomas Huth             if (rel == float_relation_unordered) {                      \
657fcf5ef2aSThomas Huth                 result = 0;                                             \
658fcf5ef2aSThomas Huth             } else if (rel compare order) {                             \
659fcf5ef2aSThomas Huth                 result = ones;                                          \
660fcf5ef2aSThomas Huth             } else {                                                    \
661fcf5ef2aSThomas Huth                 result = 0;                                             \
662fcf5ef2aSThomas Huth             }                                                           \
663fcf5ef2aSThomas Huth             r->u32[i] = result;                                         \
664fcf5ef2aSThomas Huth             all &= result;                                              \
665fcf5ef2aSThomas Huth             none |= result;                                             \
666fcf5ef2aSThomas Huth         }                                                               \
667fcf5ef2aSThomas Huth         if (record) {                                                   \
668fcf5ef2aSThomas Huth             env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1);       \
669fcf5ef2aSThomas Huth         }                                                               \
670fcf5ef2aSThomas Huth     }
671fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order)          \
672fcf5ef2aSThomas Huth     VCMPFP_DO(suffix, compare, order, 0)        \
673fcf5ef2aSThomas Huth     VCMPFP_DO(suffix##_dot, compare, order, 1)
674fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal)
675fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less)
676fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater)
677fcf5ef2aSThomas Huth #undef VCMPFP_DO
678fcf5ef2aSThomas Huth #undef VCMPFP
679fcf5ef2aSThomas Huth 
680fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r,
681fcf5ef2aSThomas Huth                                     ppc_avr_t *a, ppc_avr_t *b, int record)
682fcf5ef2aSThomas Huth {
683fcf5ef2aSThomas Huth     int i;
684fcf5ef2aSThomas Huth     int all_in = 0;
685fcf5ef2aSThomas Huth 
68605ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
68771bfd65cSRichard Henderson         FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i],
68805ee3e8aSMark Cave-Ayland                                                      &env->vec_status);
689fcf5ef2aSThomas Huth         if (le_rel == float_relation_unordered) {
690fcf5ef2aSThomas Huth             r->u32[i] = 0xc0000000;
691fcf5ef2aSThomas Huth             all_in = 1;
692fcf5ef2aSThomas Huth         } else {
69305ee3e8aSMark Cave-Ayland             float32 bneg = float32_chs(b->f32[i]);
69471bfd65cSRichard Henderson             FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg,
69505ee3e8aSMark Cave-Ayland                                                          &env->vec_status);
696fcf5ef2aSThomas Huth             int le = le_rel != float_relation_greater;
697fcf5ef2aSThomas Huth             int ge = ge_rel != float_relation_less;
698fcf5ef2aSThomas Huth 
699fcf5ef2aSThomas Huth             r->u32[i] = ((!le) << 31) | ((!ge) << 30);
700fcf5ef2aSThomas Huth             all_in |= (!le | !ge);
701fcf5ef2aSThomas Huth         }
702fcf5ef2aSThomas Huth     }
703fcf5ef2aSThomas Huth     if (record) {
704fcf5ef2aSThomas Huth         env->crf[6] = (all_in == 0) << 1;
705fcf5ef2aSThomas Huth     }
706fcf5ef2aSThomas Huth }
707fcf5ef2aSThomas Huth 
/*
 * Bounds compare without a condition-register update: forwards to
 * vcmpbfp_internal() with record = 0, so env->crf[6] is left untouched.
 */
708fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
709fcf5ef2aSThomas Huth {
710fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 0);
711fcf5ef2aSThomas Huth }
712fcf5ef2aSThomas Huth 
/*
 * Recording form of the bounds compare: forwards to vcmpbfp_internal() with
 * record = 1, which additionally writes the summary into env->crf[6].
 */
713fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
714fcf5ef2aSThomas Huth                         ppc_avr_t *b)
715fcf5ef2aSThomas Huth {
716fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 1);
717fcf5ef2aSThomas Huth }
718fcf5ef2aSThomas Huth 
719fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element)                                    \
720fcf5ef2aSThomas Huth     void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r,             \
721fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
722fcf5ef2aSThomas Huth     {                                                                   \
723fcf5ef2aSThomas Huth         int i;                                                          \
724fcf5ef2aSThomas Huth         int sat = 0;                                                    \
725fcf5ef2aSThomas Huth         float_status s = env->vec_status;                               \
726fcf5ef2aSThomas Huth                                                                         \
727fcf5ef2aSThomas Huth         set_float_rounding_mode(float_round_to_zero, &s);               \
72805ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
72905ee3e8aSMark Cave-Ayland             if (float32_is_any_nan(b->f32[i])) {                        \
730fcf5ef2aSThomas Huth                 r->element[i] = 0;                                      \
731fcf5ef2aSThomas Huth             } else {                                                    \
73205ee3e8aSMark Cave-Ayland                 float64 t = float32_to_float64(b->f32[i], &s);          \
733fcf5ef2aSThomas Huth                 int64_t j;                                              \
734fcf5ef2aSThomas Huth                                                                         \
735fcf5ef2aSThomas Huth                 t = float64_scalbn(t, uim, &s);                         \
736fcf5ef2aSThomas Huth                 j = float64_to_int64(t, &s);                            \
737fcf5ef2aSThomas Huth                 r->element[i] = satcvt(j, &sat);                        \
738fcf5ef2aSThomas Huth             }                                                           \
739fcf5ef2aSThomas Huth         }                                                               \
740fcf5ef2aSThomas Huth         if (sat) {                                                      \
7416175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
742fcf5ef2aSThomas Huth         }                                                               \
743fcf5ef2aSThomas Huth     }
744fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32)
745fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32)
746fcf5ef2aSThomas Huth #undef VCT
747fcf5ef2aSThomas Huth 
/*
 * Callback type used by xviger(): takes one 32-bit word from each source
 * operand plus a product mask and returns their partial sum as a 64-bit
 * value.  Implemented by ger_rank8(), ger_rank4() and ger_rank2().
 */
74834553153SLucas Mateus Castro (alqotel) typedef int64_t do_ger(uint32_t, uint32_t, uint32_t);
74934553153SLucas Mateus Castro (alqotel) 
/*
 * Sum of up to eight products of the 4-bit fields of a and b, both extracted
 * with sextract32().  Field k (bits 4k..4k+3) contributes only when bit k of
 * mask is set.
 */
static int64_t ger_rank8(uint32_t a, uint32_t b, uint32_t mask)
{
    int64_t acc = 0;

    for (int k = 0; k < 8; k++) {
        if (mask & (1u << k)) {
            int64_t x = sextract32(a, 4 * k, 4);
            int64_t y = sextract32(b, 4 * k, 4);

            acc += x * y;
        }
    }
    return acc;
}
76034553153SLucas Mateus Castro (alqotel) 
/*
 * Sum of up to four products of the 8-bit fields of a and b.  The field of a
 * is taken with sextract32() and the field of b with extract32(), so the two
 * operands are not treated alike.  Field k (bits 8k..8k+7) contributes only
 * when bit k of mask is set.
 */
static int64_t ger_rank4(uint32_t a, uint32_t b, uint32_t mask)
{
    int64_t acc = 0;

    for (int k = 0; k < 4; k++) {
        if (mask & (1u << k)) {
            int64_t x = sextract32(a, 8 * k, 8);
            int64_t y = extract32(b, 8 * k, 8);

            acc += x * y;
        }
    }
    return acc;
}
77134553153SLucas Mateus Castro (alqotel) 
/*
 * Sum of up to two products of the 16-bit fields of a and b, both extracted
 * with sextract32().  Field k (bits 16k..16k+15) contributes only when bit k
 * of mask is set.
 */
static int64_t ger_rank2(uint32_t a, uint32_t b, uint32_t mask)
{
    int64_t acc = 0;

    for (int k = 0; k < 2; k++) {
        if (mask & (1u << k)) {
            int64_t x = sextract32(a, 16 * k, 16);
            int64_t y = sextract32(b, 16 * k, 16);

            acc += x * y;
        }
    }
    return acc;
}
78334553153SLucas Mateus Castro (alqotel) 
78434553153SLucas Mateus Castro (alqotel) static void xviger(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, ppc_acc_t  *at,
78534553153SLucas Mateus Castro (alqotel)                    uint32_t mask, bool sat, bool acc, do_ger ger)
78634553153SLucas Mateus Castro (alqotel) {
78734553153SLucas Mateus Castro (alqotel)     uint8_t pmsk = FIELD_EX32(mask, GER_MSK, PMSK),
78834553153SLucas Mateus Castro (alqotel)             xmsk = FIELD_EX32(mask, GER_MSK, XMSK),
78934553153SLucas Mateus Castro (alqotel)             ymsk = FIELD_EX32(mask, GER_MSK, YMSK);
79034553153SLucas Mateus Castro (alqotel)     uint8_t xmsk_bit, ymsk_bit;
79134553153SLucas Mateus Castro (alqotel)     int64_t psum;
79234553153SLucas Mateus Castro (alqotel)     int i, j;
79334553153SLucas Mateus Castro (alqotel)     for (i = 0, xmsk_bit = 1 << 3; i < 4; i++, xmsk_bit >>= 1) {
79434553153SLucas Mateus Castro (alqotel)         for (j = 0, ymsk_bit = 1 << 3; j < 4; j++, ymsk_bit >>= 1) {
79534553153SLucas Mateus Castro (alqotel)             if ((xmsk_bit & xmsk) && (ymsk_bit & ymsk)) {
79634553153SLucas Mateus Castro (alqotel)                 psum = ger(a->VsrW(i), b->VsrW(j), pmsk);
79734553153SLucas Mateus Castro (alqotel)                 if (acc) {
79834553153SLucas Mateus Castro (alqotel)                     psum += at[i].VsrSW(j);
79934553153SLucas Mateus Castro (alqotel)                 }
80034553153SLucas Mateus Castro (alqotel)                 if (sat && psum > INT32_MAX) {
80134553153SLucas Mateus Castro (alqotel)                     set_vscr_sat(env);
80234553153SLucas Mateus Castro (alqotel)                     at[i].VsrSW(j) = INT32_MAX;
80334553153SLucas Mateus Castro (alqotel)                 } else if (sat && psum < INT32_MIN) {
80434553153SLucas Mateus Castro (alqotel)                     set_vscr_sat(env);
80534553153SLucas Mateus Castro (alqotel)                     at[i].VsrSW(j) = INT32_MIN;
80634553153SLucas Mateus Castro (alqotel)                 } else {
80734553153SLucas Mateus Castro (alqotel)                     at[i].VsrSW(j) = (int32_t) psum;
80834553153SLucas Mateus Castro (alqotel)                 }
80934553153SLucas Mateus Castro (alqotel)             } else {
81034553153SLucas Mateus Castro (alqotel)                 at[i].VsrSW(j) = 0;
81134553153SLucas Mateus Castro (alqotel)             }
81234553153SLucas Mateus Castro (alqotel)         }
81334553153SLucas Mateus Castro (alqotel)     }
81434553153SLucas Mateus Castro (alqotel) }
81534553153SLucas Mateus Castro (alqotel) 
/*
 * 4-bit integer GER: runs xviger() with ger_rank8 as the partial-sum
 * callback, saturation off and accumulation off (entries are overwritten).
 */
81634553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
81734553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
81834553153SLucas Mateus Castro (alqotel)                      ppc_acc_t *at, uint32_t mask)
81934553153SLucas Mateus Castro (alqotel) {
82034553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, false, ger_rank8);
82134553153SLucas Mateus Castro (alqotel) }
82234553153SLucas Mateus Castro (alqotel) 
/*
 * 4-bit integer GER, accumulating form: runs xviger() with ger_rank8,
 * saturation off and accumulation on (new sums are added to the existing
 * entries).
 */
82334553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
82434553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
82534553153SLucas Mateus Castro (alqotel)                        ppc_acc_t *at, uint32_t mask)
82634553153SLucas Mateus Castro (alqotel) {
82734553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, true, ger_rank8);
82834553153SLucas Mateus Castro (alqotel) }
82934553153SLucas Mateus Castro (alqotel) 
/*
 * 8-bit integer GER: runs xviger() with ger_rank4 as the partial-sum
 * callback, saturation off and accumulation off (entries are overwritten).
 */
83034553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
83134553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
83234553153SLucas Mateus Castro (alqotel)                      ppc_acc_t *at, uint32_t mask)
83334553153SLucas Mateus Castro (alqotel) {
83434553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, false, ger_rank4);
83534553153SLucas Mateus Castro (alqotel) }
83634553153SLucas Mateus Castro (alqotel) 
/*
 * 8-bit integer GER, accumulating form: runs xviger() with ger_rank4,
 * saturation off and accumulation on.
 */
83734553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
83834553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
83934553153SLucas Mateus Castro (alqotel)                        ppc_acc_t *at, uint32_t mask)
84034553153SLucas Mateus Castro (alqotel) {
84134553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, true, ger_rank4);
84234553153SLucas Mateus Castro (alqotel) }
84334553153SLucas Mateus Castro (alqotel) 
/*
 * 8-bit integer GER, saturating and accumulating form: runs xviger() with
 * ger_rank4, saturation on and accumulation on.
 */
84434553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
84534553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4SPP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
84634553153SLucas Mateus Castro (alqotel)                         ppc_acc_t *at, uint32_t mask)
84734553153SLucas Mateus Castro (alqotel) {
84834553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, true, true, ger_rank4);
84934553153SLucas Mateus Castro (alqotel) }
85034553153SLucas Mateus Castro (alqotel) 
/*
 * 16-bit integer GER: runs xviger() with ger_rank2 as the partial-sum
 * callback, saturation off and accumulation off (entries are overwritten).
 */
85134553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
85234553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
85334553153SLucas Mateus Castro (alqotel)                       ppc_acc_t *at, uint32_t mask)
85434553153SLucas Mateus Castro (alqotel) {
85534553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, false, ger_rank2);
85634553153SLucas Mateus Castro (alqotel) }
85734553153SLucas Mateus Castro (alqotel) 
/*
 * 16-bit integer GER, saturating form: runs xviger() with ger_rank2,
 * saturation on and accumulation off.
 */
85834553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
85934553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2S(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
86034553153SLucas Mateus Castro (alqotel)                        ppc_acc_t *at, uint32_t mask)
86134553153SLucas Mateus Castro (alqotel) {
86234553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, true, false, ger_rank2);
86334553153SLucas Mateus Castro (alqotel) }
86434553153SLucas Mateus Castro (alqotel) 
/*
 * 16-bit integer GER, accumulating form: runs xviger() with ger_rank2,
 * saturation off and accumulation on.
 */
86534553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
86634553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
86734553153SLucas Mateus Castro (alqotel)                         ppc_acc_t *at, uint32_t mask)
86834553153SLucas Mateus Castro (alqotel) {
86934553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, true, ger_rank2);
87034553153SLucas Mateus Castro (alqotel) }
87134553153SLucas Mateus Castro (alqotel) 
/*
 * 16-bit integer GER, saturating and accumulating form: runs xviger() with
 * ger_rank2, saturation on and accumulation on.
 */
87234553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
87334553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2SPP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
87434553153SLucas Mateus Castro (alqotel)                          ppc_acc_t *at, uint32_t mask)
87534553153SLucas Mateus Castro (alqotel) {
87634553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, true, true, ger_rank2);
87734553153SLucas Mateus Castro (alqotel) }
87834553153SLucas Mateus Castro (alqotel) 
879fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r)
880fcf5ef2aSThomas Huth {
881fcf5ef2aSThomas Huth     target_ulong count = 0;
882fcf5ef2aSThomas Huth     int i;
88360594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
88460594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
885fcf5ef2aSThomas Huth             break;
886fcf5ef2aSThomas Huth         }
887fcf5ef2aSThomas Huth         count++;
888fcf5ef2aSThomas Huth     }
889fcf5ef2aSThomas Huth     return count;
890fcf5ef2aSThomas Huth }
891fcf5ef2aSThomas Huth 
892fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r)
893fcf5ef2aSThomas Huth {
894fcf5ef2aSThomas Huth     target_ulong count = 0;
895fcf5ef2aSThomas Huth     int i;
896fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
89760594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
898fcf5ef2aSThomas Huth             break;
899fcf5ef2aSThomas Huth         }
900fcf5ef2aSThomas Huth         count++;
901fcf5ef2aSThomas Huth     }
902fcf5ef2aSThomas Huth     return count;
903fcf5ef2aSThomas Huth }
904fcf5ef2aSThomas Huth 
905306e4753SLucas Mateus Castro (alqotel) void helper_VMHADDSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
906fcf5ef2aSThomas Huth                       ppc_avr_t *b, ppc_avr_t *c)
907fcf5ef2aSThomas Huth {
908fcf5ef2aSThomas Huth     int sat = 0;
909fcf5ef2aSThomas Huth     int i;
910fcf5ef2aSThomas Huth 
911fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
912fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
913fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
914fcf5ef2aSThomas Huth 
915fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
916fcf5ef2aSThomas Huth     }
917fcf5ef2aSThomas Huth 
918fcf5ef2aSThomas Huth     if (sat) {
9196175f5a0SRichard Henderson         set_vscr_sat(env);
920fcf5ef2aSThomas Huth     }
921fcf5ef2aSThomas Huth }
922fcf5ef2aSThomas Huth 
923306e4753SLucas Mateus Castro (alqotel) void helper_VMHRADDSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
924fcf5ef2aSThomas Huth                        ppc_avr_t *b, ppc_avr_t *c)
925fcf5ef2aSThomas Huth {
926fcf5ef2aSThomas Huth     int sat = 0;
927fcf5ef2aSThomas Huth     int i;
928fcf5ef2aSThomas Huth 
929fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
930fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i] + 0x00004000;
931fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
932fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
933fcf5ef2aSThomas Huth     }
934fcf5ef2aSThomas Huth 
935fcf5ef2aSThomas Huth     if (sat) {
9366175f5a0SRichard Henderson         set_vscr_sat(env);
937fcf5ef2aSThomas Huth     }
938fcf5ef2aSThomas Huth }
939fcf5ef2aSThomas Huth 
940dc46167aSLucas Mateus Castro (alqotel) void helper_VMLADDUHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c,
941dc46167aSLucas Mateus Castro (alqotel)                       uint32_t v)
942fcf5ef2aSThomas Huth {
943fcf5ef2aSThomas Huth     int i;
944fcf5ef2aSThomas Huth 
945fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
946fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
947fcf5ef2aSThomas Huth         r->s16[i] = (int16_t) (prod + c->s16[i]);
948fcf5ef2aSThomas Huth     }
949fcf5ef2aSThomas Huth }
950fcf5ef2aSThomas Huth 
/*
 * VMRG_DO - interleave half of the elements of a with half of those of b.
 *   name    - pasted onto helper_v to form the function name
 *   element - ppc_avr_t member used only to derive the element count
 *   access  - accessor macro used to address the elements (VsrB/VsrH/VsrW)
 *   ofs     - index of the first source element; evaluated inside the
 *             generated function, so it may name the local 'half'
 * Element i + ofs of a lands in result slot 2i and the same element of b in
 * slot 2i + 1.  The result is built in a temporary and copied to *r at the
 * end, so r may be the same object as a or b.
 */
951d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs)                                  \
952fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)            \
953fcf5ef2aSThomas Huth     {                                                                        \
954fcf5ef2aSThomas Huth         ppc_avr_t result;                                                    \
955d81c2040SMark Cave-Ayland         int i, half = ARRAY_SIZE(r->element) / 2;                            \
956fcf5ef2aSThomas Huth                                                                              \
957d81c2040SMark Cave-Ayland         for (i = 0; i < half; i++) {                                         \
958d81c2040SMark Cave-Ayland             result.access(i * 2 + 0) = a->access(i + ofs);                   \
959d81c2040SMark Cave-Ayland             result.access(i * 2 + 1) = b->access(i + ofs);                   \
960fcf5ef2aSThomas Huth         }                                                                    \
961fcf5ef2aSThomas Huth         *r = result;                                                         \
962fcf5ef2aSThomas Huth     }
963d81c2040SMark Cave-Ayland 
/*
 * VMRG - emit the mrgl<suffix> and mrgh<suffix> helpers.
 * mrgl starts at element 'half' (the local declared by VMRG_DO) and mrgh
 * starts at element 0.
 */
964d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access)          \
965d81c2040SMark Cave-Ayland     VMRG_DO(mrgl##suffix, element, access, half)   \
966d81c2040SMark Cave-Ayland     VMRG_DO(mrgh##suffix, element, access, 0)
967d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB)
968d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH)
969d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW)
970fcf5ef2aSThomas Huth #undef VMRG_DO
971fcf5ef2aSThomas Huth #undef VMRG
972fcf5ef2aSThomas Huth 
973b2dc03a5SMatheus Ferst void helper_VMSUMMBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
974fcf5ef2aSThomas Huth {
975fcf5ef2aSThomas Huth     int32_t prod[16];
976fcf5ef2aSThomas Huth     int i;
977fcf5ef2aSThomas Huth 
978fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s8); i++) {
979fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s8[i] * b->u8[i];
980fcf5ef2aSThomas Huth     }
981fcf5ef2aSThomas Huth 
982fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
983fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] +
984fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
985fcf5ef2aSThomas Huth     }
986fcf5ef2aSThomas Huth }
987fcf5ef2aSThomas Huth 
9886f52f731SMatheus Ferst void helper_VMSUMSHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
989fcf5ef2aSThomas Huth {
990fcf5ef2aSThomas Huth     int32_t prod[8];
991fcf5ef2aSThomas Huth     int i;
992fcf5ef2aSThomas Huth 
993fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
994fcf5ef2aSThomas Huth         prod[i] = a->s16[i] * b->s16[i];
995fcf5ef2aSThomas Huth     }
996fcf5ef2aSThomas Huth 
997fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
998fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1];
999fcf5ef2aSThomas Huth     }
1000fcf5ef2aSThomas Huth }
1001fcf5ef2aSThomas Huth 
10026f52f731SMatheus Ferst void helper_VMSUMSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1003fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1004fcf5ef2aSThomas Huth {
1005fcf5ef2aSThomas Huth     int32_t prod[8];
1006fcf5ef2aSThomas Huth     int i;
1007fcf5ef2aSThomas Huth     int sat = 0;
1008fcf5ef2aSThomas Huth 
1009fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
1010fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s16[i] * b->s16[i];
1011fcf5ef2aSThomas Huth     }
1012fcf5ef2aSThomas Huth 
1013fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1014fcf5ef2aSThomas Huth         int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1];
1015fcf5ef2aSThomas Huth 
1016fcf5ef2aSThomas Huth         r->u32[i] = cvtsdsw(t, &sat);
1017fcf5ef2aSThomas Huth     }
1018fcf5ef2aSThomas Huth 
1019fcf5ef2aSThomas Huth     if (sat) {
10206175f5a0SRichard Henderson         set_vscr_sat(env);
1021fcf5ef2aSThomas Huth     }
1022fcf5ef2aSThomas Huth }
1023fcf5ef2aSThomas Huth 
1024b2dc03a5SMatheus Ferst void helper_VMSUMUBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1025fcf5ef2aSThomas Huth {
1026fcf5ef2aSThomas Huth     uint16_t prod[16];
1027fcf5ef2aSThomas Huth     int i;
1028fcf5ef2aSThomas Huth 
1029fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
1030fcf5ef2aSThomas Huth         prod[i] = a->u8[i] * b->u8[i];
1031fcf5ef2aSThomas Huth     }
1032fcf5ef2aSThomas Huth 
1033fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
1034fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] +
1035fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
1036fcf5ef2aSThomas Huth     }
1037fcf5ef2aSThomas Huth }
1038fcf5ef2aSThomas Huth 
103989a5a1aeSMatheus Ferst void helper_VMSUMUHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1040fcf5ef2aSThomas Huth {
1041fcf5ef2aSThomas Huth     uint32_t prod[8];
1042fcf5ef2aSThomas Huth     int i;
1043fcf5ef2aSThomas Huth 
1044fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
1045fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
1046fcf5ef2aSThomas Huth     }
1047fcf5ef2aSThomas Huth 
1048fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
1049fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1];
1050fcf5ef2aSThomas Huth     }
1051fcf5ef2aSThomas Huth }
1052fcf5ef2aSThomas Huth 
105389a5a1aeSMatheus Ferst void helper_VMSUMUHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1054fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1055fcf5ef2aSThomas Huth {
1056fcf5ef2aSThomas Huth     uint32_t prod[8];
1057fcf5ef2aSThomas Huth     int i;
1058fcf5ef2aSThomas Huth     int sat = 0;
1059fcf5ef2aSThomas Huth 
1060fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
1061fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
1062fcf5ef2aSThomas Huth     }
1063fcf5ef2aSThomas Huth 
1064fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1065fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1];
1066fcf5ef2aSThomas Huth 
1067fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
1068fcf5ef2aSThomas Huth     }
1069fcf5ef2aSThomas Huth 
1070fcf5ef2aSThomas Huth     if (sat) {
10716175f5a0SRichard Henderson         set_vscr_sat(env);
1072fcf5ef2aSThomas Huth     }
1073fcf5ef2aSThomas Huth }
1074fcf5ef2aSThomas Huth 
10754fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast)   \
107680eca687SLucas Mateus Castro (alqotel)     void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
1077fcf5ef2aSThomas Huth     {                                                                   \
1078fcf5ef2aSThomas Huth         int i;                                                          \
1079fcf5ef2aSThomas Huth                                                                         \
10804fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
10814fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i) *           \
10824fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i);            \
1083fcf5ef2aSThomas Huth         }                                                               \
1084fcf5ef2aSThomas Huth     }
10854fbc89edSMark Cave-Ayland 
10864fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast)   \
108780eca687SLucas Mateus Castro (alqotel)     void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
10884fbc89edSMark Cave-Ayland     {                                                                   \
10894fbc89edSMark Cave-Ayland         int i;                                                          \
10904fbc89edSMark Cave-Ayland                                                                         \
10914fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
10924fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) *       \
10934fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i + 1);        \
10944fbc89edSMark Cave-Ayland         }                                                               \
10954fbc89edSMark Cave-Ayland     }
10964fbc89edSMark Cave-Ayland 
10974fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast)       \
109880eca687SLucas Mateus Castro (alqotel)     VMUL_DO_EVN(MULE##suffix, mul_element, mul_access, prod_access, cast)  \
109980eca687SLucas Mateus Castro (alqotel)     VMUL_DO_ODD(MULO##suffix, mul_element, mul_access, prod_access, cast)
110080eca687SLucas Mateus Castro (alqotel) VMUL(SB, s8, VsrSB, VsrSH, int16_t)
110180eca687SLucas Mateus Castro (alqotel) VMUL(SH, s16, VsrSH, VsrSW, int32_t)
110280eca687SLucas Mateus Castro (alqotel) VMUL(SW, s32, VsrSW, VsrSD, int64_t)
110380eca687SLucas Mateus Castro (alqotel) VMUL(UB, u8, VsrB, VsrH, uint16_t)
110480eca687SLucas Mateus Castro (alqotel) VMUL(UH, u16, VsrH, VsrW, uint32_t)
110580eca687SLucas Mateus Castro (alqotel) VMUL(UW, u32, VsrW, VsrD, uint64_t)
11064fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN
11074fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD
1108fcf5ef2aSThomas Huth #undef VMUL
1109fcf5ef2aSThomas Huth 
111041c2877fSMatheus Ferst void helper_XXPERMX(ppc_vsr_t *t, ppc_vsr_t *s0, ppc_vsr_t *s1, ppc_vsr_t *pcv,
111141c2877fSMatheus Ferst                     target_ulong uim)
111241c2877fSMatheus Ferst {
111341c2877fSMatheus Ferst     int i, idx;
111441c2877fSMatheus Ferst     ppc_vsr_t tmp = { .u64 = {0, 0} };
111541c2877fSMatheus Ferst 
111641c2877fSMatheus Ferst     for (i = 0; i < ARRAY_SIZE(t->u8); i++) {
111741c2877fSMatheus Ferst         if ((pcv->VsrB(i) >> 5) == uim) {
111841c2877fSMatheus Ferst             idx = pcv->VsrB(i) & 0x1f;
111941c2877fSMatheus Ferst             if (idx < ARRAY_SIZE(t->u8)) {
112041c2877fSMatheus Ferst                 tmp.VsrB(i) = s0->VsrB(idx);
112141c2877fSMatheus Ferst             } else {
112241c2877fSMatheus Ferst                 tmp.VsrB(i) = s1->VsrB(idx - ARRAY_SIZE(t->u8));
112341c2877fSMatheus Ferst             }
112441c2877fSMatheus Ferst         }
112541c2877fSMatheus Ferst     }
112641c2877fSMatheus Ferst 
112741c2877fSMatheus Ferst     *t = tmp;
112841c2877fSMatheus Ferst }
112941c2877fSMatheus Ferst 
11301700f2bfSLucas Mateus Castro (alqotel) void helper_VDIVSQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
11311700f2bfSLucas Mateus Castro (alqotel) {
11321700f2bfSLucas Mateus Castro (alqotel)     Int128 neg1 = int128_makes64(-1);
11331700f2bfSLucas Mateus Castro (alqotel)     Int128 int128_min = int128_make128(0, INT64_MIN);
11341700f2bfSLucas Mateus Castro (alqotel)     if (likely(int128_nz(b->s128) &&
11351700f2bfSLucas Mateus Castro (alqotel)               (int128_ne(a->s128, int128_min) || int128_ne(b->s128, neg1)))) {
11361700f2bfSLucas Mateus Castro (alqotel)         t->s128 = int128_divs(a->s128, b->s128);
11371700f2bfSLucas Mateus Castro (alqotel)     } else {
11381700f2bfSLucas Mateus Castro (alqotel)         t->s128 = a->s128; /* Undefined behavior */
11391700f2bfSLucas Mateus Castro (alqotel)     }
11401700f2bfSLucas Mateus Castro (alqotel) }
11411700f2bfSLucas Mateus Castro (alqotel) 
11421700f2bfSLucas Mateus Castro (alqotel) void helper_VDIVUQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
11431700f2bfSLucas Mateus Castro (alqotel) {
11441700f2bfSLucas Mateus Castro (alqotel)     if (int128_nz(b->s128)) {
11451700f2bfSLucas Mateus Castro (alqotel)         t->s128 = int128_divu(a->s128, b->s128);
11461700f2bfSLucas Mateus Castro (alqotel)     } else {
11471700f2bfSLucas Mateus Castro (alqotel)         t->s128 = a->s128; /* Undefined behavior */
11481700f2bfSLucas Mateus Castro (alqotel)     }
11491700f2bfSLucas Mateus Castro (alqotel) }
11501700f2bfSLucas Mateus Castro (alqotel) 
1151a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVESD(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
1152a173ba88SLucas Mateus Castro (alqotel) {
1153a173ba88SLucas Mateus Castro (alqotel)     int i;
1154a173ba88SLucas Mateus Castro (alqotel)     int64_t high;
1155a173ba88SLucas Mateus Castro (alqotel)     uint64_t low;
1156a173ba88SLucas Mateus Castro (alqotel)     for (i = 0; i < 2; i++) {
1157a173ba88SLucas Mateus Castro (alqotel)         high = a->s64[i];
1158a173ba88SLucas Mateus Castro (alqotel)         low = 0;
1159a173ba88SLucas Mateus Castro (alqotel)         if (unlikely((high == INT64_MIN && b->s64[i] == -1) || !b->s64[i])) {
1160a173ba88SLucas Mateus Castro (alqotel)             t->s64[i] = a->s64[i]; /* Undefined behavior */
1161a173ba88SLucas Mateus Castro (alqotel)         } else {
1162a173ba88SLucas Mateus Castro (alqotel)             divs128(&low, &high, b->s64[i]);
1163a173ba88SLucas Mateus Castro (alqotel)             t->s64[i] = low;
1164a173ba88SLucas Mateus Castro (alqotel)         }
1165a173ba88SLucas Mateus Castro (alqotel)     }
1166a173ba88SLucas Mateus Castro (alqotel) }
1167a173ba88SLucas Mateus Castro (alqotel) 
1168a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVEUD(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
1169a173ba88SLucas Mateus Castro (alqotel) {
1170a173ba88SLucas Mateus Castro (alqotel)     int i;
1171a173ba88SLucas Mateus Castro (alqotel)     uint64_t high, low;
1172a173ba88SLucas Mateus Castro (alqotel)     for (i = 0; i < 2; i++) {
1173a173ba88SLucas Mateus Castro (alqotel)         high = a->u64[i];
1174a173ba88SLucas Mateus Castro (alqotel)         low = 0;
1175a173ba88SLucas Mateus Castro (alqotel)         if (unlikely(!b->u64[i])) {
1176a173ba88SLucas Mateus Castro (alqotel)             t->u64[i] = a->u64[i]; /* Undefined behavior */
1177a173ba88SLucas Mateus Castro (alqotel)         } else {
1178a173ba88SLucas Mateus Castro (alqotel)             divu128(&low, &high, b->u64[i]);
1179a173ba88SLucas Mateus Castro (alqotel)             t->u64[i] = low;
1180a173ba88SLucas Mateus Castro (alqotel)         }
1181a173ba88SLucas Mateus Castro (alqotel)     }
1182a173ba88SLucas Mateus Castro (alqotel) }
1183a173ba88SLucas Mateus Castro (alqotel) 
1184a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVESQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
1185a173ba88SLucas Mateus Castro (alqotel) {
1186a173ba88SLucas Mateus Castro (alqotel)     Int128 high, low;
1187a173ba88SLucas Mateus Castro (alqotel)     Int128 int128_min = int128_make128(0, INT64_MIN);
1188a173ba88SLucas Mateus Castro (alqotel)     Int128 neg1 = int128_makes64(-1);
1189a173ba88SLucas Mateus Castro (alqotel) 
1190a173ba88SLucas Mateus Castro (alqotel)     high = a->s128;
1191a173ba88SLucas Mateus Castro (alqotel)     low = int128_zero();
1192a173ba88SLucas Mateus Castro (alqotel)     if (unlikely(!int128_nz(b->s128) ||
1193a173ba88SLucas Mateus Castro (alqotel)                  (int128_eq(b->s128, neg1) && int128_eq(high, int128_min)))) {
1194a173ba88SLucas Mateus Castro (alqotel)         t->s128 = a->s128; /* Undefined behavior */
1195a173ba88SLucas Mateus Castro (alqotel)     } else {
1196a173ba88SLucas Mateus Castro (alqotel)         divs256(&low, &high, b->s128);
1197a173ba88SLucas Mateus Castro (alqotel)         t->s128 = low;
1198a173ba88SLucas Mateus Castro (alqotel)     }
1199a173ba88SLucas Mateus Castro (alqotel) }
1200a173ba88SLucas Mateus Castro (alqotel) 
1201a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVEUQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
1202a173ba88SLucas Mateus Castro (alqotel) {
1203a173ba88SLucas Mateus Castro (alqotel)     Int128 high, low;
1204a173ba88SLucas Mateus Castro (alqotel) 
1205a173ba88SLucas Mateus Castro (alqotel)     high = a->s128;
1206a173ba88SLucas Mateus Castro (alqotel)     low = int128_zero();
1207a173ba88SLucas Mateus Castro (alqotel)     if (unlikely(!int128_nz(b->s128))) {
1208a173ba88SLucas Mateus Castro (alqotel)         t->s128 = a->s128; /* Undefined behavior */
1209a173ba88SLucas Mateus Castro (alqotel)     } else {
1210a173ba88SLucas Mateus Castro (alqotel)         divu256(&low, &high, b->s128);
1211a173ba88SLucas Mateus Castro (alqotel)         t->s128 = low;
1212a173ba88SLucas Mateus Castro (alqotel)     }
1213a173ba88SLucas Mateus Castro (alqotel) }
1214a173ba88SLucas Mateus Castro (alqotel) 
1215b80bec3aSLucas Mateus Castro (alqotel) void helper_VMODSQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
1216b80bec3aSLucas Mateus Castro (alqotel) {
1217b80bec3aSLucas Mateus Castro (alqotel)     Int128 neg1 = int128_makes64(-1);
1218b80bec3aSLucas Mateus Castro (alqotel)     Int128 int128_min = int128_make128(0, INT64_MIN);
1219b80bec3aSLucas Mateus Castro (alqotel)     if (likely(int128_nz(b->s128) &&
1220b80bec3aSLucas Mateus Castro (alqotel)               (int128_ne(a->s128, int128_min) || int128_ne(b->s128, neg1)))) {
1221b80bec3aSLucas Mateus Castro (alqotel)         t->s128 = int128_rems(a->s128, b->s128);
1222b80bec3aSLucas Mateus Castro (alqotel)     } else {
1223b80bec3aSLucas Mateus Castro (alqotel)         t->s128 = int128_zero(); /* Undefined behavior */
1224b80bec3aSLucas Mateus Castro (alqotel)     }
1225b80bec3aSLucas Mateus Castro (alqotel) }
1226b80bec3aSLucas Mateus Castro (alqotel) 
1227b80bec3aSLucas Mateus Castro (alqotel) void helper_VMODUQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b)
1228b80bec3aSLucas Mateus Castro (alqotel) {
1229b80bec3aSLucas Mateus Castro (alqotel)     if (likely(int128_nz(b->s128))) {
1230b80bec3aSLucas Mateus Castro (alqotel)         t->s128 = int128_remu(a->s128, b->s128);
1231b80bec3aSLucas Mateus Castro (alqotel)     } else {
1232b80bec3aSLucas Mateus Castro (alqotel)         t->s128 = int128_zero(); /* Undefined behavior */
1233b80bec3aSLucas Mateus Castro (alqotel)     }
1234b80bec3aSLucas Mateus Castro (alqotel) }
1235b80bec3aSLucas Mateus Castro (alqotel) 
123628347fe2SMatheus Ferst void helper_VPERM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1237fcf5ef2aSThomas Huth {
1238fcf5ef2aSThomas Huth     ppc_avr_t result;
1239fcf5ef2aSThomas Huth     int i;
1240fcf5ef2aSThomas Huth 
124160594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
124260594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1243fcf5ef2aSThomas Huth         int index = s & 0xf;
1244fcf5ef2aSThomas Huth 
1245fcf5ef2aSThomas Huth         if (s & 0x10) {
124660594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1247fcf5ef2aSThomas Huth         } else {
124860594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1249fcf5ef2aSThomas Huth         }
1250fcf5ef2aSThomas Huth     }
1251fcf5ef2aSThomas Huth     *r = result;
1252fcf5ef2aSThomas Huth }
1253fcf5ef2aSThomas Huth 
125428347fe2SMatheus Ferst void helper_VPERMR(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1255fcf5ef2aSThomas Huth {
1256fcf5ef2aSThomas Huth     ppc_avr_t result;
1257fcf5ef2aSThomas Huth     int i;
1258fcf5ef2aSThomas Huth 
125960594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
126060594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1261fcf5ef2aSThomas Huth         int index = 15 - (s & 0xf);
1262fcf5ef2aSThomas Huth 
1263fcf5ef2aSThomas Huth         if (s & 0x10) {
126460594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1265fcf5ef2aSThomas Huth         } else {
126660594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1267fcf5ef2aSThomas Huth         }
1268fcf5ef2aSThomas Huth     }
1269fcf5ef2aSThomas Huth     *r = result;
1270fcf5ef2aSThomas Huth }
1271fcf5ef2aSThomas Huth 
1272618574ddSMatheus Ferst #define XXGENPCV_BE_EXP(NAME, SZ) \
1273b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _be_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \
1274b090f4f1SMatheus Ferst {                                                                   \
1275b090f4f1SMatheus Ferst     ppc_vsr_t tmp;                                                  \
1276b090f4f1SMatheus Ferst                                                                     \
1277b090f4f1SMatheus Ferst     /* Initialize tmp with the result of an all-zeros mask */       \
1278b090f4f1SMatheus Ferst     tmp.VsrD(0) = 0x1011121314151617;                               \
1279b090f4f1SMatheus Ferst     tmp.VsrD(1) = 0x18191A1B1C1D1E1F;                               \
1280b090f4f1SMatheus Ferst                                                                     \
1281b090f4f1SMatheus Ferst     /* Iterate over the most significant byte of each element */    \
1282b090f4f1SMatheus Ferst     for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) {        \
1283b090f4f1SMatheus Ferst         if (b->VsrB(i) & 0x80) {                                    \
1284b090f4f1SMatheus Ferst             /* Update each byte of the element */                   \
1285b090f4f1SMatheus Ferst             for (int k = 0; k < SZ; k++) {                          \
1286b090f4f1SMatheus Ferst                 tmp.VsrB(i + k) = j + k;                            \
1287b090f4f1SMatheus Ferst             }                                                       \
1288b090f4f1SMatheus Ferst             j += SZ;                                                \
1289b090f4f1SMatheus Ferst         }                                                           \
1290b090f4f1SMatheus Ferst     }                                                               \
1291b090f4f1SMatheus Ferst                                                                     \
1292b090f4f1SMatheus Ferst     *t = tmp;                                                       \
1293618574ddSMatheus Ferst }
1294618574ddSMatheus Ferst 
1295618574ddSMatheus Ferst #define XXGENPCV_BE_COMP(NAME, SZ) \
1296b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _be_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\
1297b090f4f1SMatheus Ferst {                                                                   \
1298b090f4f1SMatheus Ferst     ppc_vsr_t tmp = { .u64 = { 0, 0 } };                            \
1299b090f4f1SMatheus Ferst                                                                     \
1300b090f4f1SMatheus Ferst     /* Iterate over the most significant byte of each element */    \
1301b090f4f1SMatheus Ferst     for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) {        \
1302b090f4f1SMatheus Ferst         if (b->VsrB(i) & 0x80) {                                    \
1303b090f4f1SMatheus Ferst             /* Update each byte of the element */                   \
1304b090f4f1SMatheus Ferst             for (int k = 0; k < SZ; k++) {                          \
1305b090f4f1SMatheus Ferst                 tmp.VsrB(j + k) = i + k;                            \
1306b090f4f1SMatheus Ferst             }                                                       \
1307b090f4f1SMatheus Ferst             j += SZ;                                                \
1308b090f4f1SMatheus Ferst         }                                                           \
1309b090f4f1SMatheus Ferst     }                                                               \
1310b090f4f1SMatheus Ferst                                                                     \
1311b090f4f1SMatheus Ferst     *t = tmp;                                                       \
1312618574ddSMatheus Ferst }
1313618574ddSMatheus Ferst 
1314618574ddSMatheus Ferst #define XXGENPCV_LE_EXP(NAME, SZ) \
1315b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _le_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \
1316b090f4f1SMatheus Ferst {                                                                   \
1317b090f4f1SMatheus Ferst     ppc_vsr_t tmp;                                                  \
1318b090f4f1SMatheus Ferst                                                                     \
1319b090f4f1SMatheus Ferst     /* Initialize tmp with the result of an all-zeros mask */       \
1320b090f4f1SMatheus Ferst     tmp.VsrD(0) = 0x1F1E1D1C1B1A1918;                               \
1321b090f4f1SMatheus Ferst     tmp.VsrD(1) = 0x1716151413121110;                               \
1322b090f4f1SMatheus Ferst                                                                     \
1323b090f4f1SMatheus Ferst     /* Iterate over the most significant byte of each element */    \
1324b090f4f1SMatheus Ferst     for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) {        \
1325b090f4f1SMatheus Ferst         /* Reverse indexing of "i" */                               \
1326b090f4f1SMatheus Ferst         const int idx = ARRAY_SIZE(b->u8) - i - SZ;                 \
1327b090f4f1SMatheus Ferst         if (b->VsrB(idx) & 0x80) {                                  \
1328b090f4f1SMatheus Ferst             /* Update each byte of the element */                   \
1329b090f4f1SMatheus Ferst             for (int k = 0, rk = SZ - 1; k < SZ; k++, rk--) {       \
1330b090f4f1SMatheus Ferst                 tmp.VsrB(idx + rk) = j + k;                         \
1331b090f4f1SMatheus Ferst             }                                                       \
1332b090f4f1SMatheus Ferst             j += SZ;                                                \
1333b090f4f1SMatheus Ferst         }                                                           \
1334b090f4f1SMatheus Ferst     }                                                               \
1335b090f4f1SMatheus Ferst                                                                     \
1336b090f4f1SMatheus Ferst     *t = tmp;                                                       \
1337618574ddSMatheus Ferst }
1338618574ddSMatheus Ferst 
1339618574ddSMatheus Ferst #define XXGENPCV_LE_COMP(NAME, SZ) \
1340b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _le_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\
1341b090f4f1SMatheus Ferst {                                                                   \
1342b090f4f1SMatheus Ferst     ppc_vsr_t tmp = { .u64 = { 0, 0 } };                            \
1343b090f4f1SMatheus Ferst                                                                     \
1344b090f4f1SMatheus Ferst     /* Iterate over the most significant byte of each element */    \
1345b090f4f1SMatheus Ferst     for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) {        \
1346b090f4f1SMatheus Ferst         if (b->VsrB(ARRAY_SIZE(b->u8) - i - SZ) & 0x80) {           \
1347b090f4f1SMatheus Ferst             /* Update each byte of the element */                   \
1348b090f4f1SMatheus Ferst             for (int k = 0, rk = SZ - 1; k < SZ; k++, rk--) {       \
1349b090f4f1SMatheus Ferst                 /* Reverse indexing of "j" */                       \
1350b090f4f1SMatheus Ferst                 const int idx = ARRAY_SIZE(b->u8) - j - SZ;         \
1351b090f4f1SMatheus Ferst                 tmp.VsrB(idx + rk) = i + k;                         \
1352b090f4f1SMatheus Ferst             }                                                       \
1353b090f4f1SMatheus Ferst             j += SZ;                                                \
1354b090f4f1SMatheus Ferst         }                                                           \
1355b090f4f1SMatheus Ferst     }                                                               \
1356b090f4f1SMatheus Ferst                                                                     \
1357b090f4f1SMatheus Ferst     *t = tmp;                                                       \
1358b090f4f1SMatheus Ferst }
1359b090f4f1SMatheus Ferst 
1360618574ddSMatheus Ferst #define XXGENPCV(NAME, SZ) \
1361618574ddSMatheus Ferst     XXGENPCV_BE_EXP(NAME, SZ)  \
1362618574ddSMatheus Ferst     XXGENPCV_BE_COMP(NAME, SZ) \
1363618574ddSMatheus Ferst     XXGENPCV_LE_EXP(NAME, SZ)  \
1364618574ddSMatheus Ferst     XXGENPCV_LE_COMP(NAME, SZ) \
1365618574ddSMatheus Ferst 
1366b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVBM, 1)
1367b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVHM, 2)
1368b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVWM, 4)
1369b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVDM, 8)
1370618574ddSMatheus Ferst 
1371618574ddSMatheus Ferst #undef XXGENPCV_BE_EXP
1372618574ddSMatheus Ferst #undef XXGENPCV_BE_COMP
1373618574ddSMatheus Ferst #undef XXGENPCV_LE_EXP
1374618574ddSMatheus Ferst #undef XXGENPCV_LE_COMP
1375b090f4f1SMatheus Ferst #undef XXGENPCV
1376b090f4f1SMatheus Ferst 
1377e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1378fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)])
1379fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (i)
1380fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) != 0)
1381fcf5ef2aSThomas Huth #else
1382fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)])
1383fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (1 - i)
1384fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) == 0)
1385fcf5ef2aSThomas Huth #endif
13868f7d41e0SMatheus Ferst #define EXTRACT_BIT(avr, i, index) \
13878f7d41e0SMatheus Ferst         (extract64((avr)->VsrD(i), 63 - index, 1))
1388fcf5ef2aSThomas Huth 
1389fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1390fcf5ef2aSThomas Huth {
1391fcf5ef2aSThomas Huth     int i, j;
1392fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
1393fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1394fcf5ef2aSThomas Huth         for (j = 0; j < 8; j++) {
1395fcf5ef2aSThomas Huth             int index = VBPERMQ_INDEX(b, (i * 8) + j);
1396fcf5ef2aSThomas Huth             if (index < 64 && EXTRACT_BIT(a, i, index)) {
1397fcf5ef2aSThomas Huth                 result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j);
1398fcf5ef2aSThomas Huth             }
1399fcf5ef2aSThomas Huth         }
1400fcf5ef2aSThomas Huth     }
1401fcf5ef2aSThomas Huth     *r = result;
1402fcf5ef2aSThomas Huth }
1403fcf5ef2aSThomas Huth 
1404fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1405fcf5ef2aSThomas Huth {
1406fcf5ef2aSThomas Huth     int i;
1407fcf5ef2aSThomas Huth     uint64_t perm = 0;
1408fcf5ef2aSThomas Huth 
1409fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
1410fcf5ef2aSThomas Huth         int index = VBPERMQ_INDEX(b, i);
1411fcf5ef2aSThomas Huth 
1412fcf5ef2aSThomas Huth         if (index < 128) {
1413fcf5ef2aSThomas Huth             uint64_t mask = (1ull << (63 - (index & 0x3F)));
1414fcf5ef2aSThomas Huth             if (a->u64[VBPERMQ_DW(index)] & mask) {
1415fcf5ef2aSThomas Huth                 perm |= (0x8000 >> i);
1416fcf5ef2aSThomas Huth             }
1417fcf5ef2aSThomas Huth         }
1418fcf5ef2aSThomas Huth     }
1419fcf5ef2aSThomas Huth 
14203c385a93SMark Cave-Ayland     r->VsrD(0) = perm;
14213c385a93SMark Cave-Ayland     r->VsrD(1) = 0;
1422fcf5ef2aSThomas Huth }
1423fcf5ef2aSThomas Huth 
1424fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX
1425fcf5ef2aSThomas Huth #undef VBPERMQ_DW
1426fcf5ef2aSThomas Huth 
1427fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp)                   \
1428fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)  \
1429fcf5ef2aSThomas Huth {                                                             \
1430fcf5ef2aSThomas Huth     int i, j;                                                 \
1431fcf5ef2aSThomas Huth     trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])];    \
1432fcf5ef2aSThomas Huth                                                               \
1433fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, srcfld) {                         \
1434fcf5ef2aSThomas Huth         prod[i] = 0;                                          \
1435fcf5ef2aSThomas Huth         for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) {      \
1436fcf5ef2aSThomas Huth             if (a->srcfld[i] & (1ull << j)) {                 \
1437fcf5ef2aSThomas Huth                 prod[i] ^= ((trgtyp)b->srcfld[i] << j);       \
1438fcf5ef2aSThomas Huth             }                                                 \
1439fcf5ef2aSThomas Huth         }                                                     \
1440fcf5ef2aSThomas Huth     }                                                         \
1441fcf5ef2aSThomas Huth                                                               \
1442fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, trgfld) {                         \
1443fcf5ef2aSThomas Huth         r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1];         \
1444fcf5ef2aSThomas Huth     }                                                         \
1445fcf5ef2aSThomas Huth }
1446fcf5ef2aSThomas Huth 
1447fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t)
1448fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t)
1449fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t)
1450fcf5ef2aSThomas Huth 
1451e82ca8acSMatheus Ferst void helper_VPMSUMD(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1452fcf5ef2aSThomas Huth {
1453fcf5ef2aSThomas Huth     int i, j;
1454e82ca8acSMatheus Ferst     Int128 tmp, prod[2] = {int128_zero(), int128_zero()};
1455fcf5ef2aSThomas Huth 
1456fcf5ef2aSThomas Huth     for (j = 0; j < 64; j++) {
1457e82ca8acSMatheus Ferst         for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
1458e82ca8acSMatheus Ferst             if (a->VsrD(i) & (1ull << j)) {
1459e82ca8acSMatheus Ferst                 tmp = int128_make64(b->VsrD(i));
1460e82ca8acSMatheus Ferst                 tmp = int128_lshift(tmp, j);
1461e82ca8acSMatheus Ferst                 prod[i] = int128_xor(prod[i], tmp);
1462fcf5ef2aSThomas Huth             }
1463fcf5ef2aSThomas Huth         }
1464fcf5ef2aSThomas Huth     }
1465fcf5ef2aSThomas Huth 
1466e82ca8acSMatheus Ferst     r->s128 = int128_xor(prod[0], prod[1]);
1467fcf5ef2aSThomas Huth }
1468fcf5ef2aSThomas Huth 
1469e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1470fcf5ef2aSThomas Huth #define PKBIG 1
1471fcf5ef2aSThomas Huth #else
1472fcf5ef2aSThomas Huth #define PKBIG 0
1473fcf5ef2aSThomas Huth #endif
1474fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1475fcf5ef2aSThomas Huth {
1476fcf5ef2aSThomas Huth     int i, j;
1477fcf5ef2aSThomas Huth     ppc_avr_t result;
1478e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1479fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { a, b };
1480fcf5ef2aSThomas Huth #else
1481fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { b, a };
1482fcf5ef2aSThomas Huth #endif
1483fcf5ef2aSThomas Huth 
1484fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1485fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(j, u32) {
1486fcf5ef2aSThomas Huth             uint32_t e = x[i]->u32[j];
1487fcf5ef2aSThomas Huth 
1488fcf5ef2aSThomas Huth             result.u16[4 * i + j] = (((e >> 9) & 0xfc00) |
1489fcf5ef2aSThomas Huth                                      ((e >> 6) & 0x3e0) |
1490fcf5ef2aSThomas Huth                                      ((e >> 3) & 0x1f));
1491fcf5ef2aSThomas Huth         }
1492fcf5ef2aSThomas Huth     }
1493fcf5ef2aSThomas Huth     *r = result;
1494fcf5ef2aSThomas Huth }
1495fcf5ef2aSThomas Huth 
1496fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat)                               \
1497fcf5ef2aSThomas Huth     void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r,             \
1498fcf5ef2aSThomas Huth                             ppc_avr_t *a, ppc_avr_t *b)                 \
1499fcf5ef2aSThomas Huth     {                                                                   \
1500fcf5ef2aSThomas Huth         int i;                                                          \
1501fcf5ef2aSThomas Huth         int sat = 0;                                                    \
1502fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1503fcf5ef2aSThomas Huth         ppc_avr_t *a0 = PKBIG ? a : b;                                  \
1504fcf5ef2aSThomas Huth         ppc_avr_t *a1 = PKBIG ? b : a;                                  \
1505fcf5ef2aSThomas Huth                                                                         \
1506fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(i, from) {                                 \
1507fcf5ef2aSThomas Huth             result.to[i] = cvt(a0->from[i], &sat);                      \
1508fcf5ef2aSThomas Huth             result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\
1509fcf5ef2aSThomas Huth         }                                                               \
1510fcf5ef2aSThomas Huth         *r = result;                                                    \
1511fcf5ef2aSThomas Huth         if (dosat && sat) {                                             \
15126175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
1513fcf5ef2aSThomas Huth         }                                                               \
1514fcf5ef2aSThomas Huth     }
1515fcf5ef2aSThomas Huth #define I(x, y) (x)
1516fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1)
1517fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1)
1518fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1)
1519fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1)
1520fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1)
1521fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1)
1522fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1)
1523fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1)
1524fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1)
1525fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0)
1526fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0)
1527fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0)
1528fcf5ef2aSThomas Huth #undef I
1529fcf5ef2aSThomas Huth #undef VPK
1530fcf5ef2aSThomas Huth #undef PKBIG
1531fcf5ef2aSThomas Huth 
1532fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1533fcf5ef2aSThomas Huth {
1534fcf5ef2aSThomas Huth     int i;
1535fcf5ef2aSThomas Huth 
153605ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
153705ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status);
1538fcf5ef2aSThomas Huth     }
1539fcf5ef2aSThomas Huth }
1540fcf5ef2aSThomas Huth 
1541fcf5ef2aSThomas Huth #define VRFI(suffix, rounding)                                  \
1542fcf5ef2aSThomas Huth     void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r,    \
1543fcf5ef2aSThomas Huth                              ppc_avr_t *b)                      \
1544fcf5ef2aSThomas Huth     {                                                           \
1545fcf5ef2aSThomas Huth         int i;                                                  \
1546fcf5ef2aSThomas Huth         float_status s = env->vec_status;                       \
1547fcf5ef2aSThomas Huth                                                                 \
1548fcf5ef2aSThomas Huth         set_float_rounding_mode(rounding, &s);                  \
154905ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {              \
155005ee3e8aSMark Cave-Ayland             r->f32[i] = float32_round_to_int (b->f32[i], &s);   \
1551fcf5ef2aSThomas Huth         }                                                       \
1552fcf5ef2aSThomas Huth     }
1553fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even)
1554fcf5ef2aSThomas Huth VRFI(m, float_round_down)
1555fcf5ef2aSThomas Huth VRFI(p, float_round_up)
1556fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero)
1557fcf5ef2aSThomas Huth #undef VRFI
1558fcf5ef2aSThomas Huth 
1559fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1560fcf5ef2aSThomas Huth {
1561fcf5ef2aSThomas Huth     int i;
1562fcf5ef2aSThomas Huth 
156305ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
156405ee3e8aSMark Cave-Ayland         float32 t = float32_sqrt(b->f32[i], &env->vec_status);
1565fcf5ef2aSThomas Huth 
156605ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, t, &env->vec_status);
1567fcf5ef2aSThomas Huth     }
1568fcf5ef2aSThomas Huth }
1569fcf5ef2aSThomas Huth 
1570fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert)                                  \
157102c74f0eSMatheus Ferst void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \
1572fcf5ef2aSThomas Huth {                                                                           \
1573fcf5ef2aSThomas Huth     int i;                                                                  \
1574fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                          \
1575fcf5ef2aSThomas Huth         uint##size##_t src1 = a->element[i];                                \
1576fcf5ef2aSThomas Huth         uint##size##_t src2 = b->element[i];                                \
1577fcf5ef2aSThomas Huth         uint##size##_t src3 = r->element[i];                                \
1578fcf5ef2aSThomas Huth         uint##size##_t begin, end, shift, mask, rot_val;                    \
1579fcf5ef2aSThomas Huth                                                                             \
1580fcf5ef2aSThomas Huth         shift = extract##size(src2, 0, 6);                                  \
1581fcf5ef2aSThomas Huth         end   = extract##size(src2, 8, 6);                                  \
1582fcf5ef2aSThomas Huth         begin = extract##size(src2, 16, 6);                                 \
1583fcf5ef2aSThomas Huth         rot_val = rol##size(src1, shift);                                   \
1584fcf5ef2aSThomas Huth         mask = mask_u##size(begin, end);                                    \
1585fcf5ef2aSThomas Huth         if (insert) {                                                       \
1586fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask) | (src3 & ~mask);              \
1587fcf5ef2aSThomas Huth         } else {                                                            \
1588fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask);                               \
1589fcf5ef2aSThomas Huth         }                                                                   \
1590fcf5ef2aSThomas Huth     }                                                                       \
1591fcf5ef2aSThomas Huth }
1592fcf5ef2aSThomas Huth 
159302c74f0eSMatheus Ferst VRLMI(VRLDMI, 64, u64, 1);
159402c74f0eSMatheus Ferst VRLMI(VRLWMI, 32, u32, 1);
159502c74f0eSMatheus Ferst VRLMI(VRLDNM, 64, u64, 0);
159602c74f0eSMatheus Ferst VRLMI(VRLWNM, 32, u32, 0);
1597fcf5ef2aSThomas Huth 
1598fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1599fcf5ef2aSThomas Huth {
1600fcf5ef2aSThomas Huth     int i;
1601fcf5ef2aSThomas Huth 
160205ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
160305ee3e8aSMark Cave-Ayland         r->f32[i] = float32_exp2(b->f32[i], &env->vec_status);
1604fcf5ef2aSThomas Huth     }
1605fcf5ef2aSThomas Huth }
1606fcf5ef2aSThomas Huth 
1607fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1608fcf5ef2aSThomas Huth {
1609fcf5ef2aSThomas Huth     int i;
1610fcf5ef2aSThomas Huth 
161105ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
161205ee3e8aSMark Cave-Ayland         r->f32[i] = float32_log2(b->f32[i], &env->vec_status);
1613fcf5ef2aSThomas Huth     }
1614fcf5ef2aSThomas Huth }
1615fcf5ef2aSThomas Huth 
161660caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left)                            \
161760caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b)  \
161860caf221SAvinesh Kumar {                                                               \
1619f297c4c6SMatheus Ferst     int index = (a & 0xf) * 8;                                  \
162060caf221SAvinesh Kumar     if (left) {                                                 \
1621f297c4c6SMatheus Ferst         index = 128 - index - size;                             \
162260caf221SAvinesh Kumar     }                                                           \
162360caf221SAvinesh Kumar     return int128_getlo(int128_rshift(b->s128, index)) &        \
162460caf221SAvinesh Kumar         MAKE_64BIT_MASK(0, size);                               \
162560caf221SAvinesh Kumar }
162660caf221SAvinesh Kumar VEXTU_X_DO(vextublx,  8, 1)
162760caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1)
162860caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1)
162960caf221SAvinesh Kumar VEXTU_X_DO(vextubrx,  8, 0)
163060caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0)
163160caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0)
163260caf221SAvinesh Kumar #undef VEXTU_X_DO
163360caf221SAvinesh Kumar 
1634fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1635fcf5ef2aSThomas Huth {
1636fcf5ef2aSThomas Huth     int i;
1637fcf5ef2aSThomas Huth     unsigned int shift, bytes, size;
1638fcf5ef2aSThomas Huth 
1639fcf5ef2aSThomas Huth     size = ARRAY_SIZE(r->u8);
1640fcf5ef2aSThomas Huth     for (i = 0; i < size; i++) {
164163be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;             /* extract shift value */
164263be02fcSAnton Blanchard         bytes = (a->VsrB(i) << 8) +           /* extract adjacent bytes */
164363be02fcSAnton Blanchard             (((i + 1) < size) ? a->VsrB(i + 1) : 0);
164463be02fcSAnton Blanchard         r->VsrB(i) = (bytes << shift) >> 8;   /* shift and store result */
1645fcf5ef2aSThomas Huth     }
1646fcf5ef2aSThomas Huth }
1647fcf5ef2aSThomas Huth 
1648fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1649fcf5ef2aSThomas Huth {
1650fcf5ef2aSThomas Huth     int i;
1651fcf5ef2aSThomas Huth     unsigned int shift, bytes;
1652fcf5ef2aSThomas Huth 
1653b6cb41b2SDavid Gibson     /*
1654b6cb41b2SDavid Gibson      * Use reverse order, as destination and source register can be
1655b6cb41b2SDavid Gibson      * same. Its being modified in place saving temporary, reverse
1656b6cb41b2SDavid Gibson      * order will guarantee that computed result is not fed back.
1657fcf5ef2aSThomas Huth      */
1658fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
165963be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;               /* extract shift value */
166063be02fcSAnton Blanchard         bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i);
1661fcf5ef2aSThomas Huth                                                 /* extract adjacent bytes */
166263be02fcSAnton Blanchard         r->VsrB(i) = (bytes >> shift) & 0xFF;   /* shift and store result */
1663fcf5ef2aSThomas Huth     }
1664fcf5ef2aSThomas Huth }
1665fcf5ef2aSThomas Huth 
1666fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift)
1667fcf5ef2aSThomas Huth {
1668fcf5ef2aSThomas Huth     int sh = shift & 0xf;
1669fcf5ef2aSThomas Huth     int i;
1670fcf5ef2aSThomas Huth     ppc_avr_t result;
1671fcf5ef2aSThomas Huth 
1672fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
1673fcf5ef2aSThomas Huth         int index = sh + i;
1674fcf5ef2aSThomas Huth         if (index > 0xf) {
167560594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index - 0x10);
1676fcf5ef2aSThomas Huth         } else {
167760594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1678fcf5ef2aSThomas Huth         }
1679fcf5ef2aSThomas Huth     }
1680fcf5ef2aSThomas Huth     *r = result;
1681fcf5ef2aSThomas Huth }
1682fcf5ef2aSThomas Huth 
1683fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1684fcf5ef2aSThomas Huth {
16853c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1686fcf5ef2aSThomas Huth 
1687e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1688fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1689fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1690fcf5ef2aSThomas Huth #else
1691fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1692fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1693fcf5ef2aSThomas Huth #endif
1694fcf5ef2aSThomas Huth }
1695fcf5ef2aSThomas Huth 
1696e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
16972cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[IDX])
16982cc12af3SMatheus Ferst #else
16992cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[15 - (IDX)] - (SIZE) + 1)
17002cc12af3SMatheus Ferst #endif
17012cc12af3SMatheus Ferst 
17022cc12af3SMatheus Ferst #define VINSX(SUFFIX, TYPE) \
17032cc12af3SMatheus Ferst void glue(glue(helper_VINS, SUFFIX), LX)(CPUPPCState *env, ppc_avr_t *t,       \
17042cc12af3SMatheus Ferst                                          uint64_t val, target_ulong index)     \
17052cc12af3SMatheus Ferst {                                                                              \
17062cc12af3SMatheus Ferst     const int maxidx = ARRAY_SIZE(t->u8) - sizeof(TYPE);                       \
17072cc12af3SMatheus Ferst     target_long idx = index;                                                   \
17082cc12af3SMatheus Ferst                                                                                \
17092cc12af3SMatheus Ferst     if (idx < 0 || idx > maxidx) {                                             \
17102cc12af3SMatheus Ferst         idx =  idx < 0 ? sizeof(TYPE) - idx : idx;                             \
17112cc12af3SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR,                                         \
17122cc12af3SMatheus Ferst             "Invalid index for Vector Insert Element after 0x" TARGET_FMT_lx   \
17132cc12af3SMatheus Ferst             ", RA = " TARGET_FMT_ld " > %d\n", env->nip, idx, maxidx);         \
17142cc12af3SMatheus Ferst     } else {                                                                   \
17152cc12af3SMatheus Ferst         TYPE src = val;                                                        \
17162cc12af3SMatheus Ferst         memcpy(ELEM_ADDR(t, idx, sizeof(TYPE)), &src, sizeof(TYPE));           \
17172cc12af3SMatheus Ferst     }                                                                          \
17182cc12af3SMatheus Ferst }
17192cc12af3SMatheus Ferst VINSX(B, uint8_t)
17202cc12af3SMatheus Ferst VINSX(H, uint16_t)
17212cc12af3SMatheus Ferst VINSX(W, uint32_t)
17222cc12af3SMatheus Ferst VINSX(D, uint64_t)
17232cc12af3SMatheus Ferst #undef ELEM_ADDR
17242cc12af3SMatheus Ferst #undef VINSX
1725e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
172628110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
172728110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
172828110b72SMatheus Ferst                    target_ulong index)                                         \
172928110b72SMatheus Ferst {                                                                              \
173028110b72SMatheus Ferst     const target_long idx = index;                                             \
173128110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *a, *b };                                             \
173228110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
173328110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
173428110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2 - SIZE], (void *)tmp + idx, SIZE); \
173528110b72SMatheus Ferst     } else {                                                                   \
173628110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
173728110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
173828110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
173928110b72SMatheus Ferst     }                                                                          \
174028110b72SMatheus Ferst }
174128110b72SMatheus Ferst #else
174228110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
174328110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
174428110b72SMatheus Ferst                    target_ulong index)                                         \
174528110b72SMatheus Ferst {                                                                              \
174628110b72SMatheus Ferst     const target_long idx = index;                                             \
174728110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *b, *a };                                             \
174828110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
174928110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
175028110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2],                                  \
175128110b72SMatheus Ferst                (void *)tmp + sizeof(tmp) - SIZE - idx, SIZE);                  \
175228110b72SMatheus Ferst     } else {                                                                   \
175328110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
175428110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
175528110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
175628110b72SMatheus Ferst     }                                                                          \
175728110b72SMatheus Ferst }
175828110b72SMatheus Ferst #endif
175928110b72SMatheus Ferst VEXTDVLX(VEXTDUBVLX, 1)
176028110b72SMatheus Ferst VEXTDVLX(VEXTDUHVLX, 2)
176128110b72SMatheus Ferst VEXTDVLX(VEXTDUWVLX, 4)
176228110b72SMatheus Ferst VEXTDVLX(VEXTDDVLX, 8)
176328110b72SMatheus Ferst #undef VEXTDVLX
1764e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1765fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1766fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1767fcf5ef2aSThomas Huth     {                                                                        \
1768fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1769fcf5ef2aSThomas Huth         memmove(&r->u8[8 - es], &b->u8[index], es);                          \
1770fcf5ef2aSThomas Huth         memset(&r->u8[8], 0, 8);                                             \
1771fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8 - es);                                        \
1772fcf5ef2aSThomas Huth     }
1773fcf5ef2aSThomas Huth #else
1774fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1775fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1776fcf5ef2aSThomas Huth     {                                                                        \
1777fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1778fcf5ef2aSThomas Huth         uint32_t s = (16 - index) - es;                                      \
1779fcf5ef2aSThomas Huth         memmove(&r->u8[8], &b->u8[s], es);                                   \
1780fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8);                                             \
1781fcf5ef2aSThomas Huth         memset(&r->u8[8 + es], 0, 8 - es);                                   \
1782fcf5ef2aSThomas Huth     }
1783fcf5ef2aSThomas Huth #endif
1784fcf5ef2aSThomas Huth VEXTRACT(ub, u8)
1785fcf5ef2aSThomas Huth VEXTRACT(uh, u16)
1786fcf5ef2aSThomas Huth VEXTRACT(uw, u32)
1787fcf5ef2aSThomas Huth VEXTRACT(d, u64)
1788fcf5ef2aSThomas Huth #undef VEXTRACT
1789fcf5ef2aSThomas Huth 
1790fb5303ccSMatheus Ferst #define VSTRI(NAME, ELEM, NUM_ELEMS, LEFT) \
1791fb5303ccSMatheus Ferst uint32_t helper_##NAME(ppc_avr_t *t, ppc_avr_t *b) \
1792fb5303ccSMatheus Ferst {                                                   \
1793fb5303ccSMatheus Ferst     int i, idx, crf = 0;                            \
1794fb5303ccSMatheus Ferst                                                     \
1795fb5303ccSMatheus Ferst     for (i = 0; i < NUM_ELEMS; i++) {               \
1796fb5303ccSMatheus Ferst         idx = LEFT ? i : NUM_ELEMS - i - 1;         \
1797fb5303ccSMatheus Ferst         if (b->Vsr##ELEM(idx)) {                    \
1798fb5303ccSMatheus Ferst             t->Vsr##ELEM(idx) = b->Vsr##ELEM(idx);  \
1799fb5303ccSMatheus Ferst         } else {                                    \
1800fb5303ccSMatheus Ferst             crf = 0b0010;                           \
1801fb5303ccSMatheus Ferst             break;                                  \
1802fb5303ccSMatheus Ferst         }                                           \
1803fb5303ccSMatheus Ferst     }                                               \
1804fb5303ccSMatheus Ferst                                                     \
1805fb5303ccSMatheus Ferst     for (; i < NUM_ELEMS; i++) {                    \
1806fb5303ccSMatheus Ferst         idx = LEFT ? i : NUM_ELEMS - i - 1;         \
1807fb5303ccSMatheus Ferst         t->Vsr##ELEM(idx) = 0;                      \
1808fb5303ccSMatheus Ferst     }                                               \
1809fb5303ccSMatheus Ferst                                                     \
1810fb5303ccSMatheus Ferst     return crf;                                     \
1811fb5303ccSMatheus Ferst }
1812fb5303ccSMatheus Ferst VSTRI(VSTRIBL, B, 16, true)
1813fb5303ccSMatheus Ferst VSTRI(VSTRIBR, B, 16, false)
1814fb5303ccSMatheus Ferst VSTRI(VSTRIHL, H, 8, true)
1815fb5303ccSMatheus Ferst VSTRI(VSTRIHR, H, 8, false)
1816fb5303ccSMatheus Ferst #undef VSTRI
1817fb5303ccSMatheus Ferst 
18188f5eeee3SMatheus Ferst void helper_XXEXTRACTUW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index)
18198ad901e5SNikunj A Dadhania {
182003b32c09SMark Cave-Ayland     ppc_vsr_t t = { };
18218ad901e5SNikunj A Dadhania     size_t es = sizeof(uint32_t);
18228ad901e5SNikunj A Dadhania     uint32_t ext_index;
18238ad901e5SNikunj A Dadhania     int i;
18248ad901e5SNikunj A Dadhania 
18258ad901e5SNikunj A Dadhania     ext_index = index;
18268ad901e5SNikunj A Dadhania     for (i = 0; i < es; i++, ext_index++) {
182703b32c09SMark Cave-Ayland         t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16);
18288ad901e5SNikunj A Dadhania     }
18298ad901e5SNikunj A Dadhania 
183003b32c09SMark Cave-Ayland     *xt = t;
18318ad901e5SNikunj A Dadhania }
18328ad901e5SNikunj A Dadhania 
18338f5eeee3SMatheus Ferst void helper_XXINSERTW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index)
18343398b742SNikunj A Dadhania {
183503b32c09SMark Cave-Ayland     ppc_vsr_t t = *xt;
18363398b742SNikunj A Dadhania     size_t es = sizeof(uint32_t);
18373398b742SNikunj A Dadhania     int ins_index, i = 0;
18383398b742SNikunj A Dadhania 
18393398b742SNikunj A Dadhania     ins_index = index;
18403398b742SNikunj A Dadhania     for (i = 0; i < es && ins_index < 16; i++, ins_index++) {
184103b32c09SMark Cave-Ayland         t.VsrB(ins_index) = xb->VsrB(8 - es + i);
18423398b742SNikunj A Dadhania     }
18433398b742SNikunj A Dadhania 
184403b32c09SMark Cave-Ayland     *xt = t;
18453398b742SNikunj A Dadhania }
18463398b742SNikunj A Dadhania 
18471015fcabSMatheus Ferst void helper_XXEVAL(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c,
18481015fcabSMatheus Ferst                    uint32_t desc)
18491015fcabSMatheus Ferst {
18501015fcabSMatheus Ferst     /*
18511015fcabSMatheus Ferst      * Instead of processing imm bit-by-bit, we'll skip the computation of
18521015fcabSMatheus Ferst      * conjunctions whose corresponding bit is unset.
18531015fcabSMatheus Ferst      */
18541015fcabSMatheus Ferst     int bit, imm = simd_data(desc);
18551015fcabSMatheus Ferst     Int128 conj, disj = int128_zero();
18561015fcabSMatheus Ferst 
18571015fcabSMatheus Ferst     /* Iterate over set bits from the least to the most significant bit */
18581015fcabSMatheus Ferst     while (imm) {
18591015fcabSMatheus Ferst         /*
18601015fcabSMatheus Ferst          * Get the next bit to be processed with ctz64. Invert the result of
18611015fcabSMatheus Ferst          * ctz64 to match the indexing used by PowerISA.
18621015fcabSMatheus Ferst          */
18631015fcabSMatheus Ferst         bit = 7 - ctzl(imm);
18641015fcabSMatheus Ferst         if (bit & 0x4) {
18651015fcabSMatheus Ferst             conj = a->s128;
18661015fcabSMatheus Ferst         } else {
18671015fcabSMatheus Ferst             conj = int128_not(a->s128);
18681015fcabSMatheus Ferst         }
18691015fcabSMatheus Ferst         if (bit & 0x2) {
18701015fcabSMatheus Ferst             conj = int128_and(conj, b->s128);
18711015fcabSMatheus Ferst         } else {
18721015fcabSMatheus Ferst             conj = int128_and(conj, int128_not(b->s128));
18731015fcabSMatheus Ferst         }
18741015fcabSMatheus Ferst         if (bit & 0x1) {
18751015fcabSMatheus Ferst             conj = int128_and(conj, c->s128);
18761015fcabSMatheus Ferst         } else {
18771015fcabSMatheus Ferst             conj = int128_and(conj, int128_not(c->s128));
18781015fcabSMatheus Ferst         }
18791015fcabSMatheus Ferst         disj = int128_or(disj, conj);
18801015fcabSMatheus Ferst 
18811015fcabSMatheus Ferst         /* Unset the least significant bit that is set */
18821015fcabSMatheus Ferst         imm &= imm - 1;
18831015fcabSMatheus Ferst     }
18841015fcabSMatheus Ferst 
18851015fcabSMatheus Ferst     t->s128 = disj;
18861015fcabSMatheus Ferst }
18871015fcabSMatheus Ferst 
1888788c6399SMatheus Ferst #define XXBLEND(name, sz) \
1889788c6399SMatheus Ferst void glue(helper_XXBLENDV, name)(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b,  \
1890788c6399SMatheus Ferst                                  ppc_avr_t *c, uint32_t desc)               \
1891788c6399SMatheus Ferst {                                                                           \
1892788c6399SMatheus Ferst     for (int i = 0; i < ARRAY_SIZE(t->glue(u, sz)); i++) {                  \
1893788c6399SMatheus Ferst         t->glue(u, sz)[i] = (c->glue(s, sz)[i] >> (sz - 1)) ?               \
1894788c6399SMatheus Ferst             b->glue(u, sz)[i] : a->glue(u, sz)[i];                          \
1895788c6399SMatheus Ferst     }                                                                       \
1896788c6399SMatheus Ferst }
1897788c6399SMatheus Ferst XXBLEND(B, 8)
1898788c6399SMatheus Ferst XXBLEND(H, 16)
1899788c6399SMatheus Ferst XXBLEND(W, 32)
1900788c6399SMatheus Ferst XXBLEND(D, 64)
1901788c6399SMatheus Ferst #undef XXBLEND
1902788c6399SMatheus Ferst 
1903fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1904fcf5ef2aSThomas Huth {
19053c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1906fcf5ef2aSThomas Huth 
1907e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1908fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1909fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1910fcf5ef2aSThomas Huth #else
1911fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1912fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1913fcf5ef2aSThomas Huth #endif
1914fcf5ef2aSThomas Huth }
1915fcf5ef2aSThomas Huth 
1916fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1917fcf5ef2aSThomas Huth {
1918fcf5ef2aSThomas Huth     int64_t t;
1919fcf5ef2aSThomas Huth     int i, upper;
1920fcf5ef2aSThomas Huth     ppc_avr_t result;
1921fcf5ef2aSThomas Huth     int sat = 0;
1922fcf5ef2aSThomas Huth 
1923fcf5ef2aSThomas Huth     upper = ARRAY_SIZE(r->s32) - 1;
192460594feaSMark Cave-Ayland     t = (int64_t)b->VsrSW(upper);
1925fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
192660594feaSMark Cave-Ayland         t += a->VsrSW(i);
192760594feaSMark Cave-Ayland         result.VsrSW(i) = 0;
1928fcf5ef2aSThomas Huth     }
192960594feaSMark Cave-Ayland     result.VsrSW(upper) = cvtsdsw(t, &sat);
1930fcf5ef2aSThomas Huth     *r = result;
1931fcf5ef2aSThomas Huth 
1932fcf5ef2aSThomas Huth     if (sat) {
19336175f5a0SRichard Henderson         set_vscr_sat(env);
1934fcf5ef2aSThomas Huth     }
1935fcf5ef2aSThomas Huth }
1936fcf5ef2aSThomas Huth 
1937fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1938fcf5ef2aSThomas Huth {
1939fcf5ef2aSThomas Huth     int i, j, upper;
1940fcf5ef2aSThomas Huth     ppc_avr_t result;
1941fcf5ef2aSThomas Huth     int sat = 0;
1942fcf5ef2aSThomas Huth 
1943fcf5ef2aSThomas Huth     upper = 1;
1944fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
194560594feaSMark Cave-Ayland         int64_t t = (int64_t)b->VsrSW(upper + i * 2);
1946fcf5ef2aSThomas Huth 
19477fa0ddc1SAnton Blanchard         result.VsrD(i) = 0;
1948fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u64); j++) {
194960594feaSMark Cave-Ayland             t += a->VsrSW(2 * i + j);
1950fcf5ef2aSThomas Huth         }
195160594feaSMark Cave-Ayland         result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat);
1952fcf5ef2aSThomas Huth     }
1953fcf5ef2aSThomas Huth 
1954fcf5ef2aSThomas Huth     *r = result;
1955fcf5ef2aSThomas Huth     if (sat) {
19566175f5a0SRichard Henderson         set_vscr_sat(env);
1957fcf5ef2aSThomas Huth     }
1958fcf5ef2aSThomas Huth }
1959fcf5ef2aSThomas Huth 
1960fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1961fcf5ef2aSThomas Huth {
1962fcf5ef2aSThomas Huth     int i, j;
1963fcf5ef2aSThomas Huth     int sat = 0;
1964fcf5ef2aSThomas Huth 
1965fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1966fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1967fcf5ef2aSThomas Huth 
1968fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->s32); j++) {
1969fcf5ef2aSThomas Huth             t += a->s8[4 * i + j];
1970fcf5ef2aSThomas Huth         }
1971fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1972fcf5ef2aSThomas Huth     }
1973fcf5ef2aSThomas Huth 
1974fcf5ef2aSThomas Huth     if (sat) {
19756175f5a0SRichard Henderson         set_vscr_sat(env);
1976fcf5ef2aSThomas Huth     }
1977fcf5ef2aSThomas Huth }
1978fcf5ef2aSThomas Huth 
1979fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1980fcf5ef2aSThomas Huth {
1981fcf5ef2aSThomas Huth     int sat = 0;
1982fcf5ef2aSThomas Huth     int i;
1983fcf5ef2aSThomas Huth 
1984fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1985fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1986fcf5ef2aSThomas Huth 
1987fcf5ef2aSThomas Huth         t += a->s16[2 * i] + a->s16[2 * i + 1];
1988fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1989fcf5ef2aSThomas Huth     }
1990fcf5ef2aSThomas Huth 
1991fcf5ef2aSThomas Huth     if (sat) {
19926175f5a0SRichard Henderson         set_vscr_sat(env);
1993fcf5ef2aSThomas Huth     }
1994fcf5ef2aSThomas Huth }
1995fcf5ef2aSThomas Huth 
1996fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1997fcf5ef2aSThomas Huth {
1998fcf5ef2aSThomas Huth     int i, j;
1999fcf5ef2aSThomas Huth     int sat = 0;
2000fcf5ef2aSThomas Huth 
2001fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
2002fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)b->u32[i];
2003fcf5ef2aSThomas Huth 
2004fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u32); j++) {
2005fcf5ef2aSThomas Huth             t += a->u8[4 * i + j];
2006fcf5ef2aSThomas Huth         }
2007fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
2008fcf5ef2aSThomas Huth     }
2009fcf5ef2aSThomas Huth 
2010fcf5ef2aSThomas Huth     if (sat) {
20116175f5a0SRichard Henderson         set_vscr_sat(env);
2012fcf5ef2aSThomas Huth     }
2013fcf5ef2aSThomas Huth }
2014fcf5ef2aSThomas Huth 
2015e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
2016fcf5ef2aSThomas Huth #define UPKHI 1
2017fcf5ef2aSThomas Huth #define UPKLO 0
2018fcf5ef2aSThomas Huth #else
2019fcf5ef2aSThomas Huth #define UPKHI 0
2020fcf5ef2aSThomas Huth #define UPKLO 1
2021fcf5ef2aSThomas Huth #endif
2022fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi)                                              \
2023fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
2024fcf5ef2aSThomas Huth     {                                                                   \
2025fcf5ef2aSThomas Huth         int i;                                                          \
2026fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
2027fcf5ef2aSThomas Huth                                                                         \
2028fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->u32); i++) {                      \
2029fcf5ef2aSThomas Huth             uint16_t e = b->u16[hi ? i : i + 4];                        \
2030fcf5ef2aSThomas Huth             uint8_t a = (e >> 15) ? 0xff : 0;                           \
2031fcf5ef2aSThomas Huth             uint8_t r = (e >> 10) & 0x1f;                               \
2032fcf5ef2aSThomas Huth             uint8_t g = (e >> 5) & 0x1f;                                \
2033fcf5ef2aSThomas Huth             uint8_t b = e & 0x1f;                                       \
2034fcf5ef2aSThomas Huth                                                                         \
2035fcf5ef2aSThomas Huth             result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b;       \
2036fcf5ef2aSThomas Huth         }                                                               \
2037fcf5ef2aSThomas Huth         *r = result;                                                    \
2038fcf5ef2aSThomas Huth     }
2039fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO)
2040fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI)
2041fcf5ef2aSThomas Huth #undef VUPKPX
2042fcf5ef2aSThomas Huth 
2043fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi)                              \
2044fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
2045fcf5ef2aSThomas Huth     {                                                                   \
2046fcf5ef2aSThomas Huth         int i;                                                          \
2047fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
2048fcf5ef2aSThomas Huth                                                                         \
2049fcf5ef2aSThomas Huth         if (hi) {                                                       \
2050fcf5ef2aSThomas Huth             for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) {             \
2051fcf5ef2aSThomas Huth                 result.unpacked[i] = b->packee[i];                      \
2052fcf5ef2aSThomas Huth             }                                                           \
2053fcf5ef2aSThomas Huth         } else {                                                        \
2054fcf5ef2aSThomas Huth             for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \
2055fcf5ef2aSThomas Huth                  i++) {                                                 \
2056fcf5ef2aSThomas Huth                 result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \
2057fcf5ef2aSThomas Huth             }                                                           \
2058fcf5ef2aSThomas Huth         }                                                               \
2059fcf5ef2aSThomas Huth         *r = result;                                                    \
2060fcf5ef2aSThomas Huth     }
2061fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI)
2062fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI)
2063fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI)
2064fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO)
2065fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO)
2066fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO)
2067fcf5ef2aSThomas Huth #undef VUPK
2068fcf5ef2aSThomas Huth #undef UPKHI
2069fcf5ef2aSThomas Huth #undef UPKLO
2070fcf5ef2aSThomas Huth 
2071fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element)                                      \
2072fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *b)                     \
2073fcf5ef2aSThomas Huth     {                                                                   \
2074fcf5ef2aSThomas Huth         int i;                                                          \
2075fcf5ef2aSThomas Huth                                                                         \
207660594feaSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
2077fcf5ef2aSThomas Huth             r->element[i] = name(b->element[i]);                        \
2078fcf5ef2aSThomas Huth         }                                                               \
2079fcf5ef2aSThomas Huth     }
2080fcf5ef2aSThomas Huth 
2081fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8)
2082fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16)
2083fcf5ef2aSThomas Huth 
2084fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8)
2085fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16)
2086fcf5ef2aSThomas Huth 
2087fcf5ef2aSThomas Huth #undef clzb
2088fcf5ef2aSThomas Huth #undef clzh
2089fcf5ef2aSThomas Huth 
2090fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8)
2091fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16)
2092fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v))
2093fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v))
2094fcf5ef2aSThomas Huth 
2095fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8)
2096fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16)
2097fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32)
2098fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64)
2099fcf5ef2aSThomas Huth 
2100fcf5ef2aSThomas Huth #undef ctzb
2101fcf5ef2aSThomas Huth #undef ctzh
2102fcf5ef2aSThomas Huth #undef ctzw
2103fcf5ef2aSThomas Huth #undef ctzd
2104fcf5ef2aSThomas Huth 
2105fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v)
2106fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v)
2107fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v)
2108fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v)
2109fcf5ef2aSThomas Huth 
2110fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8)
2111fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16)
2112fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32)
2113fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64)
2114fcf5ef2aSThomas Huth 
2115fcf5ef2aSThomas Huth #undef popcntb
2116fcf5ef2aSThomas Huth #undef popcnth
2117fcf5ef2aSThomas Huth #undef popcntw
2118fcf5ef2aSThomas Huth #undef popcntd
2119fcf5ef2aSThomas Huth 
2120fcf5ef2aSThomas Huth #undef VGENERIC_DO
2121fcf5ef2aSThomas Huth 
21227ca04286SMatheus Ferst void helper_VADDUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2123fcf5ef2aSThomas Huth {
21247ca04286SMatheus Ferst     r->s128 = int128_add(a->s128, b->s128);
2125fcf5ef2aSThomas Huth }
2126fcf5ef2aSThomas Huth 
2127896d92c8SMatheus Ferst void helper_VADDEUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2128fcf5ef2aSThomas Huth {
2129896d92c8SMatheus Ferst     r->s128 = int128_add(int128_add(a->s128, b->s128),
2130896d92c8SMatheus Ferst                          int128_make64(int128_getlo(c->s128) & 1));
2131fcf5ef2aSThomas Huth }
2132fcf5ef2aSThomas Huth 
21338290ea50SMatheus Ferst void helper_VADDCUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2134fcf5ef2aSThomas Huth {
21358290ea50SMatheus Ferst     r->VsrD(1) = int128_ult(int128_not(a->s128), b->s128);
21363c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
2137fcf5ef2aSThomas Huth }
2138fcf5ef2aSThomas Huth 
2139896d92c8SMatheus Ferst void helper_VADDECUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2140fcf5ef2aSThomas Huth {
2141896d92c8SMatheus Ferst     bool carry_out = int128_ult(int128_not(a->s128), b->s128),
2142896d92c8SMatheus Ferst          carry_in = int128_getlo(c->s128) & 1;
2143fcf5ef2aSThomas Huth 
2144fcf5ef2aSThomas Huth     if (!carry_out && carry_in) {
2145896d92c8SMatheus Ferst         carry_out = (int128_nz(a->s128) || int128_nz(b->s128)) &&
2146896d92c8SMatheus Ferst                     int128_eq(int128_add(a->s128, b->s128), int128_makes64(-1));
2147fcf5ef2aSThomas Huth     }
2148896d92c8SMatheus Ferst 
21493c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
21503c385a93SMark Cave-Ayland     r->VsrD(1) = carry_out;
2151fcf5ef2aSThomas Huth }
2152fcf5ef2aSThomas Huth 
2153b132be53SMatheus Ferst void helper_VSUBUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2154fcf5ef2aSThomas Huth {
2155b132be53SMatheus Ferst     r->s128 = int128_sub(a->s128, b->s128);
2156fcf5ef2aSThomas Huth }
2157fcf5ef2aSThomas Huth 
2158e6a5ad43SMatheus Ferst void helper_VSUBEUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2159fcf5ef2aSThomas Huth {
2160e6a5ad43SMatheus Ferst     r->s128 = int128_add(int128_add(a->s128, int128_not(b->s128)),
2161e6a5ad43SMatheus Ferst                          int128_make64(int128_getlo(c->s128) & 1));
2162fcf5ef2aSThomas Huth }
2163fcf5ef2aSThomas Huth 
2164b7d30faeSMatheus Ferst void helper_VSUBCUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2165fcf5ef2aSThomas Huth {
2166b7d30faeSMatheus Ferst     Int128 tmp = int128_not(b->s128);
2167b7d30faeSMatheus Ferst 
2168b7d30faeSMatheus Ferst     r->VsrD(1) = int128_ult(int128_not(a->s128), tmp) ||
2169b7d30faeSMatheus Ferst                  int128_eq(int128_add(a->s128, tmp), int128_makes64(-1));
21703c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
2171fcf5ef2aSThomas Huth }
2172fcf5ef2aSThomas Huth 
2173e6a5ad43SMatheus Ferst void helper_VSUBECUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2174fcf5ef2aSThomas Huth {
2175e6a5ad43SMatheus Ferst     Int128 tmp = int128_not(b->s128);
2176e6a5ad43SMatheus Ferst     bool carry_out = int128_ult(int128_not(a->s128), tmp),
2177e6a5ad43SMatheus Ferst          carry_in = int128_getlo(c->s128) & 1;
2178fcf5ef2aSThomas Huth 
2179e6a5ad43SMatheus Ferst     r->VsrD(1) = carry_out || (carry_in && int128_eq(int128_add(a->s128, tmp),
2180e6a5ad43SMatheus Ferst                                                      int128_makes64(-1)));
21813c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
2182fcf5ef2aSThomas Huth }
2183fcf5ef2aSThomas Huth 
/*
 * Sign codes held in the low nibble of VsrB(15) of a packed-decimal operand.
 * bcd_get_sgn() reports 0xA, 0xC, 0xE and 0xF as positive and 0xB and 0xD as
 * negative; bcd_preferred_sgn() only ever produces the *_PREF codes.
 */
2184fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_1 0xC
2185fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_2 0xF
2186fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_1  0xA
2187fcf5ef2aSThomas Huth #define BCD_NEG_PREF    0xD
2188fcf5ef2aSThomas Huth #define BCD_NEG_ALT     0xB
2189fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_2  0xE
/*
 * Sign values for element 0 of a national-format operand, as checked by
 * helper_bcdcfn() and written by helper_bcdctn().  0x2B and 0x2D are the
 * ASCII codes of '+' and '-'.
 */
2190fcf5ef2aSThomas Huth #define NATIONAL_PLUS   0x2B
2191fcf5ef2aSThomas Huth #define NATIONAL_NEG    0x2D
2192fcf5ef2aSThomas Huth 
/*
 * VsrB() index of the byte that holds packed-decimal nibble n.  Two nibbles
 * share a byte; nibble 0 (the sign code) and nibble 1 live in VsrB(15), and
 * the index decreases by one for every further pair.
 */
2193365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) (15 - ((n) / 2))
2194fcf5ef2aSThomas Huth 
2195fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd)
2196fcf5ef2aSThomas Huth {
2197428115c3SMark Cave-Ayland     switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) {
2198fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_1:
2199fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_2:
2200fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_1:
2201fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_2:
2202fcf5ef2aSThomas Huth     {
2203fcf5ef2aSThomas Huth         return 1;
2204fcf5ef2aSThomas Huth     }
2205fcf5ef2aSThomas Huth 
2206fcf5ef2aSThomas Huth     case BCD_NEG_PREF:
2207fcf5ef2aSThomas Huth     case BCD_NEG_ALT:
2208fcf5ef2aSThomas Huth     {
2209fcf5ef2aSThomas Huth         return -1;
2210fcf5ef2aSThomas Huth     }
2211fcf5ef2aSThomas Huth 
2212fcf5ef2aSThomas Huth     default:
2213fcf5ef2aSThomas Huth     {
2214fcf5ef2aSThomas Huth         return 0;
2215fcf5ef2aSThomas Huth     }
2216fcf5ef2aSThomas Huth     }
2217fcf5ef2aSThomas Huth }
2218fcf5ef2aSThomas Huth 
2219fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps)
2220fcf5ef2aSThomas Huth {
2221fcf5ef2aSThomas Huth     if (sgn >= 0) {
2222fcf5ef2aSThomas Huth         return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2;
2223fcf5ef2aSThomas Huth     } else {
2224fcf5ef2aSThomas Huth         return BCD_NEG_PREF;
2225fcf5ef2aSThomas Huth     }
2226fcf5ef2aSThomas Huth }
2227fcf5ef2aSThomas Huth 
2228fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid)
2229fcf5ef2aSThomas Huth {
2230fcf5ef2aSThomas Huth     uint8_t result;
2231fcf5ef2aSThomas Huth     if (n & 1) {
2232428115c3SMark Cave-Ayland         result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4;
2233fcf5ef2aSThomas Huth     } else {
2234428115c3SMark Cave-Ayland        result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF;
2235fcf5ef2aSThomas Huth     }
2236fcf5ef2aSThomas Huth 
2237fcf5ef2aSThomas Huth     if (unlikely(result > 9)) {
2238fcf5ef2aSThomas Huth         *invalid = true;
2239fcf5ef2aSThomas Huth     }
2240fcf5ef2aSThomas Huth     return result;
2241fcf5ef2aSThomas Huth }
2242fcf5ef2aSThomas Huth 
2243fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n)
2244fcf5ef2aSThomas Huth {
2245fcf5ef2aSThomas Huth     if (n & 1) {
2246428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F;
2247428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4);
2248fcf5ef2aSThomas Huth     } else {
2249428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0;
2250428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= digit;
2251fcf5ef2aSThomas Huth     }
2252fcf5ef2aSThomas Huth }
2253fcf5ef2aSThomas Huth 
2254071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd)
2255071663dfSJose Ricardo Ziviani {
2256071663dfSJose Ricardo Ziviani     int i;
2257071663dfSJose Ricardo Ziviani     int invalid = 0;
2258071663dfSJose Ricardo Ziviani 
2259071663dfSJose Ricardo Ziviani     if (bcd_get_sgn(bcd) == 0) {
2260071663dfSJose Ricardo Ziviani         return false;
2261071663dfSJose Ricardo Ziviani     }
2262071663dfSJose Ricardo Ziviani 
2263071663dfSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2264071663dfSJose Ricardo Ziviani         bcd_get_digit(bcd, i, &invalid);
2265071663dfSJose Ricardo Ziviani         if (unlikely(invalid)) {
2266071663dfSJose Ricardo Ziviani             return false;
2267071663dfSJose Ricardo Ziviani         }
2268071663dfSJose Ricardo Ziviani     }
2269071663dfSJose Ricardo Ziviani     return true;
2270071663dfSJose Ricardo Ziviani }
2271071663dfSJose Ricardo Ziviani 
2272fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd)
2273fcf5ef2aSThomas Huth {
22743c385a93SMark Cave-Ayland     if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) {
2275efa73196SNikunj A Dadhania         return CRF_EQ;
2276fcf5ef2aSThomas Huth     } else {
2277efa73196SNikunj A Dadhania         return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT;
2278fcf5ef2aSThomas Huth     }
2279fcf5ef2aSThomas Huth }
2280fcf5ef2aSThomas Huth 
2281fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n)
2282fcf5ef2aSThomas Huth {
228360594feaSMark Cave-Ayland     return reg->VsrH(7 - n);
2284fcf5ef2aSThomas Huth }
2285fcf5ef2aSThomas Huth 
2286fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n)
2287fcf5ef2aSThomas Huth {
228860594feaSMark Cave-Ayland     reg->VsrH(7 - n) = val;
2289fcf5ef2aSThomas Huth }
2290fcf5ef2aSThomas Huth 
2291fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b)
2292fcf5ef2aSThomas Huth {
2293fcf5ef2aSThomas Huth     int i;
2294fcf5ef2aSThomas Huth     int invalid = 0;
2295fcf5ef2aSThomas Huth     for (i = 31; i > 0; i--) {
2296fcf5ef2aSThomas Huth         uint8_t dig_a = bcd_get_digit(a, i, &invalid);
2297fcf5ef2aSThomas Huth         uint8_t dig_b = bcd_get_digit(b, i, &invalid);
2298fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2299fcf5ef2aSThomas Huth             return 0; /* doesn't matter */
2300fcf5ef2aSThomas Huth         } else if (dig_a > dig_b) {
2301fcf5ef2aSThomas Huth             return 1;
2302fcf5ef2aSThomas Huth         } else if (dig_a < dig_b) {
2303fcf5ef2aSThomas Huth             return -1;
2304fcf5ef2aSThomas Huth         }
2305fcf5ef2aSThomas Huth     }
2306fcf5ef2aSThomas Huth 
2307fcf5ef2aSThomas Huth     return 0;
2308fcf5ef2aSThomas Huth }
2309fcf5ef2aSThomas Huth 
2310936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2311fcf5ef2aSThomas Huth                        int *overflow)
2312fcf5ef2aSThomas Huth {
2313fcf5ef2aSThomas Huth     int carry = 0;
2314fcf5ef2aSThomas Huth     int i;
2315936fda4dSFabiano Rosas     int is_zero = 1;
2316936fda4dSFabiano Rosas 
2317fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2318fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) +
2319fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2320936fda4dSFabiano Rosas         is_zero &= (digit == 0);
2321fcf5ef2aSThomas Huth         if (digit > 9) {
2322fcf5ef2aSThomas Huth             carry = 1;
2323fcf5ef2aSThomas Huth             digit -= 10;
2324fcf5ef2aSThomas Huth         } else {
2325fcf5ef2aSThomas Huth             carry = 0;
2326fcf5ef2aSThomas Huth         }
2327fcf5ef2aSThomas Huth 
2328fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2329fcf5ef2aSThomas Huth     }
2330fcf5ef2aSThomas Huth 
2331fcf5ef2aSThomas Huth     *overflow = carry;
2332936fda4dSFabiano Rosas     return is_zero;
2333fcf5ef2aSThomas Huth }
2334fcf5ef2aSThomas Huth 
2335d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2336fcf5ef2aSThomas Huth                        int *overflow)
2337fcf5ef2aSThomas Huth {
2338fcf5ef2aSThomas Huth     int carry = 0;
2339fcf5ef2aSThomas Huth     int i;
2340d03b174aSYasmin Beatriz 
2341fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2342fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) -
2343fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2344fcf5ef2aSThomas Huth         if (digit & 0x80) {
2345fcf5ef2aSThomas Huth             carry = -1;
2346fcf5ef2aSThomas Huth             digit += 10;
2347fcf5ef2aSThomas Huth         } else {
2348fcf5ef2aSThomas Huth             carry = 0;
2349fcf5ef2aSThomas Huth         }
2350fcf5ef2aSThomas Huth 
2351fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2352fcf5ef2aSThomas Huth     }
2353fcf5ef2aSThomas Huth 
2354fcf5ef2aSThomas Huth     *overflow = carry;
2355fcf5ef2aSThomas Huth }
2356fcf5ef2aSThomas Huth 
2357fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2358fcf5ef2aSThomas Huth {
2359fcf5ef2aSThomas Huth 
2360fcf5ef2aSThomas Huth     int sgna = bcd_get_sgn(a);
2361fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2362fcf5ef2aSThomas Huth     int invalid = (sgna == 0) || (sgnb == 0);
2363fcf5ef2aSThomas Huth     int overflow = 0;
2364936fda4dSFabiano Rosas     int zero = 0;
2365fcf5ef2aSThomas Huth     uint32_t cr = 0;
2366fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
2367fcf5ef2aSThomas Huth 
2368fcf5ef2aSThomas Huth     if (!invalid) {
2369fcf5ef2aSThomas Huth         if (sgna == sgnb) {
2370428115c3SMark Cave-Ayland             result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2371936fda4dSFabiano Rosas             zero = bcd_add_mag(&result, a, b, &invalid, &overflow);
2372936fda4dSFabiano Rosas             cr = (sgna > 0) ? CRF_GT : CRF_LT;
2373fcf5ef2aSThomas Huth         } else {
2374d03b174aSYasmin Beatriz             int magnitude = bcd_cmp_mag(a, b);
2375d03b174aSYasmin Beatriz             if (magnitude > 0) {
2376428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2377d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, a, b, &invalid, &overflow);
2378d03b174aSYasmin Beatriz                 cr = (sgna > 0) ? CRF_GT : CRF_LT;
2379d03b174aSYasmin Beatriz             } else if (magnitude < 0) {
2380428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps);
2381d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, b, a, &invalid, &overflow);
2382efa73196SNikunj A Dadhania                 cr = (sgnb > 0) ? CRF_GT : CRF_LT;
2383d03b174aSYasmin Beatriz             } else {
2384428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps);
2385d03b174aSYasmin Beatriz                 cr = CRF_EQ;
2386d03b174aSYasmin Beatriz             }
2387fcf5ef2aSThomas Huth         }
2388fcf5ef2aSThomas Huth     }
2389fcf5ef2aSThomas Huth 
2390fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
23913c385a93SMark Cave-Ayland         result.VsrD(0) = result.VsrD(1) = -1;
2392efa73196SNikunj A Dadhania         cr = CRF_SO;
2393fcf5ef2aSThomas Huth     } else if (overflow) {
2394efa73196SNikunj A Dadhania         cr |= CRF_SO;
2395936fda4dSFabiano Rosas     } else if (zero) {
2396936fda4dSFabiano Rosas         cr |= CRF_EQ;
2397fcf5ef2aSThomas Huth     }
2398fcf5ef2aSThomas Huth 
2399fcf5ef2aSThomas Huth     *r = result;
2400fcf5ef2aSThomas Huth 
2401fcf5ef2aSThomas Huth     return cr;
2402fcf5ef2aSThomas Huth }
2403fcf5ef2aSThomas Huth 
2404fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2405fcf5ef2aSThomas Huth {
2406fcf5ef2aSThomas Huth     ppc_avr_t bcopy = *b;
2407fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2408fcf5ef2aSThomas Huth     if (sgnb < 0) {
2409fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0);
2410fcf5ef2aSThomas Huth     } else if (sgnb > 0) {
2411fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_NEG_PREF, 0);
2412fcf5ef2aSThomas Huth     }
2413fcf5ef2aSThomas Huth     /* else invalid ... defer to bcdadd code for proper handling */
2414fcf5ef2aSThomas Huth 
2415fcf5ef2aSThomas Huth     return helper_bcdadd(r, a, &bcopy, ps);
2416fcf5ef2aSThomas Huth }
2417fcf5ef2aSThomas Huth 
2418fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2419fcf5ef2aSThomas Huth {
2420fcf5ef2aSThomas Huth     int i;
2421fcf5ef2aSThomas Huth     int cr = 0;
2422fcf5ef2aSThomas Huth     uint16_t national = 0;
2423fcf5ef2aSThomas Huth     uint16_t sgnb = get_national_digit(b, 0);
2424fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2425fcf5ef2aSThomas Huth     int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG);
2426fcf5ef2aSThomas Huth 
2427fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2428fcf5ef2aSThomas Huth         national = get_national_digit(b, i);
2429fcf5ef2aSThomas Huth         if (unlikely(national < 0x30 || national > 0x39)) {
2430fcf5ef2aSThomas Huth             invalid = 1;
2431fcf5ef2aSThomas Huth             break;
2432fcf5ef2aSThomas Huth         }
2433fcf5ef2aSThomas Huth 
2434fcf5ef2aSThomas Huth         bcd_put_digit(&ret, national & 0xf, i);
2435fcf5ef2aSThomas Huth     }
2436fcf5ef2aSThomas Huth 
2437fcf5ef2aSThomas Huth     if (sgnb == NATIONAL_PLUS) {
2438fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0);
2439fcf5ef2aSThomas Huth     } else {
2440fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2441fcf5ef2aSThomas Huth     }
2442fcf5ef2aSThomas Huth 
2443fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2444fcf5ef2aSThomas Huth 
2445fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2446efa73196SNikunj A Dadhania         cr = CRF_SO;
2447fcf5ef2aSThomas Huth     }
2448fcf5ef2aSThomas Huth 
2449fcf5ef2aSThomas Huth     *r = ret;
2450fcf5ef2aSThomas Huth 
2451fcf5ef2aSThomas Huth     return cr;
2452fcf5ef2aSThomas Huth }
2453fcf5ef2aSThomas Huth 
2454fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2455fcf5ef2aSThomas Huth {
2456fcf5ef2aSThomas Huth     int i;
2457fcf5ef2aSThomas Huth     int cr = 0;
2458fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2459fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2460fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2461fcf5ef2aSThomas Huth 
24623c385a93SMark Cave-Ayland     int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0);
2463fcf5ef2aSThomas Huth 
2464fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2465fcf5ef2aSThomas Huth         set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i);
2466fcf5ef2aSThomas Huth 
2467fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2468fcf5ef2aSThomas Huth             break;
2469fcf5ef2aSThomas Huth         }
2470fcf5ef2aSThomas Huth     }
2471fcf5ef2aSThomas Huth     set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0);
2472fcf5ef2aSThomas Huth 
2473fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2474fcf5ef2aSThomas Huth 
2475fcf5ef2aSThomas Huth     if (ox_flag) {
2476efa73196SNikunj A Dadhania         cr |= CRF_SO;
2477fcf5ef2aSThomas Huth     }
2478fcf5ef2aSThomas Huth 
2479fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2480efa73196SNikunj A Dadhania         cr = CRF_SO;
2481fcf5ef2aSThomas Huth     }
2482fcf5ef2aSThomas Huth 
2483fcf5ef2aSThomas Huth     *r = ret;
2484fcf5ef2aSThomas Huth 
2485fcf5ef2aSThomas Huth     return cr;
2486fcf5ef2aSThomas Huth }
2487fcf5ef2aSThomas Huth 
2488fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2489fcf5ef2aSThomas Huth {
2490fcf5ef2aSThomas Huth     int i;
2491fcf5ef2aSThomas Huth     int cr = 0;
2492fcf5ef2aSThomas Huth     int invalid = 0;
2493fcf5ef2aSThomas Huth     int zone_digit = 0;
2494fcf5ef2aSThomas Huth     int zone_lead = ps ? 0xF : 0x3;
2495fcf5ef2aSThomas Huth     int digit = 0;
2496fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2497428115c3SMark Cave-Ayland     int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4;
2498fcf5ef2aSThomas Huth 
2499fcf5ef2aSThomas Huth     if (unlikely((sgnb < 0xA) && ps)) {
2500fcf5ef2aSThomas Huth         invalid = 1;
2501fcf5ef2aSThomas Huth     }
2502fcf5ef2aSThomas Huth 
2503fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2504428115c3SMark Cave-Ayland         zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead;
2505428115c3SMark Cave-Ayland         digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF;
2506fcf5ef2aSThomas Huth         if (unlikely(zone_digit != zone_lead || digit > 0x9)) {
2507fcf5ef2aSThomas Huth             invalid = 1;
2508fcf5ef2aSThomas Huth             break;
2509fcf5ef2aSThomas Huth         }
2510fcf5ef2aSThomas Huth 
2511fcf5ef2aSThomas Huth         bcd_put_digit(&ret, digit, i + 1);
2512fcf5ef2aSThomas Huth     }
2513fcf5ef2aSThomas Huth 
2514fcf5ef2aSThomas Huth     if ((ps && (sgnb == 0xB || sgnb == 0xD)) ||
2515fcf5ef2aSThomas Huth             (!ps && (sgnb & 0x4))) {
2516fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2517fcf5ef2aSThomas Huth     } else {
2518fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0);
2519fcf5ef2aSThomas Huth     }
2520fcf5ef2aSThomas Huth 
2521fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2522fcf5ef2aSThomas Huth 
2523fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2524efa73196SNikunj A Dadhania         cr = CRF_SO;
2525fcf5ef2aSThomas Huth     }
2526fcf5ef2aSThomas Huth 
2527fcf5ef2aSThomas Huth     *r = ret;
2528fcf5ef2aSThomas Huth 
2529fcf5ef2aSThomas Huth     return cr;
2530fcf5ef2aSThomas Huth }
2531fcf5ef2aSThomas Huth 
2532fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2533fcf5ef2aSThomas Huth {
2534fcf5ef2aSThomas Huth     int i;
2535fcf5ef2aSThomas Huth     int cr = 0;
2536fcf5ef2aSThomas Huth     uint8_t digit = 0;
2537fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2538fcf5ef2aSThomas Huth     int zone_lead = (ps) ? 0xF0 : 0x30;
2539fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2540fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2541fcf5ef2aSThomas Huth 
25423c385a93SMark Cave-Ayland     int ox_flag = ((b->VsrD(0) >> 4) != 0);
2543fcf5ef2aSThomas Huth 
2544fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2545fcf5ef2aSThomas Huth         digit = bcd_get_digit(b, i + 1, &invalid);
2546fcf5ef2aSThomas Huth 
2547fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2548fcf5ef2aSThomas Huth             break;
2549fcf5ef2aSThomas Huth         }
2550fcf5ef2aSThomas Huth 
2551428115c3SMark Cave-Ayland         ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit;
2552fcf5ef2aSThomas Huth     }
2553fcf5ef2aSThomas Huth 
2554fcf5ef2aSThomas Huth     if (ps) {
2555fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1);
2556fcf5ef2aSThomas Huth     } else {
2557fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1);
2558fcf5ef2aSThomas Huth     }
2559fcf5ef2aSThomas Huth 
2560fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2561fcf5ef2aSThomas Huth 
2562fcf5ef2aSThomas Huth     if (ox_flag) {
2563efa73196SNikunj A Dadhania         cr |= CRF_SO;
2564fcf5ef2aSThomas Huth     }
2565fcf5ef2aSThomas Huth 
2566fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2567efa73196SNikunj A Dadhania         cr = CRF_SO;
2568fcf5ef2aSThomas Huth     }
2569fcf5ef2aSThomas Huth 
2570fcf5ef2aSThomas Huth     *r = ret;
2571fcf5ef2aSThomas Huth 
2572fcf5ef2aSThomas Huth     return cr;
2573fcf5ef2aSThomas Huth }
2574fcf5ef2aSThomas Huth 
/**
 * Three-way comparison of two unsigned 128-bit integers, each supplied as a
 * (low, high) pair of unsigned 64-bit halves.
 *
 * Returns:
 * 1 if ahi|alo > bhi|blo,
 * 0 if ahi|alo == bhi|blo,
 * -1 if ahi|alo < bhi|blo
 */
static inline int ucmp128(uint64_t alo, uint64_t ahi,
                          uint64_t blo, uint64_t bhi)
{
    /* The high halves decide unless they are equal. */
    if (ahi != bhi) {
        return (ahi > bhi) ? 1 : -1;
    }
    if (alo != blo) {
        return (alo > blo) ? 1 : -1;
    }
    return 0;
}
2590a3d67f3eSLuis Pires 
2591a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2592a406c058SJose Ricardo Ziviani {
2593a406c058SJose Ricardo Ziviani     int i;
2594a3d67f3eSLuis Pires     int cr;
2595a406c058SJose Ricardo Ziviani     uint64_t lo_value;
2596a406c058SJose Ricardo Ziviani     uint64_t hi_value;
259740f3e79aSLuis Pires     uint64_t rem;
2598a406c058SJose Ricardo Ziviani     ppc_avr_t ret = { .u64 = { 0, 0 } };
2599a406c058SJose Ricardo Ziviani 
26003c385a93SMark Cave-Ayland     if (b->VsrSD(0) < 0) {
26013c385a93SMark Cave-Ayland         lo_value = -b->VsrSD(1);
26023c385a93SMark Cave-Ayland         hi_value = ~b->VsrD(0) + !lo_value;
2603a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, 0xD, 0);
2604a3d67f3eSLuis Pires 
2605a3d67f3eSLuis Pires         cr = CRF_LT;
2606a406c058SJose Ricardo Ziviani     } else {
26073c385a93SMark Cave-Ayland         lo_value = b->VsrD(1);
26083c385a93SMark Cave-Ayland         hi_value = b->VsrD(0);
2609a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0);
2610a3d67f3eSLuis Pires 
2611a3d67f3eSLuis Pires         if (hi_value == 0 && lo_value == 0) {
2612a3d67f3eSLuis Pires             cr = CRF_EQ;
2613a3d67f3eSLuis Pires         } else {
2614a3d67f3eSLuis Pires             cr = CRF_GT;
2615a3d67f3eSLuis Pires         }
2616a406c058SJose Ricardo Ziviani     }
2617a406c058SJose Ricardo Ziviani 
2618a3d67f3eSLuis Pires     /*
2619a3d67f3eSLuis Pires      * Check src limits: abs(src) <= 10^31 - 1
2620a3d67f3eSLuis Pires      *
2621a3d67f3eSLuis Pires      * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff
2622a3d67f3eSLuis Pires      */
2623a3d67f3eSLuis Pires     if (ucmp128(lo_value, hi_value,
2624a3d67f3eSLuis Pires                 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) {
2625a3d67f3eSLuis Pires         cr |= CRF_SO;
2626a3d67f3eSLuis Pires 
2627a3d67f3eSLuis Pires         /*
2628a3d67f3eSLuis Pires          * According to the ISA, if src wouldn't fit in the destination
2629a3d67f3eSLuis Pires          * register, the result is undefined.
2630a3d67f3eSLuis Pires          * In that case, we leave r unchanged.
2631a3d67f3eSLuis Pires          */
2632a3d67f3eSLuis Pires     } else {
263340f3e79aSLuis Pires         rem = divu128(&lo_value, &hi_value, 1000000000000000ULL);
2634a406c058SJose Ricardo Ziviani 
263540f3e79aSLuis Pires         for (i = 1; i < 16; rem /= 10, i++) {
263640f3e79aSLuis Pires             bcd_put_digit(&ret, rem % 10, i);
2637a406c058SJose Ricardo Ziviani         }
2638a406c058SJose Ricardo Ziviani 
2639a406c058SJose Ricardo Ziviani         for (; i < 32; lo_value /= 10, i++) {
2640a406c058SJose Ricardo Ziviani             bcd_put_digit(&ret, lo_value % 10, i);
2641a406c058SJose Ricardo Ziviani         }
2642a406c058SJose Ricardo Ziviani 
2643a406c058SJose Ricardo Ziviani         *r = ret;
2644a3d67f3eSLuis Pires     }
2645a406c058SJose Ricardo Ziviani 
2646a406c058SJose Ricardo Ziviani     return cr;
2647a406c058SJose Ricardo Ziviani }
2648a406c058SJose Ricardo Ziviani 
2649c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2650c85bc7ddSJose Ricardo Ziviani {
2651c85bc7ddSJose Ricardo Ziviani     uint8_t i;
2652c85bc7ddSJose Ricardo Ziviani     int cr;
2653c85bc7ddSJose Ricardo Ziviani     uint64_t carry;
2654c85bc7ddSJose Ricardo Ziviani     uint64_t unused;
2655c85bc7ddSJose Ricardo Ziviani     uint64_t lo_value;
2656c85bc7ddSJose Ricardo Ziviani     uint64_t hi_value = 0;
2657c85bc7ddSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2658c85bc7ddSJose Ricardo Ziviani     int invalid = (sgnb == 0);
2659c85bc7ddSJose Ricardo Ziviani 
2660c85bc7ddSJose Ricardo Ziviani     lo_value = bcd_get_digit(b, 31, &invalid);
2661c85bc7ddSJose Ricardo Ziviani     for (i = 30; i > 0; i--) {
2662c85bc7ddSJose Ricardo Ziviani         mulu64(&lo_value, &carry, lo_value, 10ULL);
2663c85bc7ddSJose Ricardo Ziviani         mulu64(&hi_value, &unused, hi_value, 10ULL);
2664c85bc7ddSJose Ricardo Ziviani         lo_value += bcd_get_digit(b, i, &invalid);
2665c85bc7ddSJose Ricardo Ziviani         hi_value += carry;
2666c85bc7ddSJose Ricardo Ziviani 
2667c85bc7ddSJose Ricardo Ziviani         if (unlikely(invalid)) {
2668c85bc7ddSJose Ricardo Ziviani             break;
2669c85bc7ddSJose Ricardo Ziviani         }
2670c85bc7ddSJose Ricardo Ziviani     }
2671c85bc7ddSJose Ricardo Ziviani 
2672c85bc7ddSJose Ricardo Ziviani     if (sgnb == -1) {
26733c385a93SMark Cave-Ayland         r->VsrSD(1) = -lo_value;
26743c385a93SMark Cave-Ayland         r->VsrSD(0) = ~hi_value + !r->VsrSD(1);
2675c85bc7ddSJose Ricardo Ziviani     } else {
26763c385a93SMark Cave-Ayland         r->VsrSD(1) = lo_value;
26773c385a93SMark Cave-Ayland         r->VsrSD(0) = hi_value;
2678c85bc7ddSJose Ricardo Ziviani     }
2679c85bc7ddSJose Ricardo Ziviani 
2680c85bc7ddSJose Ricardo Ziviani     cr = bcd_cmp_zero(b);
2681c85bc7ddSJose Ricardo Ziviani 
2682c85bc7ddSJose Ricardo Ziviani     if (unlikely(invalid)) {
2683c85bc7ddSJose Ricardo Ziviani         cr = CRF_SO;
2684c85bc7ddSJose Ricardo Ziviani     }
2685c85bc7ddSJose Ricardo Ziviani 
2686c85bc7ddSJose Ricardo Ziviani     return cr;
2687c85bc7ddSJose Ricardo Ziviani }
2688c85bc7ddSJose Ricardo Ziviani 
2689c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2690c3025c3bSJose Ricardo Ziviani {
2691c3025c3bSJose Ricardo Ziviani     int i;
2692c3025c3bSJose Ricardo Ziviani     int invalid = 0;
2693c3025c3bSJose Ricardo Ziviani 
2694c3025c3bSJose Ricardo Ziviani     if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) {
2695c3025c3bSJose Ricardo Ziviani         return CRF_SO;
2696c3025c3bSJose Ricardo Ziviani     }
2697c3025c3bSJose Ricardo Ziviani 
2698c3025c3bSJose Ricardo Ziviani     *r = *a;
2699428115c3SMark Cave-Ayland     bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0);
2700c3025c3bSJose Ricardo Ziviani 
2701c3025c3bSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2702c3025c3bSJose Ricardo Ziviani         bcd_get_digit(a, i, &invalid);
2703c3025c3bSJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2704c3025c3bSJose Ricardo Ziviani         if (unlikely(invalid)) {
2705c3025c3bSJose Ricardo Ziviani             return CRF_SO;
2706c3025c3bSJose Ricardo Ziviani         }
2707c3025c3bSJose Ricardo Ziviani     }
2708c3025c3bSJose Ricardo Ziviani 
2709c3025c3bSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2710c3025c3bSJose Ricardo Ziviani }
2711c3025c3bSJose Ricardo Ziviani 
2712466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2713466a3f9cSJose Ricardo Ziviani {
2714466a3f9cSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2715466a3f9cSJose Ricardo Ziviani 
2716466a3f9cSJose Ricardo Ziviani     *r = *b;
2717466a3f9cSJose Ricardo Ziviani     bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0);
2718466a3f9cSJose Ricardo Ziviani 
2719071663dfSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2720466a3f9cSJose Ricardo Ziviani         return CRF_SO;
2721466a3f9cSJose Ricardo Ziviani     }
2722466a3f9cSJose Ricardo Ziviani 
2723466a3f9cSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2724466a3f9cSJose Ricardo Ziviani }
2725466a3f9cSJose Ricardo Ziviani 
2726e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2727e04797f7SJose Ricardo Ziviani {
2728e04797f7SJose Ricardo Ziviani     int cr;
2729428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2730e04797f7SJose Ricardo Ziviani     bool ox_flag = false;
2731e04797f7SJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2732e04797f7SJose Ricardo Ziviani     ppc_avr_t ret = *b;
27333c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2734e04797f7SJose Ricardo Ziviani 
2735e04797f7SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2736e04797f7SJose Ricardo Ziviani         return CRF_SO;
2737e04797f7SJose Ricardo Ziviani     }
2738e04797f7SJose Ricardo Ziviani 
2739e04797f7SJose Ricardo Ziviani     if (unlikely(i > 31)) {
2740e04797f7SJose Ricardo Ziviani         i = 31;
2741e04797f7SJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2742e04797f7SJose Ricardo Ziviani         i = -31;
2743e04797f7SJose Ricardo Ziviani     }
2744e04797f7SJose Ricardo Ziviani 
2745e04797f7SJose Ricardo Ziviani     if (i > 0) {
27463c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2747e04797f7SJose Ricardo Ziviani     } else {
27483c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2749e04797f7SJose Ricardo Ziviani     }
2750e04797f7SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2751e04797f7SJose Ricardo Ziviani 
2752e04797f7SJose Ricardo Ziviani     *r = ret;
2753e04797f7SJose Ricardo Ziviani 
2754e04797f7SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2755e04797f7SJose Ricardo Ziviani     if (ox_flag) {
2756e04797f7SJose Ricardo Ziviani         cr |= CRF_SO;
2757e04797f7SJose Ricardo Ziviani     }
2758e04797f7SJose Ricardo Ziviani 
2759e04797f7SJose Ricardo Ziviani     return cr;
2760e04797f7SJose Ricardo Ziviani }
2761e04797f7SJose Ricardo Ziviani 
2762a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2763a49a95e9SJose Ricardo Ziviani {
2764a49a95e9SJose Ricardo Ziviani     int cr;
2765a49a95e9SJose Ricardo Ziviani     int i;
2766a49a95e9SJose Ricardo Ziviani     int invalid = 0;
2767a49a95e9SJose Ricardo Ziviani     bool ox_flag = false;
2768a49a95e9SJose Ricardo Ziviani     ppc_avr_t ret = *b;
2769a49a95e9SJose Ricardo Ziviani 
2770a49a95e9SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
2771a49a95e9SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2772a49a95e9SJose Ricardo Ziviani 
2773a49a95e9SJose Ricardo Ziviani         if (unlikely(invalid)) {
2774a49a95e9SJose Ricardo Ziviani             return CRF_SO;
2775a49a95e9SJose Ricardo Ziviani         }
2776a49a95e9SJose Ricardo Ziviani     }
2777a49a95e9SJose Ricardo Ziviani 
2778428115c3SMark Cave-Ayland     i = a->VsrSB(7);
2779a49a95e9SJose Ricardo Ziviani     if (i >= 32) {
2780a49a95e9SJose Ricardo Ziviani         ox_flag = true;
27813c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2782a49a95e9SJose Ricardo Ziviani     } else if (i <= -32) {
27833c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2784a49a95e9SJose Ricardo Ziviani     } else if (i > 0) {
27853c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2786a49a95e9SJose Ricardo Ziviani     } else {
27873c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2788a49a95e9SJose Ricardo Ziviani     }
2789a49a95e9SJose Ricardo Ziviani     *r = ret;
2790a49a95e9SJose Ricardo Ziviani 
2791a49a95e9SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2792a49a95e9SJose Ricardo Ziviani     if (ox_flag) {
2793a49a95e9SJose Ricardo Ziviani         cr |= CRF_SO;
2794a49a95e9SJose Ricardo Ziviani     }
2795a49a95e9SJose Ricardo Ziviani 
2796a49a95e9SJose Ricardo Ziviani     return cr;
2797a49a95e9SJose Ricardo Ziviani }
2798a49a95e9SJose Ricardo Ziviani 
2799a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2800a54238adSJose Ricardo Ziviani {
2801a54238adSJose Ricardo Ziviani     int cr;
2802a54238adSJose Ricardo Ziviani     int unused = 0;
2803a54238adSJose Ricardo Ziviani     int invalid = 0;
2804a54238adSJose Ricardo Ziviani     bool ox_flag = false;
2805a54238adSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2806a54238adSJose Ricardo Ziviani     ppc_avr_t ret = *b;
28073c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2808a54238adSJose Ricardo Ziviani 
2809428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2810428115c3SMark Cave-Ayland     ppc_avr_t bcd_one;
2811428115c3SMark Cave-Ayland 
2812428115c3SMark Cave-Ayland     bcd_one.VsrD(0) = 0;
2813428115c3SMark Cave-Ayland     bcd_one.VsrD(1) = 0x10;
2814a54238adSJose Ricardo Ziviani 
2815a54238adSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2816a54238adSJose Ricardo Ziviani         return CRF_SO;
2817a54238adSJose Ricardo Ziviani     }
2818a54238adSJose Ricardo Ziviani 
2819a54238adSJose Ricardo Ziviani     if (unlikely(i > 31)) {
2820a54238adSJose Ricardo Ziviani         i = 31;
2821a54238adSJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2822a54238adSJose Ricardo Ziviani         i = -31;
2823a54238adSJose Ricardo Ziviani     }
2824a54238adSJose Ricardo Ziviani 
2825a54238adSJose Ricardo Ziviani     if (i > 0) {
28263c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2827a54238adSJose Ricardo Ziviani     } else {
28283c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2829a54238adSJose Ricardo Ziviani 
2830a54238adSJose Ricardo Ziviani         if (bcd_get_digit(&ret, 0, &invalid) >= 5) {
2831a54238adSJose Ricardo Ziviani             bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused);
2832a54238adSJose Ricardo Ziviani         }
2833a54238adSJose Ricardo Ziviani     }
2834a54238adSJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2835a54238adSJose Ricardo Ziviani 
2836a54238adSJose Ricardo Ziviani     cr = bcd_cmp_zero(&ret);
2837a54238adSJose Ricardo Ziviani     if (ox_flag) {
2838a54238adSJose Ricardo Ziviani         cr |= CRF_SO;
2839a54238adSJose Ricardo Ziviani     }
2840a54238adSJose Ricardo Ziviani     *r = ret;
2841a54238adSJose Ricardo Ziviani 
2842a54238adSJose Ricardo Ziviani     return cr;
2843a54238adSJose Ricardo Ziviani }
2844a54238adSJose Ricardo Ziviani 
284531bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
284631bc4d11SJose Ricardo Ziviani {
284731bc4d11SJose Ricardo Ziviani     uint64_t mask;
284831bc4d11SJose Ricardo Ziviani     uint32_t ox_flag = 0;
2849428115c3SMark Cave-Ayland     int i = a->VsrSH(3) + 1;
285031bc4d11SJose Ricardo Ziviani     ppc_avr_t ret = *b;
285131bc4d11SJose Ricardo Ziviani 
285231bc4d11SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
285331bc4d11SJose Ricardo Ziviani         return CRF_SO;
285431bc4d11SJose Ricardo Ziviani     }
285531bc4d11SJose Ricardo Ziviani 
285631bc4d11SJose Ricardo Ziviani     if (i > 16 && i < 32) {
285731bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
28583c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
285931bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
286031bc4d11SJose Ricardo Ziviani         }
286131bc4d11SJose Ricardo Ziviani 
28623c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
286331bc4d11SJose Ricardo Ziviani     } else if (i >= 0 && i <= 16) {
286431bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
28653c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
286631bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
286731bc4d11SJose Ricardo Ziviani         }
286831bc4d11SJose Ricardo Ziviani 
28693c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
28703c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
287131bc4d11SJose Ricardo Ziviani     }
287231bc4d11SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0);
287331bc4d11SJose Ricardo Ziviani     *r = ret;
287431bc4d11SJose Ricardo Ziviani 
287531bc4d11SJose Ricardo Ziviani     return bcd_cmp_zero(&ret) | ox_flag;
287631bc4d11SJose Ricardo Ziviani }
287731bc4d11SJose Ricardo Ziviani 
28785c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
28795c32e2e4SJose Ricardo Ziviani {
28805c32e2e4SJose Ricardo Ziviani     int i;
28815c32e2e4SJose Ricardo Ziviani     uint64_t mask;
28825c32e2e4SJose Ricardo Ziviani     uint32_t ox_flag = 0;
28835c32e2e4SJose Ricardo Ziviani     int invalid = 0;
28845c32e2e4SJose Ricardo Ziviani     ppc_avr_t ret = *b;
28855c32e2e4SJose Ricardo Ziviani 
28865c32e2e4SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
28875c32e2e4SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
28885c32e2e4SJose Ricardo Ziviani 
28895c32e2e4SJose Ricardo Ziviani         if (unlikely(invalid)) {
28905c32e2e4SJose Ricardo Ziviani             return CRF_SO;
28915c32e2e4SJose Ricardo Ziviani         }
28925c32e2e4SJose Ricardo Ziviani     }
28935c32e2e4SJose Ricardo Ziviani 
2894428115c3SMark Cave-Ayland     i = a->VsrSH(3);
28955c32e2e4SJose Ricardo Ziviani     if (i > 16 && i < 33) {
28965c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
28973c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
28985c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
28995c32e2e4SJose Ricardo Ziviani         }
29005c32e2e4SJose Ricardo Ziviani 
29013c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
29025c32e2e4SJose Ricardo Ziviani     } else if (i > 0 && i <= 16) {
29035c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
29043c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
29055c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
29065c32e2e4SJose Ricardo Ziviani         }
29075c32e2e4SJose Ricardo Ziviani 
29083c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
29093c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
29105c32e2e4SJose Ricardo Ziviani     } else if (i == 0) {
29113c385a93SMark Cave-Ayland         if (ret.VsrD(0) || ret.VsrD(1)) {
29125c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
29135c32e2e4SJose Ricardo Ziviani         }
29143c385a93SMark Cave-Ayland         ret.VsrD(0) = ret.VsrD(1) = 0;
29155c32e2e4SJose Ricardo Ziviani     }
29165c32e2e4SJose Ricardo Ziviani 
29175c32e2e4SJose Ricardo Ziviani     *r = ret;
29183c385a93SMark Cave-Ayland     if (r->VsrD(0) == 0 && r->VsrD(1) == 0) {
29195c32e2e4SJose Ricardo Ziviani         return ox_flag | CRF_EQ;
29205c32e2e4SJose Ricardo Ziviani     }
29215c32e2e4SJose Ricardo Ziviani 
29225c32e2e4SJose Ricardo Ziviani     return ox_flag | CRF_GT;
29235c32e2e4SJose Ricardo Ziviani }
29245c32e2e4SJose Ricardo Ziviani 
2925fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a)
2926fcf5ef2aSThomas Huth {
2927fcf5ef2aSThomas Huth     int i;
2928fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
2929fcf5ef2aSThomas Huth         r->u8[i] = AES_sbox[a->u8[i]];
2930fcf5ef2aSThomas Huth     }
2931fcf5ef2aSThomas Huth }
2932fcf5ef2aSThomas Huth 
2933fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2934fcf5ef2aSThomas Huth {
2935fcf5ef2aSThomas Huth     ppc_avr_t result;
2936fcf5ef2aSThomas Huth     int i;
2937fcf5ef2aSThomas Huth 
2938fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
29392dea57dbSMark Cave-Ayland         result.VsrW(i) = b->VsrW(i) ^
29402dea57dbSMark Cave-Ayland             (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^
29412dea57dbSMark Cave-Ayland              AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^
29422dea57dbSMark Cave-Ayland              AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^
29432dea57dbSMark Cave-Ayland              AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]);
2944fcf5ef2aSThomas Huth     }
2945fcf5ef2aSThomas Huth     *r = result;
2946fcf5ef2aSThomas Huth }
2947fcf5ef2aSThomas Huth 
2948fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2949fcf5ef2aSThomas Huth {
2950fcf5ef2aSThomas Huth     ppc_avr_t result;
2951fcf5ef2aSThomas Huth     int i;
2952fcf5ef2aSThomas Huth 
2953fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
29542dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]);
2955fcf5ef2aSThomas Huth     }
2956fcf5ef2aSThomas Huth     *r = result;
2957fcf5ef2aSThomas Huth }
2958fcf5ef2aSThomas Huth 
2959fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2960fcf5ef2aSThomas Huth {
2961fcf5ef2aSThomas Huth     /* This differs from what is written in ISA V2.07.  The RTL is */
2962fcf5ef2aSThomas Huth     /* incorrect and will be fixed in V2.07B.                      */
2963fcf5ef2aSThomas Huth     int i;
2964fcf5ef2aSThomas Huth     ppc_avr_t tmp;
2965fcf5ef2aSThomas Huth 
2966fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
29672dea57dbSMark Cave-Ayland         tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])];
2968fcf5ef2aSThomas Huth     }
2969fcf5ef2aSThomas Huth 
2970fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
29712dea57dbSMark Cave-Ayland         r->VsrW(i) =
29722dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 0)][0] ^
29732dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 1)][1] ^
29742dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 2)][2] ^
29752dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 3)][3];
2976fcf5ef2aSThomas Huth     }
2977fcf5ef2aSThomas Huth }
2978fcf5ef2aSThomas Huth 
2979fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2980fcf5ef2aSThomas Huth {
2981fcf5ef2aSThomas Huth     ppc_avr_t result;
2982fcf5ef2aSThomas Huth     int i;
2983fcf5ef2aSThomas Huth 
2984fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
29852dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]);
2986fcf5ef2aSThomas Huth     }
2987fcf5ef2aSThomas Huth     *r = result;
2988fcf5ef2aSThomas Huth }
2989fcf5ef2aSThomas Huth 
2990fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
2991fcf5ef2aSThomas Huth {
2992fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
2993fcf5ef2aSThomas Huth     int six = st_six & 0xF;
2994fcf5ef2aSThomas Huth     int i;
2995fcf5ef2aSThomas Huth 
2996730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
2997fcf5ef2aSThomas Huth         if (st == 0) {
2998fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
29990ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 7) ^
30000ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 18) ^
3001730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 3);
3002fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
30030ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 17) ^
30040ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 19) ^
3005730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 10);
3006fcf5ef2aSThomas Huth             }
3007fcf5ef2aSThomas Huth         } else { /* st == 1 */
3008fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
30090ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 2) ^
30100ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 13) ^
30110ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 22);
3012fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
30130ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 6) ^
30140ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 11) ^
30150ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 25);
3016fcf5ef2aSThomas Huth             }
3017fcf5ef2aSThomas Huth         }
3018fcf5ef2aSThomas Huth     }
3019fcf5ef2aSThomas Huth }
3020fcf5ef2aSThomas Huth 
3021fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
3022fcf5ef2aSThomas Huth {
3023fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
3024fcf5ef2aSThomas Huth     int six = st_six & 0xF;
3025fcf5ef2aSThomas Huth     int i;
3026fcf5ef2aSThomas Huth 
3027730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
3028fcf5ef2aSThomas Huth         if (st == 0) {
3029fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
30300ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 1) ^
30310ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 8) ^
3032730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 7);
3033fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
30340ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 19) ^
30350ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 61) ^
3036730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 6);
3037fcf5ef2aSThomas Huth             }
3038fcf5ef2aSThomas Huth         } else { /* st == 1 */
3039fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
30400ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 28) ^
30410ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 34) ^
30420ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 39);
3043fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
30440ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 14) ^
30450ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 18) ^
30460ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 41);
3047fcf5ef2aSThomas Huth             }
3048fcf5ef2aSThomas Huth         }
3049fcf5ef2aSThomas Huth     }
3050fcf5ef2aSThomas Huth }
3051fcf5ef2aSThomas Huth 
3052fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
3053fcf5ef2aSThomas Huth {
3054fcf5ef2aSThomas Huth     ppc_avr_t result;
3055fcf5ef2aSThomas Huth     int i;
3056fcf5ef2aSThomas Huth 
305760594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
305860594feaSMark Cave-Ayland         int indexA = c->VsrB(i) >> 4;
305960594feaSMark Cave-Ayland         int indexB = c->VsrB(i) & 0xF;
306060594feaSMark Cave-Ayland 
306160594feaSMark Cave-Ayland         result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB);
3062fcf5ef2aSThomas Huth     }
3063fcf5ef2aSThomas Huth     *r = result;
3064fcf5ef2aSThomas Huth }
3065fcf5ef2aSThomas Huth 
3066fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I
3067fcf5ef2aSThomas Huth 
3068fcf5ef2aSThomas Huth /*****************************************************************************/
3069fcf5ef2aSThomas Huth /* SPE extension helpers */
/* Use a table to make this quicker: hbrev[n] is the 4-bit value n reversed */
static const uint8_t hbrev[16] = {
    0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE,
    0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF,
};

/* Reverse the bit order of a byte by swapping its bit-reversed nibbles. */
static inline uint8_t byte_reverse(uint8_t val)
{
    return hbrev[val >> 4] | (hbrev[val & 0xF] << 4);
}

/*
 * Reverse the bit order of a 32-bit word: the bytes swap places and each
 * byte is bit-reversed.
 *
 * Every reversed byte is widened to uint32_t before being shifted.  Without
 * that, the uint8_t result is promoted to int and shifting a value >= 0x80
 * left by 24 moves a one into the sign bit, which is undefined in ISO C.
 */
static inline uint32_t word_reverse(uint32_t val)
{
    return (uint32_t)byte_reverse(val >> 24) |
        ((uint32_t)byte_reverse(val >> 16) << 8) |
        ((uint32_t)byte_reverse(val >> 8) << 16) |
        ((uint32_t)byte_reverse(val) << 24);
}
3086fcf5ef2aSThomas Huth 
3087fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */
3088fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2)
3089fcf5ef2aSThomas Huth {
3090fcf5ef2aSThomas Huth     uint32_t a, b, d, mask;
3091fcf5ef2aSThomas Huth 
3092fcf5ef2aSThomas Huth     mask = UINT32_MAX >> (32 - MASKBITS);
3093fcf5ef2aSThomas Huth     a = arg1 & mask;
3094fcf5ef2aSThomas Huth     b = arg2 & mask;
3095fcf5ef2aSThomas Huth     d = word_reverse(1 + word_reverse(a | ~b));
3096fcf5ef2aSThomas Huth     return (arg1 & ~mask) | (d & b);
3097fcf5ef2aSThomas Huth }
3098fcf5ef2aSThomas Huth 
/*
 * Count leading sign bits: clz32() of val when its top bit is clear, or of
 * ~val when the top bit is set.
 */
uint32_t helper_cntlsw32(uint32_t val)
{
    const uint32_t probe = (val & 0x80000000) ? ~val : val;

    return clz32(probe);
}
3107fcf5ef2aSThomas Huth 
/* Count leading zero bits of a 32-bit value; thin wrapper around clz32(). */
uint32_t helper_cntlzw32(uint32_t val)
{
    const uint32_t leading_zeros = clz32(val);

    return leading_zeros;
}
3112fcf5ef2aSThomas Huth 
3113fcf5ef2aSThomas Huth /* 440 specific */
3114fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high,
3115fcf5ef2aSThomas Huth                           target_ulong low, uint32_t update_Rc)
3116fcf5ef2aSThomas Huth {
3117fcf5ef2aSThomas Huth     target_ulong mask;
3118fcf5ef2aSThomas Huth     int i;
3119fcf5ef2aSThomas Huth 
3120fcf5ef2aSThomas Huth     i = 1;
3121fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
3122fcf5ef2aSThomas Huth         if ((high & mask) == 0) {
3123fcf5ef2aSThomas Huth             if (update_Rc) {
3124fcf5ef2aSThomas Huth                 env->crf[0] = 0x4;
3125fcf5ef2aSThomas Huth             }
3126fcf5ef2aSThomas Huth             goto done;
3127fcf5ef2aSThomas Huth         }
3128fcf5ef2aSThomas Huth         i++;
3129fcf5ef2aSThomas Huth     }
3130fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
3131fcf5ef2aSThomas Huth         if ((low & mask) == 0) {
3132fcf5ef2aSThomas Huth             if (update_Rc) {
3133fcf5ef2aSThomas Huth                 env->crf[0] = 0x8;
3134fcf5ef2aSThomas Huth             }
3135fcf5ef2aSThomas Huth             goto done;
3136fcf5ef2aSThomas Huth         }
3137fcf5ef2aSThomas Huth         i++;
3138fcf5ef2aSThomas Huth     }
3139fcf5ef2aSThomas Huth     i = 8;
3140fcf5ef2aSThomas Huth     if (update_Rc) {
3141fcf5ef2aSThomas Huth         env->crf[0] = 0x2;
3142fcf5ef2aSThomas Huth     }
3143fcf5ef2aSThomas Huth  done:
3144fcf5ef2aSThomas Huth     env->xer = (env->xer & ~0x7F) | i;
3145fcf5ef2aSThomas Huth     if (update_Rc) {
3146fcf5ef2aSThomas Huth         env->crf[0] |= xer_so;
3147fcf5ef2aSThomas Huth     }
3148fcf5ef2aSThomas Huth     return i;
3149fcf5ef2aSThomas Huth }
3150