xref: /openbmc/qemu/target/ppc/int_helper.c (revision 1015fcab)
1fcf5ef2aSThomas Huth /*
2fcf5ef2aSThomas Huth  *  PowerPC integer and vector emulation helpers for QEMU.
3fcf5ef2aSThomas Huth  *
4fcf5ef2aSThomas Huth  *  Copyright (c) 2003-2007 Jocelyn Mayer
5fcf5ef2aSThomas Huth  *
6fcf5ef2aSThomas Huth  * This library is free software; you can redistribute it and/or
7fcf5ef2aSThomas Huth  * modify it under the terms of the GNU Lesser General Public
8fcf5ef2aSThomas Huth  * License as published by the Free Software Foundation; either
96bd039cdSChetan Pant  * version 2.1 of the License, or (at your option) any later version.
10fcf5ef2aSThomas Huth  *
11fcf5ef2aSThomas Huth  * This library is distributed in the hope that it will be useful,
12fcf5ef2aSThomas Huth  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13fcf5ef2aSThomas Huth  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14fcf5ef2aSThomas Huth  * Lesser General Public License for more details.
15fcf5ef2aSThomas Huth  *
16fcf5ef2aSThomas Huth  * You should have received a copy of the GNU Lesser General Public
17fcf5ef2aSThomas Huth  * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18fcf5ef2aSThomas Huth  */
19db725815SMarkus Armbruster 
20fcf5ef2aSThomas Huth #include "qemu/osdep.h"
21fcf5ef2aSThomas Huth #include "cpu.h"
22fcf5ef2aSThomas Huth #include "internal.h"
23fcf5ef2aSThomas Huth #include "qemu/host-utils.h"
24db725815SMarkus Armbruster #include "qemu/main-loop.h"
258a05fd9aSRichard Henderson #include "qemu/log.h"
26fcf5ef2aSThomas Huth #include "exec/helper-proto.h"
27fcf5ef2aSThomas Huth #include "crypto/aes.h"
2824f91e81SAlex Bennée #include "fpu/softfloat.h"
293f74b632SRichard Henderson #include "qapi/error.h"
303f74b632SRichard Henderson #include "qemu/guest-random.h"
31*1015fcabSMatheus Ferst #include "tcg/tcg-gvec-desc.h"
32fcf5ef2aSThomas Huth 
33fcf5ef2aSThomas Huth #include "helper_regs.h"
34fcf5ef2aSThomas Huth /*****************************************************************************/
35fcf5ef2aSThomas Huth /* Fixed point operations helpers */
36fcf5ef2aSThomas Huth 
37f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov)
38f32899deSNikunj A Dadhania {
39f32899deSNikunj A Dadhania     if (unlikely(ov)) {
40f32899deSNikunj A Dadhania         env->so = env->ov = 1;
41f32899deSNikunj A Dadhania     } else {
42f32899deSNikunj A Dadhania         env->ov = 0;
43f32899deSNikunj A Dadhania     }
44f32899deSNikunj A Dadhania }
45f32899deSNikunj A Dadhania 
46fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb,
47fcf5ef2aSThomas Huth                            uint32_t oe)
48fcf5ef2aSThomas Huth {
49fcf5ef2aSThomas Huth     uint64_t rt = 0;
50fcf5ef2aSThomas Huth     int overflow = 0;
51fcf5ef2aSThomas Huth 
52fcf5ef2aSThomas Huth     uint64_t dividend = (uint64_t)ra << 32;
53fcf5ef2aSThomas Huth     uint64_t divisor = (uint32_t)rb;
54fcf5ef2aSThomas Huth 
55fcf5ef2aSThomas Huth     if (unlikely(divisor == 0)) {
56fcf5ef2aSThomas Huth         overflow = 1;
57fcf5ef2aSThomas Huth     } else {
58fcf5ef2aSThomas Huth         rt = dividend / divisor;
59fcf5ef2aSThomas Huth         overflow = rt > UINT32_MAX;
60fcf5ef2aSThomas Huth     }
61fcf5ef2aSThomas Huth 
62fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
63fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
64fcf5ef2aSThomas Huth     }
65fcf5ef2aSThomas Huth 
66fcf5ef2aSThomas Huth     if (oe) {
67f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
68fcf5ef2aSThomas Huth     }
69fcf5ef2aSThomas Huth 
70fcf5ef2aSThomas Huth     return (target_ulong)rt;
71fcf5ef2aSThomas Huth }
72fcf5ef2aSThomas Huth 
73fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb,
74fcf5ef2aSThomas Huth                           uint32_t oe)
75fcf5ef2aSThomas Huth {
76fcf5ef2aSThomas Huth     int64_t rt = 0;
77fcf5ef2aSThomas Huth     int overflow = 0;
78fcf5ef2aSThomas Huth 
79fcf5ef2aSThomas Huth     int64_t dividend = (int64_t)ra << 32;
80fcf5ef2aSThomas Huth     int64_t divisor = (int64_t)((int32_t)rb);
81fcf5ef2aSThomas Huth 
82fcf5ef2aSThomas Huth     if (unlikely((divisor == 0) ||
83fcf5ef2aSThomas Huth                  ((divisor == -1ull) && (dividend == INT64_MIN)))) {
84fcf5ef2aSThomas Huth         overflow = 1;
85fcf5ef2aSThomas Huth     } else {
86fcf5ef2aSThomas Huth         rt = dividend / divisor;
87fcf5ef2aSThomas Huth         overflow = rt != (int32_t)rt;
88fcf5ef2aSThomas Huth     }
89fcf5ef2aSThomas Huth 
90fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
91fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
92fcf5ef2aSThomas Huth     }
93fcf5ef2aSThomas Huth 
94fcf5ef2aSThomas Huth     if (oe) {
95f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
96fcf5ef2aSThomas Huth     }
97fcf5ef2aSThomas Huth 
98fcf5ef2aSThomas Huth     return (target_ulong)rt;
99fcf5ef2aSThomas Huth }
100fcf5ef2aSThomas Huth 
101fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
102fcf5ef2aSThomas Huth 
103fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe)
104fcf5ef2aSThomas Huth {
105fcf5ef2aSThomas Huth     uint64_t rt = 0;
106fcf5ef2aSThomas Huth     int overflow = 0;
107fcf5ef2aSThomas Huth 
1089276a31cSLuis Pires     if (unlikely(rb == 0 || ra >= rb)) {
1099276a31cSLuis Pires         overflow = 1;
110fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1119276a31cSLuis Pires     } else {
1129276a31cSLuis Pires         divu128(&rt, &ra, rb);
113fcf5ef2aSThomas Huth     }
114fcf5ef2aSThomas Huth 
115fcf5ef2aSThomas Huth     if (oe) {
116f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
117fcf5ef2aSThomas Huth     }
118fcf5ef2aSThomas Huth 
119fcf5ef2aSThomas Huth     return rt;
120fcf5ef2aSThomas Huth }
121fcf5ef2aSThomas Huth 
122fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe)
123fcf5ef2aSThomas Huth {
12440f3e79aSLuis Pires     uint64_t rt = 0;
125fcf5ef2aSThomas Huth     int64_t ra = (int64_t)rau;
126fcf5ef2aSThomas Huth     int64_t rb = (int64_t)rbu;
1279276a31cSLuis Pires     int overflow = 0;
128fcf5ef2aSThomas Huth 
1299276a31cSLuis Pires     if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) {
1309276a31cSLuis Pires         overflow = 1;
131fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1329276a31cSLuis Pires     } else {
1339276a31cSLuis Pires         divs128(&rt, &ra, rb);
134fcf5ef2aSThomas Huth     }
135fcf5ef2aSThomas Huth 
136fcf5ef2aSThomas Huth     if (oe) {
137f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
138fcf5ef2aSThomas Huth     }
139fcf5ef2aSThomas Huth 
140fcf5ef2aSThomas Huth     return rt;
141fcf5ef2aSThomas Huth }
142fcf5ef2aSThomas Huth 
143fcf5ef2aSThomas Huth #endif
144fcf5ef2aSThomas Huth 
145fcf5ef2aSThomas Huth 
146fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
147fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */
148fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff))
149fcf5ef2aSThomas Huth 
150b6cb41b2SDavid Gibson /*
151b6cb41b2SDavid Gibson  * subtract 1 from each byte, and with inverse, check if MSB is set at each
152fcf5ef2aSThomas Huth  * byte.
153fcf5ef2aSThomas Huth  * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80
154fcf5ef2aSThomas Huth  *      (0xFF & 0xFF) & 0x80 = 0x80 (zero found)
155fcf5ef2aSThomas Huth  */
156fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80))
157fcf5ef2aSThomas Huth 
158fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */
159fcf5ef2aSThomas Huth #define hasvalue(x, n)  (haszero((x) ^ pattern(n)))
160fcf5ef2aSThomas Huth 
161fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb)
162fcf5ef2aSThomas Huth {
163efa73196SNikunj A Dadhania     return hasvalue(rb, ra) ? CRF_GT : 0;
164fcf5ef2aSThomas Huth }
165fcf5ef2aSThomas Huth 
166fcf5ef2aSThomas Huth #undef pattern
167fcf5ef2aSThomas Huth #undef haszero
168fcf5ef2aSThomas Huth #undef hasvalue
169fcf5ef2aSThomas Huth 
170b6cb41b2SDavid Gibson /*
1713f74b632SRichard Henderson  * Return a random number.
172fcf5ef2aSThomas Huth  */
1733f74b632SRichard Henderson uint64_t helper_darn32(void)
174fcf5ef2aSThomas Huth {
1753f74b632SRichard Henderson     Error *err = NULL;
1763f74b632SRichard Henderson     uint32_t ret;
1773f74b632SRichard Henderson 
1783f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1793f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1803f74b632SRichard Henderson                       error_get_pretty(err));
1813f74b632SRichard Henderson         error_free(err);
182fcf5ef2aSThomas Huth         return -1;
183fcf5ef2aSThomas Huth     }
184fcf5ef2aSThomas Huth 
1853f74b632SRichard Henderson     return ret;
1863f74b632SRichard Henderson }
1873f74b632SRichard Henderson 
1883f74b632SRichard Henderson uint64_t helper_darn64(void)
189fcf5ef2aSThomas Huth {
1903f74b632SRichard Henderson     Error *err = NULL;
1913f74b632SRichard Henderson     uint64_t ret;
1923f74b632SRichard Henderson 
1933f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1943f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1953f74b632SRichard Henderson                       error_get_pretty(err));
1963f74b632SRichard Henderson         error_free(err);
197fcf5ef2aSThomas Huth         return -1;
198fcf5ef2aSThomas Huth     }
199fcf5ef2aSThomas Huth 
2003f74b632SRichard Henderson     return ret;
2013f74b632SRichard Henderson }
202fcf5ef2aSThomas Huth 
/*
 * Bit permute: each of the eight bytes of @rs is an index.  For byte i
 * (counted from the least significant byte), result bit i is set when the
 * index is below 64 and the bit of @rb selected by PPC_BIT(index) is set.
 * All other result bits are zero.
 */
uint64_t helper_bpermd(uint64_t rs, uint64_t rb)
{
    uint64_t result = 0;
    int byte;

    for (byte = 0; byte < 8; byte++, rs >>= 8) {
        const int index = rs & 0xFF;

        if (index >= 64) {
            continue; /* out-of-range index contributes a 0 bit */
        }
        if (rb & PPC_BIT(index)) {
            result |= 1 << byte;
        }
    }
    return result;
}
218fcf5ef2aSThomas Huth 
219fcf5ef2aSThomas Huth #endif
220fcf5ef2aSThomas Huth 
221fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb)
222fcf5ef2aSThomas Huth {
223fcf5ef2aSThomas Huth     target_ulong mask = 0xff;
224fcf5ef2aSThomas Huth     target_ulong ra = 0;
225fcf5ef2aSThomas Huth     int i;
226fcf5ef2aSThomas Huth 
227fcf5ef2aSThomas Huth     for (i = 0; i < sizeof(target_ulong); i++) {
228fcf5ef2aSThomas Huth         if ((rs & mask) == (rb & mask)) {
229fcf5ef2aSThomas Huth             ra |= mask;
230fcf5ef2aSThomas Huth         }
231fcf5ef2aSThomas Huth         mask <<= 8;
232fcf5ef2aSThomas Huth     }
233fcf5ef2aSThomas Huth     return ra;
234fcf5ef2aSThomas Huth }
235fcf5ef2aSThomas Huth 
236fcf5ef2aSThomas Huth /* shift right arithmetic helper */
237fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value,
238fcf5ef2aSThomas Huth                          target_ulong shift)
239fcf5ef2aSThomas Huth {
240fcf5ef2aSThomas Huth     int32_t ret;
241fcf5ef2aSThomas Huth 
242fcf5ef2aSThomas Huth     if (likely(!(shift & 0x20))) {
243fcf5ef2aSThomas Huth         if (likely((uint32_t)shift != 0)) {
244fcf5ef2aSThomas Huth             shift &= 0x1f;
245fcf5ef2aSThomas Huth             ret = (int32_t)value >> shift;
246fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) {
247af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
248fcf5ef2aSThomas Huth             } else {
249af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
250fcf5ef2aSThomas Huth             }
251fcf5ef2aSThomas Huth         } else {
252fcf5ef2aSThomas Huth             ret = (int32_t)value;
253af1c259fSSandipan Das             env->ca32 = env->ca = 0;
254fcf5ef2aSThomas Huth         }
255fcf5ef2aSThomas Huth     } else {
256fcf5ef2aSThomas Huth         ret = (int32_t)value >> 31;
257af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
258fcf5ef2aSThomas Huth     }
259fcf5ef2aSThomas Huth     return (target_long)ret;
260fcf5ef2aSThomas Huth }
261fcf5ef2aSThomas Huth 
262fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
263fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value,
264fcf5ef2aSThomas Huth                          target_ulong shift)
265fcf5ef2aSThomas Huth {
266fcf5ef2aSThomas Huth     int64_t ret;
267fcf5ef2aSThomas Huth 
268fcf5ef2aSThomas Huth     if (likely(!(shift & 0x40))) {
269fcf5ef2aSThomas Huth         if (likely((uint64_t)shift != 0)) {
270fcf5ef2aSThomas Huth             shift &= 0x3f;
271fcf5ef2aSThomas Huth             ret = (int64_t)value >> shift;
272fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) {
273af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
274fcf5ef2aSThomas Huth             } else {
275af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
276fcf5ef2aSThomas Huth             }
277fcf5ef2aSThomas Huth         } else {
278fcf5ef2aSThomas Huth             ret = (int64_t)value;
279af1c259fSSandipan Das             env->ca32 = env->ca = 0;
280fcf5ef2aSThomas Huth         }
281fcf5ef2aSThomas Huth     } else {
282fcf5ef2aSThomas Huth         ret = (int64_t)value >> 63;
283af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
284fcf5ef2aSThomas Huth     }
285fcf5ef2aSThomas Huth     return ret;
286fcf5ef2aSThomas Huth }
287fcf5ef2aSThomas Huth #endif
288fcf5ef2aSThomas Huth 
289fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
290fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
291fcf5ef2aSThomas Huth {
29279770002SRichard Henderson     /* Note that we don't fold past bytes */
293fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
294fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
295fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
296fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
297fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
298fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
299fcf5ef2aSThomas Huth     return val;
300fcf5ef2aSThomas Huth }
301fcf5ef2aSThomas Huth 
302fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val)
303fcf5ef2aSThomas Huth {
30479770002SRichard Henderson     /* Note that we don't fold past words.  */
305fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
306fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
307fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
308fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
309fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
310fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
311fcf5ef2aSThomas Huth     val = (val & 0x00ff00ff00ff00ffULL) + ((val >>  8) &
312fcf5ef2aSThomas Huth                                            0x00ff00ff00ff00ffULL);
313fcf5ef2aSThomas Huth     val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) &
314fcf5ef2aSThomas Huth                                            0x0000ffff0000ffffULL);
315fcf5ef2aSThomas Huth     return val;
316fcf5ef2aSThomas Huth }
317fcf5ef2aSThomas Huth #else
318fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
319fcf5ef2aSThomas Huth {
32079770002SRichard Henderson     /* Note that we don't fold past bytes */
321fcf5ef2aSThomas Huth     val = (val & 0x55555555) + ((val >>  1) & 0x55555555);
322fcf5ef2aSThomas Huth     val = (val & 0x33333333) + ((val >>  2) & 0x33333333);
323fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f) + ((val >>  4) & 0x0f0f0f0f);
324fcf5ef2aSThomas Huth     return val;
325fcf5ef2aSThomas Huth }
326fcf5ef2aSThomas Huth #endif
327fcf5ef2aSThomas Huth 
/*
 * Centrifuge: gather the bits of @src whose @mask bit is 0 into the upper
 * part of the result and the bits whose @mask bit is 1 into the lower part,
 * preserving the relative order inside each group.  A mask of all zeros or
 * all ones returns @src unchanged.
 */
uint64_t helper_CFUGED(uint64_t src, uint64_t mask)
{
    /*
     * Instead of processing the mask bit-by-bit from the most significant to
     * the least significant bit, as described in PowerISA, we'll handle it in
     * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use
     * ctz or cto, we negate the mask at the end of the loop.
     *
     * The accumulators are explicitly 64 bits wide: this helper operates on
     * 64-bit values regardless of the width of target_ulong.
     */
    uint64_t m, left = 0, right = 0;
    unsigned int n, i = 64;
    bool bit = false; /* tracks if we are processing zeros or ones */

    if (mask == 0 || mask == -1) {
        return src;
    }

    /* Processes the mask in blocks, from LSB to MSB */
    while (i) {
        /* Find how many bits we should take */
        n = ctz64(mask);
        if (n > i) {
            n = i;
        }

        /*
         * Extracts 'n' trailing bits of src and put them on the leading 'n'
         * bits of 'right' or 'left', pushing down the previously extracted
         * values.
         *
         * The shift is done on an unsigned constant: 'n' can be 63, and
         * shifting a signed 1 into the sign bit is undefined in ISO C.
         */
        m = (1ULL << n) - 1;
        if (bit) {
            right = ror64(right | (src & m), n);
        } else {
            left = ror64(left | (src & m), n);
        }

        /*
         * Discards the processed bits from 'src' and 'mask'. Note that we are
         * removing 'n' trailing zeros from 'mask', but the logical shift will
         * add 'n' leading zeros back, so the population count of 'mask' is kept
         * the same.
         */
        src >>= n;
        mask >>= n;
        i -= n;
        bit = !bit;
        mask = ~mask;
    }

    /*
     * At the end, right was ror'ed ctpop(mask) times. To put it back in place,
     * we'll shift it more 64-ctpop(mask) times.
     */
    if (bit) {
        n = ctpop64(mask);
    } else {
        n = 64 - ctpop64(mask);
    }

    return left | (right >> n);
}
38989ccd7dcSMatheus Ferst 
/*
 * Parallel bits deposit: successive low-order bits of @src are placed, in
 * order, at the positions of the set bits of @mask (lowest set bit first).
 * Result bits where @mask is 0 are zero.  An all-ones mask returns @src
 * unchanged.
 */
uint64_t helper_PDEPD(uint64_t src, uint64_t mask)
{
    uint64_t result = 0;

    if (mask == -1) {
        return src;
    }

    while (mask != 0) {
        const int dst = ctz64(mask); /* position of the lowest set bit */

        result |= (src & 1) << dst;
        src >>= 1;                   /* advance to the next source bit */
        mask &= mask - 1;            /* clear the bit just handled */
    }

    return result;
}
4078bdb7606SMatheus Ferst 
/*
 * Parallel bits extract: the bits of @src at the positions of the set bits
 * of @mask are packed, in order, into the low-order bits of the result
 * (lowest set mask bit goes to result bit 0).  An all-ones mask returns
 * @src unchanged.
 */
uint64_t helper_PEXTD(uint64_t src, uint64_t mask)
{
    uint64_t result = 0;
    uint64_t out_bit = 1; /* next result position to fill */

    if (mask == -1) {
        return src;
    }

    for (; mask != 0; mask &= mask - 1, out_bit <<= 1) {
        if ((src >> ctz64(mask)) & 1) {
            result |= out_bit;
        }
    }

    return result;
}
42521ba6e58SMatheus Ferst 
426fcf5ef2aSThomas Huth /*****************************************************************************/
427fcf5ef2aSThomas Huth /* Altivec extension helpers */
/*
 * VECTOR_FOR_INORDER_I(index, element): loop header that walks every slot
 * of r->element, where 'r' must be a vector pointer in scope at the point
 * of use.  Big-endian hosts count up from 0; other hosts count down from
 * the last slot, so 'index' must be a signed variable for the ">= 0" test
 * to terminate.
 */
#if !defined(HOST_WORDS_BIGENDIAN)
#define VECTOR_FOR_INORDER_I(index, element)                    \
    for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--)
#else
#define VECTOR_FOR_INORDER_I(index, element)                    \
    for (index = 0; index < ARRAY_SIZE(r->element); index++)
#endif
435fcf5ef2aSThomas Huth 
/*
 * Saturating conversion helpers.
 *
 * Each instantiation defines cvt<from><to>(x, sat), which narrows x from
 * from_type to to_type.  A value outside [min, max] is clamped to the
 * nearest bound and *sat is set to 1; an in-range value is returned as is
 * and *sat is left untouched.
 */
#define SATCVT(from, to, from_type, to_type, min, max)          \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x < (from_type)min) {                               \
            *sat = 1;                                           \
            return min;                                         \
        }                                                       \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }

/* Unsigned source: only the upper bound can be exceeded, min is unused. */
#define SATCVTU(from, to, from_type, to_type, min, max)         \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }

/* signed -> narrower signed */
SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX)
SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX)
SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX)

/* unsigned -> narrower unsigned */
SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX)
SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX)
SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX)

/* signed -> narrower unsigned */
SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX)
SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX)
SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX)
#undef SATCVT
#undef SATCVTU
478fcf5ef2aSThomas Huth 
479dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr)
480fcf5ef2aSThomas Huth {
481c19940dbSBruno Larsen (billionai)     ppc_store_vscr(env, vscr);
482fcf5ef2aSThomas Huth }
483fcf5ef2aSThomas Huth 
484cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env)
485cc2b90d7SRichard Henderson {
486c19940dbSBruno Larsen (billionai)     return ppc_get_vscr(env);
487cc2b90d7SRichard Henderson }
488cc2b90d7SRichard Henderson 
4896175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env)
4906175f5a0SRichard Henderson {
4919b5b74daSRichard Henderson     /* The choice of non-zero value is arbitrary.  */
4929b5b74daSRichard Henderson     env->vscr_sat.u32[0] = 1;
4936175f5a0SRichard Henderson }
4946175f5a0SRichard Henderson 
495fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
496fcf5ef2aSThomas Huth {
497fcf5ef2aSThomas Huth     int i;
498fcf5ef2aSThomas Huth 
499fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
500fcf5ef2aSThomas Huth         r->u32[i] = ~a->u32[i] < b->u32[i];
501fcf5ef2aSThomas Huth     }
502fcf5ef2aSThomas Huth }
503fcf5ef2aSThomas Huth 
504fcf5ef2aSThomas Huth /* vprtybw */
505fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b)
506fcf5ef2aSThomas Huth {
507fcf5ef2aSThomas Huth     int i;
508fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
509fcf5ef2aSThomas Huth         uint64_t res = b->u32[i] ^ (b->u32[i] >> 16);
510fcf5ef2aSThomas Huth         res ^= res >> 8;
511fcf5ef2aSThomas Huth         r->u32[i] = res & 1;
512fcf5ef2aSThomas Huth     }
513fcf5ef2aSThomas Huth }
514fcf5ef2aSThomas Huth 
515fcf5ef2aSThomas Huth /* vprtybd */
516fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b)
517fcf5ef2aSThomas Huth {
518fcf5ef2aSThomas Huth     int i;
519fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
520fcf5ef2aSThomas Huth         uint64_t res = b->u64[i] ^ (b->u64[i] >> 32);
521fcf5ef2aSThomas Huth         res ^= res >> 16;
522fcf5ef2aSThomas Huth         res ^= res >> 8;
523fcf5ef2aSThomas Huth         r->u64[i] = res & 1;
524fcf5ef2aSThomas Huth     }
525fcf5ef2aSThomas Huth }
526fcf5ef2aSThomas Huth 
527fcf5ef2aSThomas Huth /* vprtybq */
528fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b)
529fcf5ef2aSThomas Huth {
530fcf5ef2aSThomas Huth     uint64_t res = b->u64[0] ^ b->u64[1];
531fcf5ef2aSThomas Huth     res ^= res >> 32;
532fcf5ef2aSThomas Huth     res ^= res >> 16;
533fcf5ef2aSThomas Huth     res ^= res >> 8;
5343c385a93SMark Cave-Ayland     r->VsrD(1) = res & 1;
5353c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
536fcf5ef2aSThomas Huth }
537fcf5ef2aSThomas Huth 
538fcf5ef2aSThomas Huth #define VARITHFP(suffix, func)                                          \
539fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
540fcf5ef2aSThomas Huth                           ppc_avr_t *b)                                 \
541fcf5ef2aSThomas Huth     {                                                                   \
542fcf5ef2aSThomas Huth         int i;                                                          \
543fcf5ef2aSThomas Huth                                                                         \
54405ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
54505ee3e8aSMark Cave-Ayland             r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status);   \
546fcf5ef2aSThomas Huth         }                                                               \
547fcf5ef2aSThomas Huth     }
548fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add)
549fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub)
550fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min)
551fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max)
552fcf5ef2aSThomas Huth #undef VARITHFP
553fcf5ef2aSThomas Huth 
554fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type)                                       \
555fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
556fcf5ef2aSThomas Huth                            ppc_avr_t *b, ppc_avr_t *c)                  \
557fcf5ef2aSThomas Huth     {                                                                   \
558fcf5ef2aSThomas Huth         int i;                                                          \
55905ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
56005ee3e8aSMark Cave-Ayland             r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \
561fcf5ef2aSThomas Huth                                        type, &env->vec_status);         \
562fcf5ef2aSThomas Huth         }                                                               \
563fcf5ef2aSThomas Huth     }
564fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0);
565fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c);
566fcf5ef2aSThomas Huth #undef VARITHFPFMA
567fcf5ef2aSThomas Huth 
568fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element)                          \
569fcf5ef2aSThomas Huth     {                                                                   \
570fcf5ef2aSThomas Huth         type result = (type)a->element[i] op (type)b->element[i];       \
571fcf5ef2aSThomas Huth         r->element[i] = cvt(result, &sat);                              \
572fcf5ef2aSThomas Huth     }
573fcf5ef2aSThomas Huth 
574fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element)                    \
575fb11ae7dSRichard Henderson     void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat,              \
576fb11ae7dSRichard Henderson                         ppc_avr_t *a, ppc_avr_t *b, uint32_t desc)      \
577fcf5ef2aSThomas Huth     {                                                                   \
578fcf5ef2aSThomas Huth         int sat = 0;                                                    \
579fcf5ef2aSThomas Huth         int i;                                                          \
580fcf5ef2aSThomas Huth                                                                         \
581fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
582fcf5ef2aSThomas Huth             VARITHSAT_CASE(optype, op, cvt, element);                   \
583fcf5ef2aSThomas Huth         }                                                               \
584fcf5ef2aSThomas Huth         if (sat) {                                                      \
585fb11ae7dSRichard Henderson             vscr_sat->u32[0] = 1;                                       \
586fcf5ef2aSThomas Huth         }                                                               \
587fcf5ef2aSThomas Huth     }
588fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt)          \
589fcf5ef2aSThomas Huth     VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element)      \
590fcf5ef2aSThomas Huth     VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element)
591fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt)        \
592fcf5ef2aSThomas Huth     VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element)      \
593fcf5ef2aSThomas Huth     VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element)
594fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb)
595fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh)
596fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw)
597fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub)
598fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh)
599fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw)
600fcf5ef2aSThomas Huth #undef VARITHSAT_CASE
601fcf5ef2aSThomas Huth #undef VARITHSAT_DO
602fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED
603fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED
604fcf5ef2aSThomas Huth 
605fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype)                                   \
606fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
607fcf5ef2aSThomas Huth     {                                                                   \
608fcf5ef2aSThomas Huth         int i;                                                          \
609fcf5ef2aSThomas Huth                                                                         \
610fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
611fcf5ef2aSThomas Huth             etype x = (etype)a->element[i] + (etype)b->element[i] + 1;  \
612fcf5ef2aSThomas Huth             r->element[i] = x >> 1;                                     \
613fcf5ef2aSThomas Huth         }                                                               \
614fcf5ef2aSThomas Huth     }
615fcf5ef2aSThomas Huth 
616fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element,       \
617fcf5ef2aSThomas Huth              unsigned_type)                                             \
618fcf5ef2aSThomas Huth     VAVG_DO(avgs##type, signed_element, signed_type)                    \
619fcf5ef2aSThomas Huth     VAVG_DO(avgu##type, unsigned_element, unsigned_type)
620fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t)
621fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t)
622fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t)
623fcf5ef2aSThomas Huth #undef VAVG_DO
624fcf5ef2aSThomas Huth #undef VAVG
625fcf5ef2aSThomas Huth 
626fcf5ef2aSThomas Huth #define VABSDU_DO(name, element)                                        \
627fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)           \
628fcf5ef2aSThomas Huth {                                                                       \
629fcf5ef2aSThomas Huth     int i;                                                              \
630fcf5ef2aSThomas Huth                                                                         \
631fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                      \
632fcf5ef2aSThomas Huth         r->element[i] = (a->element[i] > b->element[i]) ?               \
633fcf5ef2aSThomas Huth             (a->element[i] - b->element[i]) :                           \
634fcf5ef2aSThomas Huth             (b->element[i] - a->element[i]);                            \
635fcf5ef2aSThomas Huth     }                                                                   \
636fcf5ef2aSThomas Huth }
637fcf5ef2aSThomas Huth 
638b6cb41b2SDavid Gibson /*
639b6cb41b2SDavid Gibson  * VABSDU - Vector absolute difference unsigned
640fcf5ef2aSThomas Huth  *   name    - instruction mnemonic suffix (b: byte, h: halfword, w: word)
641fcf5ef2aSThomas Huth  *   element - element type to access from vector
642fcf5ef2aSThomas Huth  */
643fcf5ef2aSThomas Huth #define VABSDU(type, element)                   \
644fcf5ef2aSThomas Huth     VABSDU_DO(absdu##type, element)
645fcf5ef2aSThomas Huth VABSDU(b, u8)
646fcf5ef2aSThomas Huth VABSDU(h, u16)
647fcf5ef2aSThomas Huth VABSDU(w, u32)
648fcf5ef2aSThomas Huth #undef VABSDU_DO
649fcf5ef2aSThomas Huth #undef VABSDU
650fcf5ef2aSThomas Huth 
651fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element)                                       \
652fcf5ef2aSThomas Huth     void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r,             \
653fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
654fcf5ef2aSThomas Huth     {                                                                   \
655fcf5ef2aSThomas Huth         int i;                                                          \
656fcf5ef2aSThomas Huth                                                                         \
65705ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
658fcf5ef2aSThomas Huth             float32 t = cvt(b->element[i], &env->vec_status);           \
65905ee3e8aSMark Cave-Ayland             r->f32[i] = float32_scalbn(t, -uim, &env->vec_status);      \
660fcf5ef2aSThomas Huth         }                                                               \
661fcf5ef2aSThomas Huth     }
662fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32)
663fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32)
664fcf5ef2aSThomas Huth #undef VCF
665fcf5ef2aSThomas Huth 
666eb936dc0SMatheus Ferst #define VCMPNEZ(NAME, ELEM) \
667eb936dc0SMatheus Ferst void helper_##NAME(ppc_vsr_t *t, ppc_vsr_t *a, ppc_vsr_t *b, uint32_t desc) \
668fcf5ef2aSThomas Huth {                                                                           \
669eb936dc0SMatheus Ferst     for (int i = 0; i < ARRAY_SIZE(t->ELEM); i++) {                         \
670eb936dc0SMatheus Ferst         t->ELEM[i] = ((a->ELEM[i] == 0) || (b->ELEM[i] == 0) ||             \
671eb936dc0SMatheus Ferst                       (a->ELEM[i] != b->ELEM[i])) ? -1 : 0;                 \
672fcf5ef2aSThomas Huth     }                                                                       \
673fcf5ef2aSThomas Huth }
674eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZB, u8)
675eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZH, u16)
676eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZW, u32)
677eb936dc0SMatheus Ferst #undef VCMPNEZ
678fcf5ef2aSThomas Huth 
679fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record)                       \
680fcf5ef2aSThomas Huth     void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r,            \
681fcf5ef2aSThomas Huth                              ppc_avr_t *a, ppc_avr_t *b)                \
682fcf5ef2aSThomas Huth     {                                                                   \
683fcf5ef2aSThomas Huth         uint32_t ones = (uint32_t)-1;                                   \
684fcf5ef2aSThomas Huth         uint32_t all = ones;                                            \
685fcf5ef2aSThomas Huth         uint32_t none = 0;                                              \
686fcf5ef2aSThomas Huth         int i;                                                          \
687fcf5ef2aSThomas Huth                                                                         \
68805ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
689fcf5ef2aSThomas Huth             uint32_t result;                                            \
69071bfd65cSRichard Henderson             FloatRelation rel =                                         \
69171bfd65cSRichard Henderson                 float32_compare_quiet(a->f32[i], b->f32[i],             \
692fcf5ef2aSThomas Huth                                       &env->vec_status);                \
693fcf5ef2aSThomas Huth             if (rel == float_relation_unordered) {                      \
694fcf5ef2aSThomas Huth                 result = 0;                                             \
695fcf5ef2aSThomas Huth             } else if (rel compare order) {                             \
696fcf5ef2aSThomas Huth                 result = ones;                                          \
697fcf5ef2aSThomas Huth             } else {                                                    \
698fcf5ef2aSThomas Huth                 result = 0;                                             \
699fcf5ef2aSThomas Huth             }                                                           \
700fcf5ef2aSThomas Huth             r->u32[i] = result;                                         \
701fcf5ef2aSThomas Huth             all &= result;                                              \
702fcf5ef2aSThomas Huth             none |= result;                                             \
703fcf5ef2aSThomas Huth         }                                                               \
704fcf5ef2aSThomas Huth         if (record) {                                                   \
705fcf5ef2aSThomas Huth             env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1);       \
706fcf5ef2aSThomas Huth         }                                                               \
707fcf5ef2aSThomas Huth     }
708fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order)          \
709fcf5ef2aSThomas Huth     VCMPFP_DO(suffix, compare, order, 0)        \
710fcf5ef2aSThomas Huth     VCMPFP_DO(suffix##_dot, compare, order, 1)
711fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal)
712fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less)
713fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater)
714fcf5ef2aSThomas Huth #undef VCMPFP_DO
715fcf5ef2aSThomas Huth #undef VCMPFP
716fcf5ef2aSThomas Huth 
717fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r,
718fcf5ef2aSThomas Huth                                     ppc_avr_t *a, ppc_avr_t *b, int record)
719fcf5ef2aSThomas Huth {
720fcf5ef2aSThomas Huth     int i;
721fcf5ef2aSThomas Huth     int all_in = 0;
722fcf5ef2aSThomas Huth 
72305ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
72471bfd65cSRichard Henderson         FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i],
72505ee3e8aSMark Cave-Ayland                                                      &env->vec_status);
726fcf5ef2aSThomas Huth         if (le_rel == float_relation_unordered) {
727fcf5ef2aSThomas Huth             r->u32[i] = 0xc0000000;
728fcf5ef2aSThomas Huth             all_in = 1;
729fcf5ef2aSThomas Huth         } else {
73005ee3e8aSMark Cave-Ayland             float32 bneg = float32_chs(b->f32[i]);
73171bfd65cSRichard Henderson             FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg,
73205ee3e8aSMark Cave-Ayland                                                          &env->vec_status);
733fcf5ef2aSThomas Huth             int le = le_rel != float_relation_greater;
734fcf5ef2aSThomas Huth             int ge = ge_rel != float_relation_less;
735fcf5ef2aSThomas Huth 
736fcf5ef2aSThomas Huth             r->u32[i] = ((!le) << 31) | ((!ge) << 30);
737fcf5ef2aSThomas Huth             all_in |= (!le | !ge);
738fcf5ef2aSThomas Huth         }
739fcf5ef2aSThomas Huth     }
740fcf5ef2aSThomas Huth     if (record) {
741fcf5ef2aSThomas Huth         env->crf[6] = (all_in == 0) << 1;
742fcf5ef2aSThomas Huth     }
743fcf5ef2aSThomas Huth }
744fcf5ef2aSThomas Huth 
745fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
746fcf5ef2aSThomas Huth {
747fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 0);
748fcf5ef2aSThomas Huth }
749fcf5ef2aSThomas Huth 
750fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
751fcf5ef2aSThomas Huth                         ppc_avr_t *b)
752fcf5ef2aSThomas Huth {
753fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 1);
754fcf5ef2aSThomas Huth }
755fcf5ef2aSThomas Huth 
756fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element)                                    \
757fcf5ef2aSThomas Huth     void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r,             \
758fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
759fcf5ef2aSThomas Huth     {                                                                   \
760fcf5ef2aSThomas Huth         int i;                                                          \
761fcf5ef2aSThomas Huth         int sat = 0;                                                    \
762fcf5ef2aSThomas Huth         float_status s = env->vec_status;                               \
763fcf5ef2aSThomas Huth                                                                         \
764fcf5ef2aSThomas Huth         set_float_rounding_mode(float_round_to_zero, &s);               \
76505ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
76605ee3e8aSMark Cave-Ayland             if (float32_is_any_nan(b->f32[i])) {                        \
767fcf5ef2aSThomas Huth                 r->element[i] = 0;                                      \
768fcf5ef2aSThomas Huth             } else {                                                    \
76905ee3e8aSMark Cave-Ayland                 float64 t = float32_to_float64(b->f32[i], &s);          \
770fcf5ef2aSThomas Huth                 int64_t j;                                              \
771fcf5ef2aSThomas Huth                                                                         \
772fcf5ef2aSThomas Huth                 t = float64_scalbn(t, uim, &s);                         \
773fcf5ef2aSThomas Huth                 j = float64_to_int64(t, &s);                            \
774fcf5ef2aSThomas Huth                 r->element[i] = satcvt(j, &sat);                        \
775fcf5ef2aSThomas Huth             }                                                           \
776fcf5ef2aSThomas Huth         }                                                               \
777fcf5ef2aSThomas Huth         if (sat) {                                                      \
7786175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
779fcf5ef2aSThomas Huth         }                                                               \
780fcf5ef2aSThomas Huth     }
781fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32)
782fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32)
783fcf5ef2aSThomas Huth #undef VCT
784fcf5ef2aSThomas Huth 
785fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r)
786fcf5ef2aSThomas Huth {
787fcf5ef2aSThomas Huth     target_ulong count = 0;
788fcf5ef2aSThomas Huth     int i;
78960594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
79060594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
791fcf5ef2aSThomas Huth             break;
792fcf5ef2aSThomas Huth         }
793fcf5ef2aSThomas Huth         count++;
794fcf5ef2aSThomas Huth     }
795fcf5ef2aSThomas Huth     return count;
796fcf5ef2aSThomas Huth }
797fcf5ef2aSThomas Huth 
798fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r)
799fcf5ef2aSThomas Huth {
800fcf5ef2aSThomas Huth     target_ulong count = 0;
801fcf5ef2aSThomas Huth     int i;
802fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
80360594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
804fcf5ef2aSThomas Huth             break;
805fcf5ef2aSThomas Huth         }
806fcf5ef2aSThomas Huth         count++;
807fcf5ef2aSThomas Huth     }
808fcf5ef2aSThomas Huth     return count;
809fcf5ef2aSThomas Huth }
810fcf5ef2aSThomas Huth 
811fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
812fcf5ef2aSThomas Huth                       ppc_avr_t *b, ppc_avr_t *c)
813fcf5ef2aSThomas Huth {
814fcf5ef2aSThomas Huth     int sat = 0;
815fcf5ef2aSThomas Huth     int i;
816fcf5ef2aSThomas Huth 
817fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
818fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
819fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
820fcf5ef2aSThomas Huth 
821fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
822fcf5ef2aSThomas Huth     }
823fcf5ef2aSThomas Huth 
824fcf5ef2aSThomas Huth     if (sat) {
8256175f5a0SRichard Henderson         set_vscr_sat(env);
826fcf5ef2aSThomas Huth     }
827fcf5ef2aSThomas Huth }
828fcf5ef2aSThomas Huth 
829fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
830fcf5ef2aSThomas Huth                        ppc_avr_t *b, ppc_avr_t *c)
831fcf5ef2aSThomas Huth {
832fcf5ef2aSThomas Huth     int sat = 0;
833fcf5ef2aSThomas Huth     int i;
834fcf5ef2aSThomas Huth 
835fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
836fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i] + 0x00004000;
837fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
838fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
839fcf5ef2aSThomas Huth     }
840fcf5ef2aSThomas Huth 
841fcf5ef2aSThomas Huth     if (sat) {
8426175f5a0SRichard Henderson         set_vscr_sat(env);
843fcf5ef2aSThomas Huth     }
844fcf5ef2aSThomas Huth }
845fcf5ef2aSThomas Huth 
846fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
847fcf5ef2aSThomas Huth {
848fcf5ef2aSThomas Huth     int i;
849fcf5ef2aSThomas Huth 
850fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
851fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
852fcf5ef2aSThomas Huth         r->s16[i] = (int16_t) (prod + c->s16[i]);
853fcf5ef2aSThomas Huth     }
854fcf5ef2aSThomas Huth }
855fcf5ef2aSThomas Huth 
856d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs)                                  \
857fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)            \
858fcf5ef2aSThomas Huth     {                                                                        \
859fcf5ef2aSThomas Huth         ppc_avr_t result;                                                    \
860d81c2040SMark Cave-Ayland         int i, half = ARRAY_SIZE(r->element) / 2;                            \
861fcf5ef2aSThomas Huth                                                                              \
862d81c2040SMark Cave-Ayland         for (i = 0; i < half; i++) {                                         \
863d81c2040SMark Cave-Ayland             result.access(i * 2 + 0) = a->access(i + ofs);                   \
864d81c2040SMark Cave-Ayland             result.access(i * 2 + 1) = b->access(i + ofs);                   \
865fcf5ef2aSThomas Huth         }                                                                    \
866fcf5ef2aSThomas Huth         *r = result;                                                         \
867fcf5ef2aSThomas Huth     }
868d81c2040SMark Cave-Ayland 
869d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access)          \
870d81c2040SMark Cave-Ayland     VMRG_DO(mrgl##suffix, element, access, half)   \
871d81c2040SMark Cave-Ayland     VMRG_DO(mrgh##suffix, element, access, 0)
872d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB)
873d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH)
874d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW)
875fcf5ef2aSThomas Huth #undef VMRG_DO
876fcf5ef2aSThomas Huth #undef VMRG
877fcf5ef2aSThomas Huth 
878fcf5ef2aSThomas Huth void helper_vmsummbm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
879fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
880fcf5ef2aSThomas Huth {
881fcf5ef2aSThomas Huth     int32_t prod[16];
882fcf5ef2aSThomas Huth     int i;
883fcf5ef2aSThomas Huth 
884fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s8); i++) {
885fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s8[i] * b->u8[i];
886fcf5ef2aSThomas Huth     }
887fcf5ef2aSThomas Huth 
888fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
889fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] +
890fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
891fcf5ef2aSThomas Huth     }
892fcf5ef2aSThomas Huth }
893fcf5ef2aSThomas Huth 
894fcf5ef2aSThomas Huth void helper_vmsumshm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
895fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
896fcf5ef2aSThomas Huth {
897fcf5ef2aSThomas Huth     int32_t prod[8];
898fcf5ef2aSThomas Huth     int i;
899fcf5ef2aSThomas Huth 
900fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
901fcf5ef2aSThomas Huth         prod[i] = a->s16[i] * b->s16[i];
902fcf5ef2aSThomas Huth     }
903fcf5ef2aSThomas Huth 
904fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
905fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1];
906fcf5ef2aSThomas Huth     }
907fcf5ef2aSThomas Huth }
908fcf5ef2aSThomas Huth 
909fcf5ef2aSThomas Huth void helper_vmsumshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
910fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
911fcf5ef2aSThomas Huth {
912fcf5ef2aSThomas Huth     int32_t prod[8];
913fcf5ef2aSThomas Huth     int i;
914fcf5ef2aSThomas Huth     int sat = 0;
915fcf5ef2aSThomas Huth 
916fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
917fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s16[i] * b->s16[i];
918fcf5ef2aSThomas Huth     }
919fcf5ef2aSThomas Huth 
920fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
921fcf5ef2aSThomas Huth         int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1];
922fcf5ef2aSThomas Huth 
923fcf5ef2aSThomas Huth         r->u32[i] = cvtsdsw(t, &sat);
924fcf5ef2aSThomas Huth     }
925fcf5ef2aSThomas Huth 
926fcf5ef2aSThomas Huth     if (sat) {
9276175f5a0SRichard Henderson         set_vscr_sat(env);
928fcf5ef2aSThomas Huth     }
929fcf5ef2aSThomas Huth }
930fcf5ef2aSThomas Huth 
931fcf5ef2aSThomas Huth void helper_vmsumubm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
932fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
933fcf5ef2aSThomas Huth {
934fcf5ef2aSThomas Huth     uint16_t prod[16];
935fcf5ef2aSThomas Huth     int i;
936fcf5ef2aSThomas Huth 
937fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
938fcf5ef2aSThomas Huth         prod[i] = a->u8[i] * b->u8[i];
939fcf5ef2aSThomas Huth     }
940fcf5ef2aSThomas Huth 
941fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
942fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] +
943fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
944fcf5ef2aSThomas Huth     }
945fcf5ef2aSThomas Huth }
946fcf5ef2aSThomas Huth 
947fcf5ef2aSThomas Huth void helper_vmsumuhm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
948fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
949fcf5ef2aSThomas Huth {
950fcf5ef2aSThomas Huth     uint32_t prod[8];
951fcf5ef2aSThomas Huth     int i;
952fcf5ef2aSThomas Huth 
953fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
954fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
955fcf5ef2aSThomas Huth     }
956fcf5ef2aSThomas Huth 
957fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
958fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1];
959fcf5ef2aSThomas Huth     }
960fcf5ef2aSThomas Huth }
961fcf5ef2aSThomas Huth 
962fcf5ef2aSThomas Huth void helper_vmsumuhs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
963fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
964fcf5ef2aSThomas Huth {
965fcf5ef2aSThomas Huth     uint32_t prod[8];
966fcf5ef2aSThomas Huth     int i;
967fcf5ef2aSThomas Huth     int sat = 0;
968fcf5ef2aSThomas Huth 
969fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
970fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
971fcf5ef2aSThomas Huth     }
972fcf5ef2aSThomas Huth 
973fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
974fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1];
975fcf5ef2aSThomas Huth 
976fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
977fcf5ef2aSThomas Huth     }
978fcf5ef2aSThomas Huth 
979fcf5ef2aSThomas Huth     if (sat) {
9806175f5a0SRichard Henderson         set_vscr_sat(env);
981fcf5ef2aSThomas Huth     }
982fcf5ef2aSThomas Huth }
983fcf5ef2aSThomas Huth 
9844fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast)   \
98580eca687SLucas Mateus Castro (alqotel)     void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
986fcf5ef2aSThomas Huth     {                                                                   \
987fcf5ef2aSThomas Huth         int i;                                                          \
988fcf5ef2aSThomas Huth                                                                         \
9894fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
9904fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i) *           \
9914fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i);            \
992fcf5ef2aSThomas Huth         }                                                               \
993fcf5ef2aSThomas Huth     }
9944fbc89edSMark Cave-Ayland 
9954fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast)   \
99680eca687SLucas Mateus Castro (alqotel)     void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
9974fbc89edSMark Cave-Ayland     {                                                                   \
9984fbc89edSMark Cave-Ayland         int i;                                                          \
9994fbc89edSMark Cave-Ayland                                                                         \
10004fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
10014fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) *       \
10024fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i + 1);        \
10034fbc89edSMark Cave-Ayland         }                                                               \
10044fbc89edSMark Cave-Ayland     }
10054fbc89edSMark Cave-Ayland 
10064fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast)       \
100780eca687SLucas Mateus Castro (alqotel)     VMUL_DO_EVN(MULE##suffix, mul_element, mul_access, prod_access, cast)  \
100880eca687SLucas Mateus Castro (alqotel)     VMUL_DO_ODD(MULO##suffix, mul_element, mul_access, prod_access, cast)
100980eca687SLucas Mateus Castro (alqotel) VMUL(SB, s8, VsrSB, VsrSH, int16_t)
101080eca687SLucas Mateus Castro (alqotel) VMUL(SH, s16, VsrSH, VsrSW, int32_t)
101180eca687SLucas Mateus Castro (alqotel) VMUL(SW, s32, VsrSW, VsrSD, int64_t)
101280eca687SLucas Mateus Castro (alqotel) VMUL(UB, u8, VsrB, VsrH, uint16_t)
101380eca687SLucas Mateus Castro (alqotel) VMUL(UH, u16, VsrH, VsrW, uint32_t)
101480eca687SLucas Mateus Castro (alqotel) VMUL(UW, u32, VsrW, VsrD, uint64_t)
10154fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN
10164fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD
1017fcf5ef2aSThomas Huth #undef VMUL
1018fcf5ef2aSThomas Huth 
101941c2877fSMatheus Ferst void helper_XXPERMX(ppc_vsr_t *t, ppc_vsr_t *s0, ppc_vsr_t *s1, ppc_vsr_t *pcv,
102041c2877fSMatheus Ferst                     target_ulong uim)
102141c2877fSMatheus Ferst {
102241c2877fSMatheus Ferst     int i, idx;
102341c2877fSMatheus Ferst     ppc_vsr_t tmp = { .u64 = {0, 0} };
102441c2877fSMatheus Ferst 
102541c2877fSMatheus Ferst     for (i = 0; i < ARRAY_SIZE(t->u8); i++) {
102641c2877fSMatheus Ferst         if ((pcv->VsrB(i) >> 5) == uim) {
102741c2877fSMatheus Ferst             idx = pcv->VsrB(i) & 0x1f;
102841c2877fSMatheus Ferst             if (idx < ARRAY_SIZE(t->u8)) {
102941c2877fSMatheus Ferst                 tmp.VsrB(i) = s0->VsrB(idx);
103041c2877fSMatheus Ferst             } else {
103141c2877fSMatheus Ferst                 tmp.VsrB(i) = s1->VsrB(idx - ARRAY_SIZE(t->u8));
103241c2877fSMatheus Ferst             }
103341c2877fSMatheus Ferst         }
103441c2877fSMatheus Ferst     }
103541c2877fSMatheus Ferst 
103641c2877fSMatheus Ferst     *t = tmp;
103741c2877fSMatheus Ferst }
103841c2877fSMatheus Ferst 
103928347fe2SMatheus Ferst void helper_VPERM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1040fcf5ef2aSThomas Huth {
1041fcf5ef2aSThomas Huth     ppc_avr_t result;
1042fcf5ef2aSThomas Huth     int i;
1043fcf5ef2aSThomas Huth 
104460594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
104560594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1046fcf5ef2aSThomas Huth         int index = s & 0xf;
1047fcf5ef2aSThomas Huth 
1048fcf5ef2aSThomas Huth         if (s & 0x10) {
104960594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1050fcf5ef2aSThomas Huth         } else {
105160594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1052fcf5ef2aSThomas Huth         }
1053fcf5ef2aSThomas Huth     }
1054fcf5ef2aSThomas Huth     *r = result;
1055fcf5ef2aSThomas Huth }
1056fcf5ef2aSThomas Huth 
105728347fe2SMatheus Ferst void helper_VPERMR(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1058fcf5ef2aSThomas Huth {
1059fcf5ef2aSThomas Huth     ppc_avr_t result;
1060fcf5ef2aSThomas Huth     int i;
1061fcf5ef2aSThomas Huth 
106260594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
106360594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1064fcf5ef2aSThomas Huth         int index = 15 - (s & 0xf);
1065fcf5ef2aSThomas Huth 
1066fcf5ef2aSThomas Huth         if (s & 0x10) {
106760594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1068fcf5ef2aSThomas Huth         } else {
106960594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1070fcf5ef2aSThomas Huth         }
1071fcf5ef2aSThomas Huth     }
1072fcf5ef2aSThomas Huth     *r = result;
1073fcf5ef2aSThomas Huth }
1074fcf5ef2aSThomas Huth 
/*
 * Host-endianness dependent accessors used by the bit-permute helpers.
 *
 *   VBPERMQ_INDEX(avr, i)       - byte i of avr
 *   VBPERMD_INDEX(i)            - host u64[] slot for doubleword i
 *   VBPERMQ_DW(index)           - host u64[] slot selected by bit 6 of index
 *   EXTRACT_BIT(avr, i, index)  - single bit "index" of doubleword i of avr
 *
 * Every macro argument is parenthesised so that callers may pass
 * arbitrary expressions.
 */
#if defined(HOST_WORDS_BIGENDIAN)
#define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)])
#define VBPERMD_INDEX(i) (i)
#define VBPERMQ_DW(index) (((index) & 0x40) != 0)
#define EXTRACT_BIT(avr, i, index) (extract64((avr)->u64[(i)], (index), 1))
#else
#define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)])
#define VBPERMD_INDEX(i) (1 - (i))
#define VBPERMQ_DW(index) (((index) & 0x40) == 0)
#define EXTRACT_BIT(avr, i, index) \
        (extract64((avr)->u64[1 - (i)], 63 - (index), 1))
#endif
1087fcf5ef2aSThomas Huth 
1088fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1089fcf5ef2aSThomas Huth {
1090fcf5ef2aSThomas Huth     int i, j;
1091fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
1092fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1093fcf5ef2aSThomas Huth         for (j = 0; j < 8; j++) {
1094fcf5ef2aSThomas Huth             int index = VBPERMQ_INDEX(b, (i * 8) + j);
1095fcf5ef2aSThomas Huth             if (index < 64 && EXTRACT_BIT(a, i, index)) {
1096fcf5ef2aSThomas Huth                 result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j);
1097fcf5ef2aSThomas Huth             }
1098fcf5ef2aSThomas Huth         }
1099fcf5ef2aSThomas Huth     }
1100fcf5ef2aSThomas Huth     *r = result;
1101fcf5ef2aSThomas Huth }
1102fcf5ef2aSThomas Huth 
1103fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1104fcf5ef2aSThomas Huth {
1105fcf5ef2aSThomas Huth     int i;
1106fcf5ef2aSThomas Huth     uint64_t perm = 0;
1107fcf5ef2aSThomas Huth 
1108fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
1109fcf5ef2aSThomas Huth         int index = VBPERMQ_INDEX(b, i);
1110fcf5ef2aSThomas Huth 
1111fcf5ef2aSThomas Huth         if (index < 128) {
1112fcf5ef2aSThomas Huth             uint64_t mask = (1ull << (63 - (index & 0x3F)));
1113fcf5ef2aSThomas Huth             if (a->u64[VBPERMQ_DW(index)] & mask) {
1114fcf5ef2aSThomas Huth                 perm |= (0x8000 >> i);
1115fcf5ef2aSThomas Huth             }
1116fcf5ef2aSThomas Huth         }
1117fcf5ef2aSThomas Huth     }
1118fcf5ef2aSThomas Huth 
11193c385a93SMark Cave-Ayland     r->VsrD(0) = perm;
11203c385a93SMark Cave-Ayland     r->VsrD(1) = 0;
1121fcf5ef2aSThomas Huth }
1122fcf5ef2aSThomas Huth 
1123fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX
1124fcf5ef2aSThomas Huth #undef VBPERMQ_DW
1125fcf5ef2aSThomas Huth 
1126fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp)                   \
1127fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)  \
1128fcf5ef2aSThomas Huth {                                                             \
1129fcf5ef2aSThomas Huth     int i, j;                                                 \
1130fcf5ef2aSThomas Huth     trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])];    \
1131fcf5ef2aSThomas Huth                                                               \
1132fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, srcfld) {                         \
1133fcf5ef2aSThomas Huth         prod[i] = 0;                                          \
1134fcf5ef2aSThomas Huth         for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) {      \
1135fcf5ef2aSThomas Huth             if (a->srcfld[i] & (1ull << j)) {                 \
1136fcf5ef2aSThomas Huth                 prod[i] ^= ((trgtyp)b->srcfld[i] << j);       \
1137fcf5ef2aSThomas Huth             }                                                 \
1138fcf5ef2aSThomas Huth         }                                                     \
1139fcf5ef2aSThomas Huth     }                                                         \
1140fcf5ef2aSThomas Huth                                                               \
1141fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, trgfld) {                         \
1142fcf5ef2aSThomas Huth         r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1];         \
1143fcf5ef2aSThomas Huth     }                                                         \
1144fcf5ef2aSThomas Huth }
1145fcf5ef2aSThomas Huth 
1146fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t)
1147fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t)
1148fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t)
1149fcf5ef2aSThomas Huth 
1150fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1151fcf5ef2aSThomas Huth {
1152fcf5ef2aSThomas Huth 
1153fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1154fcf5ef2aSThomas Huth     int i, j;
1155fcf5ef2aSThomas Huth     __uint128_t prod[2];
1156fcf5ef2aSThomas Huth 
1157fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1158fcf5ef2aSThomas Huth         prod[i] = 0;
1159fcf5ef2aSThomas Huth         for (j = 0; j < 64; j++) {
1160fcf5ef2aSThomas Huth             if (a->u64[i] & (1ull << j)) {
1161fcf5ef2aSThomas Huth                 prod[i] ^= (((__uint128_t)b->u64[i]) << j);
1162fcf5ef2aSThomas Huth             }
1163fcf5ef2aSThomas Huth         }
1164fcf5ef2aSThomas Huth     }
1165fcf5ef2aSThomas Huth 
1166fcf5ef2aSThomas Huth     r->u128 = prod[0] ^ prod[1];
1167fcf5ef2aSThomas Huth 
1168fcf5ef2aSThomas Huth #else
1169fcf5ef2aSThomas Huth     int i, j;
1170fcf5ef2aSThomas Huth     ppc_avr_t prod[2];
1171fcf5ef2aSThomas Huth 
1172fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
11733c385a93SMark Cave-Ayland         prod[i].VsrD(1) = prod[i].VsrD(0) = 0;
1174fcf5ef2aSThomas Huth         for (j = 0; j < 64; j++) {
1175fcf5ef2aSThomas Huth             if (a->u64[i] & (1ull << j)) {
1176fcf5ef2aSThomas Huth                 ppc_avr_t bshift;
1177fcf5ef2aSThomas Huth                 if (j == 0) {
11783c385a93SMark Cave-Ayland                     bshift.VsrD(0) = 0;
11793c385a93SMark Cave-Ayland                     bshift.VsrD(1) = b->u64[i];
1180fcf5ef2aSThomas Huth                 } else {
11813c385a93SMark Cave-Ayland                     bshift.VsrD(0) = b->u64[i] >> (64 - j);
11823c385a93SMark Cave-Ayland                     bshift.VsrD(1) = b->u64[i] << j;
1183fcf5ef2aSThomas Huth                 }
11843c385a93SMark Cave-Ayland                 prod[i].VsrD(1) ^= bshift.VsrD(1);
11853c385a93SMark Cave-Ayland                 prod[i].VsrD(0) ^= bshift.VsrD(0);
1186fcf5ef2aSThomas Huth             }
1187fcf5ef2aSThomas Huth         }
1188fcf5ef2aSThomas Huth     }
1189fcf5ef2aSThomas Huth 
11903c385a93SMark Cave-Ayland     r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1);
11913c385a93SMark Cave-Ayland     r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0);
1192fcf5ef2aSThomas Huth #endif
1193fcf5ef2aSThomas Huth }
1194fcf5ef2aSThomas Huth 
1195fcf5ef2aSThomas Huth 
1196fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1197fcf5ef2aSThomas Huth #define PKBIG 1
1198fcf5ef2aSThomas Huth #else
1199fcf5ef2aSThomas Huth #define PKBIG 0
1200fcf5ef2aSThomas Huth #endif
1201fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1202fcf5ef2aSThomas Huth {
1203fcf5ef2aSThomas Huth     int i, j;
1204fcf5ef2aSThomas Huth     ppc_avr_t result;
1205fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1206fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { a, b };
1207fcf5ef2aSThomas Huth #else
1208fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { b, a };
1209fcf5ef2aSThomas Huth #endif
1210fcf5ef2aSThomas Huth 
1211fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1212fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(j, u32) {
1213fcf5ef2aSThomas Huth             uint32_t e = x[i]->u32[j];
1214fcf5ef2aSThomas Huth 
1215fcf5ef2aSThomas Huth             result.u16[4 * i + j] = (((e >> 9) & 0xfc00) |
1216fcf5ef2aSThomas Huth                                      ((e >> 6) & 0x3e0) |
1217fcf5ef2aSThomas Huth                                      ((e >> 3) & 0x1f));
1218fcf5ef2aSThomas Huth         }
1219fcf5ef2aSThomas Huth     }
1220fcf5ef2aSThomas Huth     *r = result;
1221fcf5ef2aSThomas Huth }
1222fcf5ef2aSThomas Huth 
1223fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat)                               \
1224fcf5ef2aSThomas Huth     void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r,             \
1225fcf5ef2aSThomas Huth                             ppc_avr_t *a, ppc_avr_t *b)                 \
1226fcf5ef2aSThomas Huth     {                                                                   \
1227fcf5ef2aSThomas Huth         int i;                                                          \
1228fcf5ef2aSThomas Huth         int sat = 0;                                                    \
1229fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1230fcf5ef2aSThomas Huth         ppc_avr_t *a0 = PKBIG ? a : b;                                  \
1231fcf5ef2aSThomas Huth         ppc_avr_t *a1 = PKBIG ? b : a;                                  \
1232fcf5ef2aSThomas Huth                                                                         \
1233fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(i, from) {                                 \
1234fcf5ef2aSThomas Huth             result.to[i] = cvt(a0->from[i], &sat);                      \
1235fcf5ef2aSThomas Huth             result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\
1236fcf5ef2aSThomas Huth         }                                                               \
1237fcf5ef2aSThomas Huth         *r = result;                                                    \
1238fcf5ef2aSThomas Huth         if (dosat && sat) {                                             \
12396175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
1240fcf5ef2aSThomas Huth         }                                                               \
1241fcf5ef2aSThomas Huth     }
1242fcf5ef2aSThomas Huth #define I(x, y) (x)
1243fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1)
1244fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1)
1245fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1)
1246fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1)
1247fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1)
1248fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1)
1249fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1)
1250fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1)
1251fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1)
1252fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0)
1253fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0)
1254fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0)
1255fcf5ef2aSThomas Huth #undef I
1256fcf5ef2aSThomas Huth #undef VPK
1257fcf5ef2aSThomas Huth #undef PKBIG
1258fcf5ef2aSThomas Huth 
1259fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1260fcf5ef2aSThomas Huth {
1261fcf5ef2aSThomas Huth     int i;
1262fcf5ef2aSThomas Huth 
126305ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
126405ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status);
1265fcf5ef2aSThomas Huth     }
1266fcf5ef2aSThomas Huth }
1267fcf5ef2aSThomas Huth 
1268fcf5ef2aSThomas Huth #define VRFI(suffix, rounding)                                  \
1269fcf5ef2aSThomas Huth     void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r,    \
1270fcf5ef2aSThomas Huth                              ppc_avr_t *b)                      \
1271fcf5ef2aSThomas Huth     {                                                           \
1272fcf5ef2aSThomas Huth         int i;                                                  \
1273fcf5ef2aSThomas Huth         float_status s = env->vec_status;                       \
1274fcf5ef2aSThomas Huth                                                                 \
1275fcf5ef2aSThomas Huth         set_float_rounding_mode(rounding, &s);                  \
127605ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {              \
127705ee3e8aSMark Cave-Ayland             r->f32[i] = float32_round_to_int (b->f32[i], &s);   \
1278fcf5ef2aSThomas Huth         }                                                       \
1279fcf5ef2aSThomas Huth     }
1280fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even)
1281fcf5ef2aSThomas Huth VRFI(m, float_round_down)
1282fcf5ef2aSThomas Huth VRFI(p, float_round_up)
1283fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero)
1284fcf5ef2aSThomas Huth #undef VRFI
1285fcf5ef2aSThomas Huth 
1286fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1287fcf5ef2aSThomas Huth {
1288fcf5ef2aSThomas Huth     int i;
1289fcf5ef2aSThomas Huth 
129005ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
129105ee3e8aSMark Cave-Ayland         float32 t = float32_sqrt(b->f32[i], &env->vec_status);
1292fcf5ef2aSThomas Huth 
129305ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, t, &env->vec_status);
1294fcf5ef2aSThomas Huth     }
1295fcf5ef2aSThomas Huth }
1296fcf5ef2aSThomas Huth 
1297fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert)                                  \
129802c74f0eSMatheus Ferst void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \
1299fcf5ef2aSThomas Huth {                                                                           \
1300fcf5ef2aSThomas Huth     int i;                                                                  \
1301fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                          \
1302fcf5ef2aSThomas Huth         uint##size##_t src1 = a->element[i];                                \
1303fcf5ef2aSThomas Huth         uint##size##_t src2 = b->element[i];                                \
1304fcf5ef2aSThomas Huth         uint##size##_t src3 = r->element[i];                                \
1305fcf5ef2aSThomas Huth         uint##size##_t begin, end, shift, mask, rot_val;                    \
1306fcf5ef2aSThomas Huth                                                                             \
1307fcf5ef2aSThomas Huth         shift = extract##size(src2, 0, 6);                                  \
1308fcf5ef2aSThomas Huth         end   = extract##size(src2, 8, 6);                                  \
1309fcf5ef2aSThomas Huth         begin = extract##size(src2, 16, 6);                                 \
1310fcf5ef2aSThomas Huth         rot_val = rol##size(src1, shift);                                   \
1311fcf5ef2aSThomas Huth         mask = mask_u##size(begin, end);                                    \
1312fcf5ef2aSThomas Huth         if (insert) {                                                       \
1313fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask) | (src3 & ~mask);              \
1314fcf5ef2aSThomas Huth         } else {                                                            \
1315fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask);                               \
1316fcf5ef2aSThomas Huth         }                                                                   \
1317fcf5ef2aSThomas Huth     }                                                                       \
1318fcf5ef2aSThomas Huth }
1319fcf5ef2aSThomas Huth 
132002c74f0eSMatheus Ferst VRLMI(VRLDMI, 64, u64, 1);
132102c74f0eSMatheus Ferst VRLMI(VRLWMI, 32, u32, 1);
132202c74f0eSMatheus Ferst VRLMI(VRLDNM, 64, u64, 0);
132302c74f0eSMatheus Ferst VRLMI(VRLWNM, 32, u32, 0);
1324fcf5ef2aSThomas Huth 
1325fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1326fcf5ef2aSThomas Huth {
1327fcf5ef2aSThomas Huth     int i;
1328fcf5ef2aSThomas Huth 
132905ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
133005ee3e8aSMark Cave-Ayland         r->f32[i] = float32_exp2(b->f32[i], &env->vec_status);
1331fcf5ef2aSThomas Huth     }
1332fcf5ef2aSThomas Huth }
1333fcf5ef2aSThomas Huth 
1334fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1335fcf5ef2aSThomas Huth {
1336fcf5ef2aSThomas Huth     int i;
1337fcf5ef2aSThomas Huth 
133805ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
133905ee3e8aSMark Cave-Ayland         r->f32[i] = float32_log2(b->f32[i], &env->vec_status);
1340fcf5ef2aSThomas Huth     }
1341fcf5ef2aSThomas Huth }
1342fcf5ef2aSThomas Huth 
134360caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left)                            \
134460caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b)  \
134560caf221SAvinesh Kumar {                                                               \
1346f297c4c6SMatheus Ferst     int index = (a & 0xf) * 8;                                  \
134760caf221SAvinesh Kumar     if (left) {                                                 \
1348f297c4c6SMatheus Ferst         index = 128 - index - size;                             \
134960caf221SAvinesh Kumar     }                                                           \
135060caf221SAvinesh Kumar     return int128_getlo(int128_rshift(b->s128, index)) &        \
135160caf221SAvinesh Kumar         MAKE_64BIT_MASK(0, size);                               \
135260caf221SAvinesh Kumar }
135360caf221SAvinesh Kumar VEXTU_X_DO(vextublx,  8, 1)
135460caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1)
135560caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1)
135660caf221SAvinesh Kumar VEXTU_X_DO(vextubrx,  8, 0)
135760caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0)
135860caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0)
135960caf221SAvinesh Kumar #undef VEXTU_X_DO
136060caf221SAvinesh Kumar 
1361fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1362fcf5ef2aSThomas Huth {
1363fcf5ef2aSThomas Huth     int i;
1364fcf5ef2aSThomas Huth     unsigned int shift, bytes, size;
1365fcf5ef2aSThomas Huth 
1366fcf5ef2aSThomas Huth     size = ARRAY_SIZE(r->u8);
1367fcf5ef2aSThomas Huth     for (i = 0; i < size; i++) {
136863be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;             /* extract shift value */
136963be02fcSAnton Blanchard         bytes = (a->VsrB(i) << 8) +           /* extract adjacent bytes */
137063be02fcSAnton Blanchard             (((i + 1) < size) ? a->VsrB(i + 1) : 0);
137163be02fcSAnton Blanchard         r->VsrB(i) = (bytes << shift) >> 8;   /* shift and store result */
1372fcf5ef2aSThomas Huth     }
1373fcf5ef2aSThomas Huth }
1374fcf5ef2aSThomas Huth 
1375fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1376fcf5ef2aSThomas Huth {
1377fcf5ef2aSThomas Huth     int i;
1378fcf5ef2aSThomas Huth     unsigned int shift, bytes;
1379fcf5ef2aSThomas Huth 
1380b6cb41b2SDavid Gibson     /*
1381b6cb41b2SDavid Gibson      * Use reverse order, as destination and source register can be
1382b6cb41b2SDavid Gibson      * same. Its being modified in place saving temporary, reverse
1383b6cb41b2SDavid Gibson      * order will guarantee that computed result is not fed back.
1384fcf5ef2aSThomas Huth      */
1385fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
138663be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;               /* extract shift value */
138763be02fcSAnton Blanchard         bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i);
1388fcf5ef2aSThomas Huth                                                 /* extract adjacent bytes */
138963be02fcSAnton Blanchard         r->VsrB(i) = (bytes >> shift) & 0xFF;   /* shift and store result */
1390fcf5ef2aSThomas Huth     }
1391fcf5ef2aSThomas Huth }
1392fcf5ef2aSThomas Huth 
1393fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift)
1394fcf5ef2aSThomas Huth {
1395fcf5ef2aSThomas Huth     int sh = shift & 0xf;
1396fcf5ef2aSThomas Huth     int i;
1397fcf5ef2aSThomas Huth     ppc_avr_t result;
1398fcf5ef2aSThomas Huth 
1399fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
1400fcf5ef2aSThomas Huth         int index = sh + i;
1401fcf5ef2aSThomas Huth         if (index > 0xf) {
140260594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index - 0x10);
1403fcf5ef2aSThomas Huth         } else {
140460594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1405fcf5ef2aSThomas Huth         }
1406fcf5ef2aSThomas Huth     }
1407fcf5ef2aSThomas Huth     *r = result;
1408fcf5ef2aSThomas Huth }
1409fcf5ef2aSThomas Huth 
1410fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1411fcf5ef2aSThomas Huth {
14123c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1413fcf5ef2aSThomas Huth 
1414fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1415fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1416fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1417fcf5ef2aSThomas Huth #else
1418fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1419fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1420fcf5ef2aSThomas Huth #endif
1421fcf5ef2aSThomas Huth }
1422fcf5ef2aSThomas Huth 
1423fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
14242cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[IDX])
14252cc12af3SMatheus Ferst #else
14262cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[15 - (IDX)] - (SIZE) + 1)
14272cc12af3SMatheus Ferst #endif
14282cc12af3SMatheus Ferst 
14292cc12af3SMatheus Ferst #define VINSX(SUFFIX, TYPE) \
14302cc12af3SMatheus Ferst void glue(glue(helper_VINS, SUFFIX), LX)(CPUPPCState *env, ppc_avr_t *t,       \
14312cc12af3SMatheus Ferst                                          uint64_t val, target_ulong index)     \
14322cc12af3SMatheus Ferst {                                                                              \
14332cc12af3SMatheus Ferst     const int maxidx = ARRAY_SIZE(t->u8) - sizeof(TYPE);                       \
14342cc12af3SMatheus Ferst     target_long idx = index;                                                   \
14352cc12af3SMatheus Ferst                                                                                \
14362cc12af3SMatheus Ferst     if (idx < 0 || idx > maxidx) {                                             \
14372cc12af3SMatheus Ferst         idx =  idx < 0 ? sizeof(TYPE) - idx : idx;                             \
14382cc12af3SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR,                                         \
14392cc12af3SMatheus Ferst             "Invalid index for Vector Insert Element after 0x" TARGET_FMT_lx   \
14402cc12af3SMatheus Ferst             ", RA = " TARGET_FMT_ld " > %d\n", env->nip, idx, maxidx);         \
14412cc12af3SMatheus Ferst     } else {                                                                   \
14422cc12af3SMatheus Ferst         TYPE src = val;                                                        \
14432cc12af3SMatheus Ferst         memcpy(ELEM_ADDR(t, idx, sizeof(TYPE)), &src, sizeof(TYPE));           \
14442cc12af3SMatheus Ferst     }                                                                          \
14452cc12af3SMatheus Ferst }
14462cc12af3SMatheus Ferst VINSX(B, uint8_t)
14472cc12af3SMatheus Ferst VINSX(H, uint16_t)
14482cc12af3SMatheus Ferst VINSX(W, uint32_t)
14492cc12af3SMatheus Ferst VINSX(D, uint64_t)
14502cc12af3SMatheus Ferst #undef ELEM_ADDR
14512cc12af3SMatheus Ferst #undef VINSX
1452fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
145328110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
145428110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
145528110b72SMatheus Ferst                    target_ulong index)                                         \
145628110b72SMatheus Ferst {                                                                              \
145728110b72SMatheus Ferst     const target_long idx = index;                                             \
145828110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *a, *b };                                             \
145928110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
146028110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
146128110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2 - SIZE], (void *)tmp + idx, SIZE); \
146228110b72SMatheus Ferst     } else {                                                                   \
146328110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
146428110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
146528110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
146628110b72SMatheus Ferst     }                                                                          \
146728110b72SMatheus Ferst }
146828110b72SMatheus Ferst #else
146928110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
147028110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
147128110b72SMatheus Ferst                    target_ulong index)                                         \
147228110b72SMatheus Ferst {                                                                              \
147328110b72SMatheus Ferst     const target_long idx = index;                                             \
147428110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *b, *a };                                             \
147528110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
147628110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
147728110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2],                                  \
147828110b72SMatheus Ferst                (void *)tmp + sizeof(tmp) - SIZE - idx, SIZE);                  \
147928110b72SMatheus Ferst     } else {                                                                   \
148028110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
148128110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
148228110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
148328110b72SMatheus Ferst     }                                                                          \
148428110b72SMatheus Ferst }
148528110b72SMatheus Ferst #endif
148628110b72SMatheus Ferst VEXTDVLX(VEXTDUBVLX, 1)
148728110b72SMatheus Ferst VEXTDVLX(VEXTDUHVLX, 2)
148828110b72SMatheus Ferst VEXTDVLX(VEXTDUWVLX, 4)
148928110b72SMatheus Ferst VEXTDVLX(VEXTDDVLX, 8)
149028110b72SMatheus Ferst #undef VEXTDVLX
149128110b72SMatheus Ferst #if defined(HOST_WORDS_BIGENDIAN)
1492fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1493fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1494fcf5ef2aSThomas Huth     {                                                                        \
1495fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1496fcf5ef2aSThomas Huth         memmove(&r->u8[8 - es], &b->u8[index], es);                          \
1497fcf5ef2aSThomas Huth         memset(&r->u8[8], 0, 8);                                             \
1498fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8 - es);                                        \
1499fcf5ef2aSThomas Huth     }
1500fcf5ef2aSThomas Huth #else
1501fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1502fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1503fcf5ef2aSThomas Huth     {                                                                        \
1504fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1505fcf5ef2aSThomas Huth         uint32_t s = (16 - index) - es;                                      \
1506fcf5ef2aSThomas Huth         memmove(&r->u8[8], &b->u8[s], es);                                   \
1507fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8);                                             \
1508fcf5ef2aSThomas Huth         memset(&r->u8[8 + es], 0, 8 - es);                                   \
1509fcf5ef2aSThomas Huth     }
1510fcf5ef2aSThomas Huth #endif
1511fcf5ef2aSThomas Huth VEXTRACT(ub, u8)
1512fcf5ef2aSThomas Huth VEXTRACT(uh, u16)
1513fcf5ef2aSThomas Huth VEXTRACT(uw, u32)
1514fcf5ef2aSThomas Huth VEXTRACT(d, u64)
1515fcf5ef2aSThomas Huth #undef VEXTRACT
1516fcf5ef2aSThomas Huth 
1517fb5303ccSMatheus Ferst #define VSTRI(NAME, ELEM, NUM_ELEMS, LEFT) \
1518fb5303ccSMatheus Ferst uint32_t helper_##NAME(ppc_avr_t *t, ppc_avr_t *b) \
1519fb5303ccSMatheus Ferst {                                                   \
1520fb5303ccSMatheus Ferst     int i, idx, crf = 0;                            \
1521fb5303ccSMatheus Ferst                                                     \
1522fb5303ccSMatheus Ferst     for (i = 0; i < NUM_ELEMS; i++) {               \
1523fb5303ccSMatheus Ferst         idx = LEFT ? i : NUM_ELEMS - i - 1;         \
1524fb5303ccSMatheus Ferst         if (b->Vsr##ELEM(idx)) {                    \
1525fb5303ccSMatheus Ferst             t->Vsr##ELEM(idx) = b->Vsr##ELEM(idx);  \
1526fb5303ccSMatheus Ferst         } else {                                    \
1527fb5303ccSMatheus Ferst             crf = 0b0010;                           \
1528fb5303ccSMatheus Ferst             break;                                  \
1529fb5303ccSMatheus Ferst         }                                           \
1530fb5303ccSMatheus Ferst     }                                               \
1531fb5303ccSMatheus Ferst                                                     \
1532fb5303ccSMatheus Ferst     for (; i < NUM_ELEMS; i++) {                    \
1533fb5303ccSMatheus Ferst         idx = LEFT ? i : NUM_ELEMS - i - 1;         \
1534fb5303ccSMatheus Ferst         t->Vsr##ELEM(idx) = 0;                      \
1535fb5303ccSMatheus Ferst     }                                               \
1536fb5303ccSMatheus Ferst                                                     \
1537fb5303ccSMatheus Ferst     return crf;                                     \
1538fb5303ccSMatheus Ferst }
1539fb5303ccSMatheus Ferst VSTRI(VSTRIBL, B, 16, true)
1540fb5303ccSMatheus Ferst VSTRI(VSTRIBR, B, 16, false)
1541fb5303ccSMatheus Ferst VSTRI(VSTRIHL, H, 8, true)
1542fb5303ccSMatheus Ferst VSTRI(VSTRIHR, H, 8, false)
1543fb5303ccSMatheus Ferst #undef VSTRI
1544fb5303ccSMatheus Ferst 
15455ba5335dSMark Cave-Ayland void helper_xxextractuw(CPUPPCState *env, ppc_vsr_t *xt,
15465ba5335dSMark Cave-Ayland                         ppc_vsr_t *xb, uint32_t index)
15478ad901e5SNikunj A Dadhania {
154803b32c09SMark Cave-Ayland     ppc_vsr_t t = { };
15498ad901e5SNikunj A Dadhania     size_t es = sizeof(uint32_t);
15508ad901e5SNikunj A Dadhania     uint32_t ext_index;
15518ad901e5SNikunj A Dadhania     int i;
15528ad901e5SNikunj A Dadhania 
15538ad901e5SNikunj A Dadhania     ext_index = index;
15548ad901e5SNikunj A Dadhania     for (i = 0; i < es; i++, ext_index++) {
155503b32c09SMark Cave-Ayland         t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16);
15568ad901e5SNikunj A Dadhania     }
15578ad901e5SNikunj A Dadhania 
155803b32c09SMark Cave-Ayland     *xt = t;
15598ad901e5SNikunj A Dadhania }
15608ad901e5SNikunj A Dadhania 
15615ba5335dSMark Cave-Ayland void helper_xxinsertw(CPUPPCState *env, ppc_vsr_t *xt,
15625ba5335dSMark Cave-Ayland                       ppc_vsr_t *xb, uint32_t index)
15633398b742SNikunj A Dadhania {
156403b32c09SMark Cave-Ayland     ppc_vsr_t t = *xt;
15653398b742SNikunj A Dadhania     size_t es = sizeof(uint32_t);
15663398b742SNikunj A Dadhania     int ins_index, i = 0;
15673398b742SNikunj A Dadhania 
15683398b742SNikunj A Dadhania     ins_index = index;
15693398b742SNikunj A Dadhania     for (i = 0; i < es && ins_index < 16; i++, ins_index++) {
157003b32c09SMark Cave-Ayland         t.VsrB(ins_index) = xb->VsrB(8 - es + i);
15713398b742SNikunj A Dadhania     }
15723398b742SNikunj A Dadhania 
157303b32c09SMark Cave-Ayland     *xt = t;
15743398b742SNikunj A Dadhania }
15753398b742SNikunj A Dadhania 
1576*1015fcabSMatheus Ferst void helper_XXEVAL(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c,
1577*1015fcabSMatheus Ferst                    uint32_t desc)
1578*1015fcabSMatheus Ferst {
1579*1015fcabSMatheus Ferst     /*
1580*1015fcabSMatheus Ferst      * Instead of processing imm bit-by-bit, we'll skip the computation of
1581*1015fcabSMatheus Ferst      * conjunctions whose corresponding bit is unset.
1582*1015fcabSMatheus Ferst      */
1583*1015fcabSMatheus Ferst     int bit, imm = simd_data(desc);
1584*1015fcabSMatheus Ferst     Int128 conj, disj = int128_zero();
1585*1015fcabSMatheus Ferst 
1586*1015fcabSMatheus Ferst     /* Iterate over set bits from the least to the most significant bit */
1587*1015fcabSMatheus Ferst     while (imm) {
1588*1015fcabSMatheus Ferst         /*
1589*1015fcabSMatheus Ferst          * Get the next bit to be processed with ctz64. Invert the result of
1590*1015fcabSMatheus Ferst          * ctz64 to match the indexing used by PowerISA.
1591*1015fcabSMatheus Ferst          */
1592*1015fcabSMatheus Ferst         bit = 7 - ctzl(imm);
1593*1015fcabSMatheus Ferst         if (bit & 0x4) {
1594*1015fcabSMatheus Ferst             conj = a->s128;
1595*1015fcabSMatheus Ferst         } else {
1596*1015fcabSMatheus Ferst             conj = int128_not(a->s128);
1597*1015fcabSMatheus Ferst         }
1598*1015fcabSMatheus Ferst         if (bit & 0x2) {
1599*1015fcabSMatheus Ferst             conj = int128_and(conj, b->s128);
1600*1015fcabSMatheus Ferst         } else {
1601*1015fcabSMatheus Ferst             conj = int128_and(conj, int128_not(b->s128));
1602*1015fcabSMatheus Ferst         }
1603*1015fcabSMatheus Ferst         if (bit & 0x1) {
1604*1015fcabSMatheus Ferst             conj = int128_and(conj, c->s128);
1605*1015fcabSMatheus Ferst         } else {
1606*1015fcabSMatheus Ferst             conj = int128_and(conj, int128_not(c->s128));
1607*1015fcabSMatheus Ferst         }
1608*1015fcabSMatheus Ferst         disj = int128_or(disj, conj);
1609*1015fcabSMatheus Ferst 
1610*1015fcabSMatheus Ferst         /* Unset the least significant bit that is set */
1611*1015fcabSMatheus Ferst         imm &= imm - 1;
1612*1015fcabSMatheus Ferst     }
1613*1015fcabSMatheus Ferst 
1614*1015fcabSMatheus Ferst     t->s128 = disj;
1615*1015fcabSMatheus Ferst }
1616*1015fcabSMatheus Ferst 
1617788c6399SMatheus Ferst #define XXBLEND(name, sz) \
1618788c6399SMatheus Ferst void glue(helper_XXBLENDV, name)(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b,  \
1619788c6399SMatheus Ferst                                  ppc_avr_t *c, uint32_t desc)               \
1620788c6399SMatheus Ferst {                                                                           \
1621788c6399SMatheus Ferst     for (int i = 0; i < ARRAY_SIZE(t->glue(u, sz)); i++) {                  \
1622788c6399SMatheus Ferst         t->glue(u, sz)[i] = (c->glue(s, sz)[i] >> (sz - 1)) ?               \
1623788c6399SMatheus Ferst             b->glue(u, sz)[i] : a->glue(u, sz)[i];                          \
1624788c6399SMatheus Ferst     }                                                                       \
1625788c6399SMatheus Ferst }
1626788c6399SMatheus Ferst XXBLEND(B, 8)
1627788c6399SMatheus Ferst XXBLEND(H, 16)
1628788c6399SMatheus Ferst XXBLEND(W, 32)
1629788c6399SMatheus Ferst XXBLEND(D, 64)
1630788c6399SMatheus Ferst #undef XXBLEND
1631788c6399SMatheus Ferst 
1632fcf5ef2aSThomas Huth #define VNEG(name, element)                                         \
1633fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b)                      \
1634fcf5ef2aSThomas Huth {                                                                   \
1635fcf5ef2aSThomas Huth     int i;                                                          \
163660594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
1637fcf5ef2aSThomas Huth         r->element[i] = -b->element[i];                             \
1638fcf5ef2aSThomas Huth     }                                                               \
1639fcf5ef2aSThomas Huth }
1640fcf5ef2aSThomas Huth VNEG(vnegw, s32)
1641fcf5ef2aSThomas Huth VNEG(vnegd, s64)
1642fcf5ef2aSThomas Huth #undef VNEG
1643fcf5ef2aSThomas Huth 
1644fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1645fcf5ef2aSThomas Huth {
16463c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1647fcf5ef2aSThomas Huth 
1648fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1649fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1650fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1651fcf5ef2aSThomas Huth #else
1652fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1653fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1654fcf5ef2aSThomas Huth #endif
1655fcf5ef2aSThomas Huth }
1656fcf5ef2aSThomas Huth 
1657fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1658fcf5ef2aSThomas Huth {
1659fcf5ef2aSThomas Huth     int i;
1660fcf5ef2aSThomas Huth 
1661fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
1662fcf5ef2aSThomas Huth         r->u32[i] = a->u32[i] >= b->u32[i];
1663fcf5ef2aSThomas Huth     }
1664fcf5ef2aSThomas Huth }
1665fcf5ef2aSThomas Huth 
1666fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1667fcf5ef2aSThomas Huth {
1668fcf5ef2aSThomas Huth     int64_t t;
1669fcf5ef2aSThomas Huth     int i, upper;
1670fcf5ef2aSThomas Huth     ppc_avr_t result;
1671fcf5ef2aSThomas Huth     int sat = 0;
1672fcf5ef2aSThomas Huth 
1673fcf5ef2aSThomas Huth     upper = ARRAY_SIZE(r->s32) - 1;
167460594feaSMark Cave-Ayland     t = (int64_t)b->VsrSW(upper);
1675fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
167660594feaSMark Cave-Ayland         t += a->VsrSW(i);
167760594feaSMark Cave-Ayland         result.VsrSW(i) = 0;
1678fcf5ef2aSThomas Huth     }
167960594feaSMark Cave-Ayland     result.VsrSW(upper) = cvtsdsw(t, &sat);
1680fcf5ef2aSThomas Huth     *r = result;
1681fcf5ef2aSThomas Huth 
1682fcf5ef2aSThomas Huth     if (sat) {
16836175f5a0SRichard Henderson         set_vscr_sat(env);
1684fcf5ef2aSThomas Huth     }
1685fcf5ef2aSThomas Huth }
1686fcf5ef2aSThomas Huth 
1687fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1688fcf5ef2aSThomas Huth {
1689fcf5ef2aSThomas Huth     int i, j, upper;
1690fcf5ef2aSThomas Huth     ppc_avr_t result;
1691fcf5ef2aSThomas Huth     int sat = 0;
1692fcf5ef2aSThomas Huth 
1693fcf5ef2aSThomas Huth     upper = 1;
1694fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
169560594feaSMark Cave-Ayland         int64_t t = (int64_t)b->VsrSW(upper + i * 2);
1696fcf5ef2aSThomas Huth 
16977fa0ddc1SAnton Blanchard         result.VsrD(i) = 0;
1698fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u64); j++) {
169960594feaSMark Cave-Ayland             t += a->VsrSW(2 * i + j);
1700fcf5ef2aSThomas Huth         }
170160594feaSMark Cave-Ayland         result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat);
1702fcf5ef2aSThomas Huth     }
1703fcf5ef2aSThomas Huth 
1704fcf5ef2aSThomas Huth     *r = result;
1705fcf5ef2aSThomas Huth     if (sat) {
17066175f5a0SRichard Henderson         set_vscr_sat(env);
1707fcf5ef2aSThomas Huth     }
1708fcf5ef2aSThomas Huth }
1709fcf5ef2aSThomas Huth 
1710fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1711fcf5ef2aSThomas Huth {
1712fcf5ef2aSThomas Huth     int i, j;
1713fcf5ef2aSThomas Huth     int sat = 0;
1714fcf5ef2aSThomas Huth 
1715fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1716fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1717fcf5ef2aSThomas Huth 
1718fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->s32); j++) {
1719fcf5ef2aSThomas Huth             t += a->s8[4 * i + j];
1720fcf5ef2aSThomas Huth         }
1721fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1722fcf5ef2aSThomas Huth     }
1723fcf5ef2aSThomas Huth 
1724fcf5ef2aSThomas Huth     if (sat) {
17256175f5a0SRichard Henderson         set_vscr_sat(env);
1726fcf5ef2aSThomas Huth     }
1727fcf5ef2aSThomas Huth }
1728fcf5ef2aSThomas Huth 
1729fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1730fcf5ef2aSThomas Huth {
1731fcf5ef2aSThomas Huth     int sat = 0;
1732fcf5ef2aSThomas Huth     int i;
1733fcf5ef2aSThomas Huth 
1734fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1735fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1736fcf5ef2aSThomas Huth 
1737fcf5ef2aSThomas Huth         t += a->s16[2 * i] + a->s16[2 * i + 1];
1738fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1739fcf5ef2aSThomas Huth     }
1740fcf5ef2aSThomas Huth 
1741fcf5ef2aSThomas Huth     if (sat) {
17426175f5a0SRichard Henderson         set_vscr_sat(env);
1743fcf5ef2aSThomas Huth     }
1744fcf5ef2aSThomas Huth }
1745fcf5ef2aSThomas Huth 
1746fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1747fcf5ef2aSThomas Huth {
1748fcf5ef2aSThomas Huth     int i, j;
1749fcf5ef2aSThomas Huth     int sat = 0;
1750fcf5ef2aSThomas Huth 
1751fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
1752fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)b->u32[i];
1753fcf5ef2aSThomas Huth 
1754fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u32); j++) {
1755fcf5ef2aSThomas Huth             t += a->u8[4 * i + j];
1756fcf5ef2aSThomas Huth         }
1757fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
1758fcf5ef2aSThomas Huth     }
1759fcf5ef2aSThomas Huth 
1760fcf5ef2aSThomas Huth     if (sat) {
17616175f5a0SRichard Henderson         set_vscr_sat(env);
1762fcf5ef2aSThomas Huth     }
1763fcf5ef2aSThomas Huth }
1764fcf5ef2aSThomas Huth 
1765fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1766fcf5ef2aSThomas Huth #define UPKHI 1
1767fcf5ef2aSThomas Huth #define UPKLO 0
1768fcf5ef2aSThomas Huth #else
1769fcf5ef2aSThomas Huth #define UPKHI 0
1770fcf5ef2aSThomas Huth #define UPKLO 1
1771fcf5ef2aSThomas Huth #endif
1772fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi)                                              \
1773fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
1774fcf5ef2aSThomas Huth     {                                                                   \
1775fcf5ef2aSThomas Huth         int i;                                                          \
1776fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1777fcf5ef2aSThomas Huth                                                                         \
1778fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->u32); i++) {                      \
1779fcf5ef2aSThomas Huth             uint16_t e = b->u16[hi ? i : i + 4];                        \
1780fcf5ef2aSThomas Huth             uint8_t a = (e >> 15) ? 0xff : 0;                           \
1781fcf5ef2aSThomas Huth             uint8_t r = (e >> 10) & 0x1f;                               \
1782fcf5ef2aSThomas Huth             uint8_t g = (e >> 5) & 0x1f;                                \
1783fcf5ef2aSThomas Huth             uint8_t b = e & 0x1f;                                       \
1784fcf5ef2aSThomas Huth                                                                         \
1785fcf5ef2aSThomas Huth             result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b;       \
1786fcf5ef2aSThomas Huth         }                                                               \
1787fcf5ef2aSThomas Huth         *r = result;                                                    \
1788fcf5ef2aSThomas Huth     }
1789fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO)
1790fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI)
1791fcf5ef2aSThomas Huth #undef VUPKPX
1792fcf5ef2aSThomas Huth 
1793fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi)                              \
1794fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
1795fcf5ef2aSThomas Huth     {                                                                   \
1796fcf5ef2aSThomas Huth         int i;                                                          \
1797fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1798fcf5ef2aSThomas Huth                                                                         \
1799fcf5ef2aSThomas Huth         if (hi) {                                                       \
1800fcf5ef2aSThomas Huth             for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) {             \
1801fcf5ef2aSThomas Huth                 result.unpacked[i] = b->packee[i];                      \
1802fcf5ef2aSThomas Huth             }                                                           \
1803fcf5ef2aSThomas Huth         } else {                                                        \
1804fcf5ef2aSThomas Huth             for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \
1805fcf5ef2aSThomas Huth                  i++) {                                                 \
1806fcf5ef2aSThomas Huth                 result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \
1807fcf5ef2aSThomas Huth             }                                                           \
1808fcf5ef2aSThomas Huth         }                                                               \
1809fcf5ef2aSThomas Huth         *r = result;                                                    \
1810fcf5ef2aSThomas Huth     }
1811fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI)
1812fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI)
1813fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI)
1814fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO)
1815fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO)
1816fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO)
1817fcf5ef2aSThomas Huth #undef VUPK
1818fcf5ef2aSThomas Huth #undef UPKHI
1819fcf5ef2aSThomas Huth #undef UPKLO
1820fcf5ef2aSThomas Huth 
1821fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element)                                      \
1822fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *b)                     \
1823fcf5ef2aSThomas Huth     {                                                                   \
1824fcf5ef2aSThomas Huth         int i;                                                          \
1825fcf5ef2aSThomas Huth                                                                         \
182660594feaSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
1827fcf5ef2aSThomas Huth             r->element[i] = name(b->element[i]);                        \
1828fcf5ef2aSThomas Huth         }                                                               \
1829fcf5ef2aSThomas Huth     }
1830fcf5ef2aSThomas Huth 
1831fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8)
1832fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16)
1833fcf5ef2aSThomas Huth 
1834fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8)
1835fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16)
1836fcf5ef2aSThomas Huth 
1837fcf5ef2aSThomas Huth #undef clzb
1838fcf5ef2aSThomas Huth #undef clzh
1839fcf5ef2aSThomas Huth 
1840fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8)
1841fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16)
1842fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v))
1843fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v))
1844fcf5ef2aSThomas Huth 
1845fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8)
1846fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16)
1847fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32)
1848fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64)
1849fcf5ef2aSThomas Huth 
1850fcf5ef2aSThomas Huth #undef ctzb
1851fcf5ef2aSThomas Huth #undef ctzh
1852fcf5ef2aSThomas Huth #undef ctzw
1853fcf5ef2aSThomas Huth #undef ctzd
1854fcf5ef2aSThomas Huth 
1855fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v)
1856fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v)
1857fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v)
1858fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v)
1859fcf5ef2aSThomas Huth 
1860fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8)
1861fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16)
1862fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32)
1863fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64)
1864fcf5ef2aSThomas Huth 
1865fcf5ef2aSThomas Huth #undef popcntb
1866fcf5ef2aSThomas Huth #undef popcnth
1867fcf5ef2aSThomas Huth #undef popcntw
1868fcf5ef2aSThomas Huth #undef popcntd
1869fcf5ef2aSThomas Huth 
1870fcf5ef2aSThomas Huth #undef VGENERIC_DO
1871fcf5ef2aSThomas Huth 
/*
 * Initializer for a ppc_avr_t whose only non-zero u64 element holds 1; the
 * position of that element depends on host endianness. It is used as the
 * "+ 1" addend by the code paths built without CONFIG_INT128.
 */
#if !defined(HOST_WORDS_BIGENDIAN)
#define QW_ONE { .u64 = { 1, 0 } }
#else
#define QW_ONE { .u64 = { 0, 1 } }
#endif
1877fcf5ef2aSThomas Huth 
1878fcf5ef2aSThomas Huth #ifndef CONFIG_INT128
1879fcf5ef2aSThomas Huth 
1880fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a)
1881fcf5ef2aSThomas Huth {
1882fcf5ef2aSThomas Huth     t->u64[0] = ~a.u64[0];
1883fcf5ef2aSThomas Huth     t->u64[1] = ~a.u64[1];
1884fcf5ef2aSThomas Huth }
1885fcf5ef2aSThomas Huth 
1886fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b)
1887fcf5ef2aSThomas Huth {
18883c385a93SMark Cave-Ayland     if (a.VsrD(0) < b.VsrD(0)) {
1889fcf5ef2aSThomas Huth         return -1;
18903c385a93SMark Cave-Ayland     } else if (a.VsrD(0) > b.VsrD(0)) {
1891fcf5ef2aSThomas Huth         return 1;
18923c385a93SMark Cave-Ayland     } else if (a.VsrD(1) < b.VsrD(1)) {
1893fcf5ef2aSThomas Huth         return -1;
18943c385a93SMark Cave-Ayland     } else if (a.VsrD(1) > b.VsrD(1)) {
1895fcf5ef2aSThomas Huth         return 1;
1896fcf5ef2aSThomas Huth     } else {
1897fcf5ef2aSThomas Huth         return 0;
1898fcf5ef2aSThomas Huth     }
1899fcf5ef2aSThomas Huth }
1900fcf5ef2aSThomas Huth 
1901fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b)
1902fcf5ef2aSThomas Huth {
19033c385a93SMark Cave-Ayland     t->VsrD(1) = a.VsrD(1) + b.VsrD(1);
19043c385a93SMark Cave-Ayland     t->VsrD(0) = a.VsrD(0) + b.VsrD(0) +
19053c385a93SMark Cave-Ayland                      (~a.VsrD(1) < b.VsrD(1));
1906fcf5ef2aSThomas Huth }
1907fcf5ef2aSThomas Huth 
1908fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b)
1909fcf5ef2aSThomas Huth {
1910fcf5ef2aSThomas Huth     ppc_avr_t not_a;
19113c385a93SMark Cave-Ayland     t->VsrD(1) = a.VsrD(1) + b.VsrD(1);
19123c385a93SMark Cave-Ayland     t->VsrD(0) = a.VsrD(0) + b.VsrD(0) +
19133c385a93SMark Cave-Ayland                      (~a.VsrD(1) < b.VsrD(1));
1914fcf5ef2aSThomas Huth     avr_qw_not(&not_a, a);
1915fcf5ef2aSThomas Huth     return avr_qw_cmpu(not_a, b) < 0;
1916fcf5ef2aSThomas Huth }
1917fcf5ef2aSThomas Huth 
1918fcf5ef2aSThomas Huth #endif
1919fcf5ef2aSThomas Huth 
1920fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1921fcf5ef2aSThomas Huth {
1922fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1923fcf5ef2aSThomas Huth     r->u128 = a->u128 + b->u128;
1924fcf5ef2aSThomas Huth #else
1925fcf5ef2aSThomas Huth     avr_qw_add(r, *a, *b);
1926fcf5ef2aSThomas Huth #endif
1927fcf5ef2aSThomas Huth }
1928fcf5ef2aSThomas Huth 
1929fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1930fcf5ef2aSThomas Huth {
1931fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1932fcf5ef2aSThomas Huth     r->u128 = a->u128 + b->u128 + (c->u128 & 1);
1933fcf5ef2aSThomas Huth #else
1934fcf5ef2aSThomas Huth 
19353c385a93SMark Cave-Ayland     if (c->VsrD(1) & 1) {
1936fcf5ef2aSThomas Huth         ppc_avr_t tmp;
1937fcf5ef2aSThomas Huth 
19383c385a93SMark Cave-Ayland         tmp.VsrD(0) = 0;
19393c385a93SMark Cave-Ayland         tmp.VsrD(1) = c->VsrD(1) & 1;
1940fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
1941fcf5ef2aSThomas Huth         avr_qw_add(r, tmp, *b);
1942fcf5ef2aSThomas Huth     } else {
1943fcf5ef2aSThomas Huth         avr_qw_add(r, *a, *b);
1944fcf5ef2aSThomas Huth     }
1945fcf5ef2aSThomas Huth #endif
1946fcf5ef2aSThomas Huth }
1947fcf5ef2aSThomas Huth 
1948fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1949fcf5ef2aSThomas Huth {
1950fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1951fcf5ef2aSThomas Huth     r->u128 = (~a->u128 < b->u128);
1952fcf5ef2aSThomas Huth #else
1953fcf5ef2aSThomas Huth     ppc_avr_t not_a;
1954fcf5ef2aSThomas Huth 
1955fcf5ef2aSThomas Huth     avr_qw_not(&not_a, *a);
1956fcf5ef2aSThomas Huth 
19573c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
19583c385a93SMark Cave-Ayland     r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0);
1959fcf5ef2aSThomas Huth #endif
1960fcf5ef2aSThomas Huth }
1961fcf5ef2aSThomas Huth 
1962fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1963fcf5ef2aSThomas Huth {
1964fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1965fcf5ef2aSThomas Huth     int carry_out = (~a->u128 < b->u128);
1966fcf5ef2aSThomas Huth     if (!carry_out && (c->u128 & 1)) {
1967fcf5ef2aSThomas Huth         carry_out = ((a->u128 + b->u128 + 1) == 0) &&
1968fcf5ef2aSThomas Huth                     ((a->u128 != 0) || (b->u128 != 0));
1969fcf5ef2aSThomas Huth     }
1970fcf5ef2aSThomas Huth     r->u128 = carry_out;
1971fcf5ef2aSThomas Huth #else
1972fcf5ef2aSThomas Huth 
19733c385a93SMark Cave-Ayland     int carry_in = c->VsrD(1) & 1;
1974fcf5ef2aSThomas Huth     int carry_out = 0;
1975fcf5ef2aSThomas Huth     ppc_avr_t tmp;
1976fcf5ef2aSThomas Huth 
1977fcf5ef2aSThomas Huth     carry_out = avr_qw_addc(&tmp, *a, *b);
1978fcf5ef2aSThomas Huth 
1979fcf5ef2aSThomas Huth     if (!carry_out && carry_in) {
1980fcf5ef2aSThomas Huth         ppc_avr_t one = QW_ONE;
1981fcf5ef2aSThomas Huth         carry_out = avr_qw_addc(&tmp, tmp, one);
1982fcf5ef2aSThomas Huth     }
19833c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
19843c385a93SMark Cave-Ayland     r->VsrD(1) = carry_out;
1985fcf5ef2aSThomas Huth #endif
1986fcf5ef2aSThomas Huth }
1987fcf5ef2aSThomas Huth 
1988fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1989fcf5ef2aSThomas Huth {
1990fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1991fcf5ef2aSThomas Huth     r->u128 = a->u128 - b->u128;
1992fcf5ef2aSThomas Huth #else
1993fcf5ef2aSThomas Huth     ppc_avr_t tmp;
1994fcf5ef2aSThomas Huth     ppc_avr_t one = QW_ONE;
1995fcf5ef2aSThomas Huth 
1996fcf5ef2aSThomas Huth     avr_qw_not(&tmp, *b);
1997fcf5ef2aSThomas Huth     avr_qw_add(&tmp, *a, tmp);
1998fcf5ef2aSThomas Huth     avr_qw_add(r, tmp, one);
1999fcf5ef2aSThomas Huth #endif
2000fcf5ef2aSThomas Huth }
2001fcf5ef2aSThomas Huth 
2002fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2003fcf5ef2aSThomas Huth {
2004fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2005fcf5ef2aSThomas Huth     r->u128 = a->u128 + ~b->u128 + (c->u128 & 1);
2006fcf5ef2aSThomas Huth #else
2007fcf5ef2aSThomas Huth     ppc_avr_t tmp, sum;
2008fcf5ef2aSThomas Huth 
2009fcf5ef2aSThomas Huth     avr_qw_not(&tmp, *b);
2010fcf5ef2aSThomas Huth     avr_qw_add(&sum, *a, tmp);
2011fcf5ef2aSThomas Huth 
20123c385a93SMark Cave-Ayland     tmp.VsrD(0) = 0;
20133c385a93SMark Cave-Ayland     tmp.VsrD(1) = c->VsrD(1) & 1;
2014fcf5ef2aSThomas Huth     avr_qw_add(r, sum, tmp);
2015fcf5ef2aSThomas Huth #endif
2016fcf5ef2aSThomas Huth }
2017fcf5ef2aSThomas Huth 
2018fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2019fcf5ef2aSThomas Huth {
2020fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2021fcf5ef2aSThomas Huth     r->u128 = (~a->u128 < ~b->u128) ||
2022fcf5ef2aSThomas Huth                  (a->u128 + ~b->u128 == (__uint128_t)-1);
2023fcf5ef2aSThomas Huth #else
2024fcf5ef2aSThomas Huth     int carry = (avr_qw_cmpu(*a, *b) > 0);
2025fcf5ef2aSThomas Huth     if (!carry) {
2026fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2027fcf5ef2aSThomas Huth         avr_qw_not(&tmp, *b);
2028fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
20293c385a93SMark Cave-Ayland         carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull));
2030fcf5ef2aSThomas Huth     }
20313c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
20323c385a93SMark Cave-Ayland     r->VsrD(1) = carry;
2033fcf5ef2aSThomas Huth #endif
2034fcf5ef2aSThomas Huth }
2035fcf5ef2aSThomas Huth 
2036fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2037fcf5ef2aSThomas Huth {
2038fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2039fcf5ef2aSThomas Huth     r->u128 =
2040fcf5ef2aSThomas Huth         (~a->u128 < ~b->u128) ||
2041fcf5ef2aSThomas Huth         ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1));
2042fcf5ef2aSThomas Huth #else
20433c385a93SMark Cave-Ayland     int carry_in = c->VsrD(1) & 1;
2044fcf5ef2aSThomas Huth     int carry_out = (avr_qw_cmpu(*a, *b) > 0);
2045fcf5ef2aSThomas Huth     if (!carry_out && carry_in) {
2046fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2047fcf5ef2aSThomas Huth         avr_qw_not(&tmp, *b);
2048fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
20493c385a93SMark Cave-Ayland         carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull));
2050fcf5ef2aSThomas Huth     }
2051fcf5ef2aSThomas Huth 
20523c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
20533c385a93SMark Cave-Ayland     r->VsrD(1) = carry_out;
2054fcf5ef2aSThomas Huth #endif
2055fcf5ef2aSThomas Huth }
2056fcf5ef2aSThomas Huth 
/* Sign codes held in the low nibble of the last byte of a packed BCD value */

/* Codes read as "plus" */
#define BCD_PLUS_PREF_1 0xC
#define BCD_PLUS_PREF_2 0xF
#define BCD_PLUS_ALT_1  0xA
#define BCD_PLUS_ALT_2  0xE

/* Codes read as "minus" */
#define BCD_NEG_PREF    0xD
#define BCD_NEG_ALT     0xB

/* Sign characters of the national format: the codes of '+' and '-' */
#define NATIONAL_PLUS   0x2B
#define NATIONAL_NEG    0x2D

/* VsrB() index of the byte holding nibble n; nibbles 0 and 1 share VsrB(15) */
#define BCD_DIG_BYTE(n) (15 - ((n) / 2))
2067fcf5ef2aSThomas Huth 
2068fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd)
2069fcf5ef2aSThomas Huth {
2070428115c3SMark Cave-Ayland     switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) {
2071fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_1:
2072fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_2:
2073fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_1:
2074fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_2:
2075fcf5ef2aSThomas Huth     {
2076fcf5ef2aSThomas Huth         return 1;
2077fcf5ef2aSThomas Huth     }
2078fcf5ef2aSThomas Huth 
2079fcf5ef2aSThomas Huth     case BCD_NEG_PREF:
2080fcf5ef2aSThomas Huth     case BCD_NEG_ALT:
2081fcf5ef2aSThomas Huth     {
2082fcf5ef2aSThomas Huth         return -1;
2083fcf5ef2aSThomas Huth     }
2084fcf5ef2aSThomas Huth 
2085fcf5ef2aSThomas Huth     default:
2086fcf5ef2aSThomas Huth     {
2087fcf5ef2aSThomas Huth         return 0;
2088fcf5ef2aSThomas Huth     }
2089fcf5ef2aSThomas Huth     }
2090fcf5ef2aSThomas Huth }
2091fcf5ef2aSThomas Huth 
2092fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps)
2093fcf5ef2aSThomas Huth {
2094fcf5ef2aSThomas Huth     if (sgn >= 0) {
2095fcf5ef2aSThomas Huth         return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2;
2096fcf5ef2aSThomas Huth     } else {
2097fcf5ef2aSThomas Huth         return BCD_NEG_PREF;
2098fcf5ef2aSThomas Huth     }
2099fcf5ef2aSThomas Huth }
2100fcf5ef2aSThomas Huth 
2101fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid)
2102fcf5ef2aSThomas Huth {
2103fcf5ef2aSThomas Huth     uint8_t result;
2104fcf5ef2aSThomas Huth     if (n & 1) {
2105428115c3SMark Cave-Ayland         result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4;
2106fcf5ef2aSThomas Huth     } else {
2107428115c3SMark Cave-Ayland        result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF;
2108fcf5ef2aSThomas Huth     }
2109fcf5ef2aSThomas Huth 
2110fcf5ef2aSThomas Huth     if (unlikely(result > 9)) {
2111fcf5ef2aSThomas Huth         *invalid = true;
2112fcf5ef2aSThomas Huth     }
2113fcf5ef2aSThomas Huth     return result;
2114fcf5ef2aSThomas Huth }
2115fcf5ef2aSThomas Huth 
2116fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n)
2117fcf5ef2aSThomas Huth {
2118fcf5ef2aSThomas Huth     if (n & 1) {
2119428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F;
2120428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4);
2121fcf5ef2aSThomas Huth     } else {
2122428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0;
2123428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= digit;
2124fcf5ef2aSThomas Huth     }
2125fcf5ef2aSThomas Huth }
2126fcf5ef2aSThomas Huth 
2127071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd)
2128071663dfSJose Ricardo Ziviani {
2129071663dfSJose Ricardo Ziviani     int i;
2130071663dfSJose Ricardo Ziviani     int invalid = 0;
2131071663dfSJose Ricardo Ziviani 
2132071663dfSJose Ricardo Ziviani     if (bcd_get_sgn(bcd) == 0) {
2133071663dfSJose Ricardo Ziviani         return false;
2134071663dfSJose Ricardo Ziviani     }
2135071663dfSJose Ricardo Ziviani 
2136071663dfSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2137071663dfSJose Ricardo Ziviani         bcd_get_digit(bcd, i, &invalid);
2138071663dfSJose Ricardo Ziviani         if (unlikely(invalid)) {
2139071663dfSJose Ricardo Ziviani             return false;
2140071663dfSJose Ricardo Ziviani         }
2141071663dfSJose Ricardo Ziviani     }
2142071663dfSJose Ricardo Ziviani     return true;
2143071663dfSJose Ricardo Ziviani }
2144071663dfSJose Ricardo Ziviani 
2145fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd)
2146fcf5ef2aSThomas Huth {
21473c385a93SMark Cave-Ayland     if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) {
2148efa73196SNikunj A Dadhania         return CRF_EQ;
2149fcf5ef2aSThomas Huth     } else {
2150efa73196SNikunj A Dadhania         return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT;
2151fcf5ef2aSThomas Huth     }
2152fcf5ef2aSThomas Huth }
2153fcf5ef2aSThomas Huth 
2154fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n)
2155fcf5ef2aSThomas Huth {
215660594feaSMark Cave-Ayland     return reg->VsrH(7 - n);
2157fcf5ef2aSThomas Huth }
2158fcf5ef2aSThomas Huth 
2159fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n)
2160fcf5ef2aSThomas Huth {
216160594feaSMark Cave-Ayland     reg->VsrH(7 - n) = val;
2162fcf5ef2aSThomas Huth }
2163fcf5ef2aSThomas Huth 
2164fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b)
2165fcf5ef2aSThomas Huth {
2166fcf5ef2aSThomas Huth     int i;
2167fcf5ef2aSThomas Huth     int invalid = 0;
2168fcf5ef2aSThomas Huth     for (i = 31; i > 0; i--) {
2169fcf5ef2aSThomas Huth         uint8_t dig_a = bcd_get_digit(a, i, &invalid);
2170fcf5ef2aSThomas Huth         uint8_t dig_b = bcd_get_digit(b, i, &invalid);
2171fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2172fcf5ef2aSThomas Huth             return 0; /* doesn't matter */
2173fcf5ef2aSThomas Huth         } else if (dig_a > dig_b) {
2174fcf5ef2aSThomas Huth             return 1;
2175fcf5ef2aSThomas Huth         } else if (dig_a < dig_b) {
2176fcf5ef2aSThomas Huth             return -1;
2177fcf5ef2aSThomas Huth         }
2178fcf5ef2aSThomas Huth     }
2179fcf5ef2aSThomas Huth 
2180fcf5ef2aSThomas Huth     return 0;
2181fcf5ef2aSThomas Huth }
2182fcf5ef2aSThomas Huth 
2183936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2184fcf5ef2aSThomas Huth                        int *overflow)
2185fcf5ef2aSThomas Huth {
2186fcf5ef2aSThomas Huth     int carry = 0;
2187fcf5ef2aSThomas Huth     int i;
2188936fda4dSFabiano Rosas     int is_zero = 1;
2189936fda4dSFabiano Rosas 
2190fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2191fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) +
2192fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2193936fda4dSFabiano Rosas         is_zero &= (digit == 0);
2194fcf5ef2aSThomas Huth         if (digit > 9) {
2195fcf5ef2aSThomas Huth             carry = 1;
2196fcf5ef2aSThomas Huth             digit -= 10;
2197fcf5ef2aSThomas Huth         } else {
2198fcf5ef2aSThomas Huth             carry = 0;
2199fcf5ef2aSThomas Huth         }
2200fcf5ef2aSThomas Huth 
2201fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2202fcf5ef2aSThomas Huth     }
2203fcf5ef2aSThomas Huth 
2204fcf5ef2aSThomas Huth     *overflow = carry;
2205936fda4dSFabiano Rosas     return is_zero;
2206fcf5ef2aSThomas Huth }
2207fcf5ef2aSThomas Huth 
2208d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2209fcf5ef2aSThomas Huth                        int *overflow)
2210fcf5ef2aSThomas Huth {
2211fcf5ef2aSThomas Huth     int carry = 0;
2212fcf5ef2aSThomas Huth     int i;
2213d03b174aSYasmin Beatriz 
2214fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2215fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) -
2216fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2217fcf5ef2aSThomas Huth         if (digit & 0x80) {
2218fcf5ef2aSThomas Huth             carry = -1;
2219fcf5ef2aSThomas Huth             digit += 10;
2220fcf5ef2aSThomas Huth         } else {
2221fcf5ef2aSThomas Huth             carry = 0;
2222fcf5ef2aSThomas Huth         }
2223fcf5ef2aSThomas Huth 
2224fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2225fcf5ef2aSThomas Huth     }
2226fcf5ef2aSThomas Huth 
2227fcf5ef2aSThomas Huth     *overflow = carry;
2228fcf5ef2aSThomas Huth }
2229fcf5ef2aSThomas Huth 
2230fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2231fcf5ef2aSThomas Huth {
2232fcf5ef2aSThomas Huth 
2233fcf5ef2aSThomas Huth     int sgna = bcd_get_sgn(a);
2234fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2235fcf5ef2aSThomas Huth     int invalid = (sgna == 0) || (sgnb == 0);
2236fcf5ef2aSThomas Huth     int overflow = 0;
2237936fda4dSFabiano Rosas     int zero = 0;
2238fcf5ef2aSThomas Huth     uint32_t cr = 0;
2239fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
2240fcf5ef2aSThomas Huth 
2241fcf5ef2aSThomas Huth     if (!invalid) {
2242fcf5ef2aSThomas Huth         if (sgna == sgnb) {
2243428115c3SMark Cave-Ayland             result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2244936fda4dSFabiano Rosas             zero = bcd_add_mag(&result, a, b, &invalid, &overflow);
2245936fda4dSFabiano Rosas             cr = (sgna > 0) ? CRF_GT : CRF_LT;
2246fcf5ef2aSThomas Huth         } else {
2247d03b174aSYasmin Beatriz             int magnitude = bcd_cmp_mag(a, b);
2248d03b174aSYasmin Beatriz             if (magnitude > 0) {
2249428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2250d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, a, b, &invalid, &overflow);
2251d03b174aSYasmin Beatriz                 cr = (sgna > 0) ? CRF_GT : CRF_LT;
2252d03b174aSYasmin Beatriz             } else if (magnitude < 0) {
2253428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps);
2254d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, b, a, &invalid, &overflow);
2255efa73196SNikunj A Dadhania                 cr = (sgnb > 0) ? CRF_GT : CRF_LT;
2256d03b174aSYasmin Beatriz             } else {
2257428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps);
2258d03b174aSYasmin Beatriz                 cr = CRF_EQ;
2259d03b174aSYasmin Beatriz             }
2260fcf5ef2aSThomas Huth         }
2261fcf5ef2aSThomas Huth     }
2262fcf5ef2aSThomas Huth 
2263fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
22643c385a93SMark Cave-Ayland         result.VsrD(0) = result.VsrD(1) = -1;
2265efa73196SNikunj A Dadhania         cr = CRF_SO;
2266fcf5ef2aSThomas Huth     } else if (overflow) {
2267efa73196SNikunj A Dadhania         cr |= CRF_SO;
2268936fda4dSFabiano Rosas     } else if (zero) {
2269936fda4dSFabiano Rosas         cr |= CRF_EQ;
2270fcf5ef2aSThomas Huth     }
2271fcf5ef2aSThomas Huth 
2272fcf5ef2aSThomas Huth     *r = result;
2273fcf5ef2aSThomas Huth 
2274fcf5ef2aSThomas Huth     return cr;
2275fcf5ef2aSThomas Huth }
2276fcf5ef2aSThomas Huth 
2277fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2278fcf5ef2aSThomas Huth {
2279fcf5ef2aSThomas Huth     ppc_avr_t bcopy = *b;
2280fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2281fcf5ef2aSThomas Huth     if (sgnb < 0) {
2282fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0);
2283fcf5ef2aSThomas Huth     } else if (sgnb > 0) {
2284fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_NEG_PREF, 0);
2285fcf5ef2aSThomas Huth     }
2286fcf5ef2aSThomas Huth     /* else invalid ... defer to bcdadd code for proper handling */
2287fcf5ef2aSThomas Huth 
2288fcf5ef2aSThomas Huth     return helper_bcdadd(r, a, &bcopy, ps);
2289fcf5ef2aSThomas Huth }
2290fcf5ef2aSThomas Huth 
2291fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2292fcf5ef2aSThomas Huth {
2293fcf5ef2aSThomas Huth     int i;
2294fcf5ef2aSThomas Huth     int cr = 0;
2295fcf5ef2aSThomas Huth     uint16_t national = 0;
2296fcf5ef2aSThomas Huth     uint16_t sgnb = get_national_digit(b, 0);
2297fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2298fcf5ef2aSThomas Huth     int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG);
2299fcf5ef2aSThomas Huth 
2300fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2301fcf5ef2aSThomas Huth         national = get_national_digit(b, i);
2302fcf5ef2aSThomas Huth         if (unlikely(national < 0x30 || national > 0x39)) {
2303fcf5ef2aSThomas Huth             invalid = 1;
2304fcf5ef2aSThomas Huth             break;
2305fcf5ef2aSThomas Huth         }
2306fcf5ef2aSThomas Huth 
2307fcf5ef2aSThomas Huth         bcd_put_digit(&ret, national & 0xf, i);
2308fcf5ef2aSThomas Huth     }
2309fcf5ef2aSThomas Huth 
2310fcf5ef2aSThomas Huth     if (sgnb == NATIONAL_PLUS) {
2311fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0);
2312fcf5ef2aSThomas Huth     } else {
2313fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2314fcf5ef2aSThomas Huth     }
2315fcf5ef2aSThomas Huth 
2316fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2317fcf5ef2aSThomas Huth 
2318fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2319efa73196SNikunj A Dadhania         cr = CRF_SO;
2320fcf5ef2aSThomas Huth     }
2321fcf5ef2aSThomas Huth 
2322fcf5ef2aSThomas Huth     *r = ret;
2323fcf5ef2aSThomas Huth 
2324fcf5ef2aSThomas Huth     return cr;
2325fcf5ef2aSThomas Huth }
2326fcf5ef2aSThomas Huth 
2327fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2328fcf5ef2aSThomas Huth {
2329fcf5ef2aSThomas Huth     int i;
2330fcf5ef2aSThomas Huth     int cr = 0;
2331fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2332fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2333fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2334fcf5ef2aSThomas Huth 
23353c385a93SMark Cave-Ayland     int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0);
2336fcf5ef2aSThomas Huth 
2337fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2338fcf5ef2aSThomas Huth         set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i);
2339fcf5ef2aSThomas Huth 
2340fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2341fcf5ef2aSThomas Huth             break;
2342fcf5ef2aSThomas Huth         }
2343fcf5ef2aSThomas Huth     }
2344fcf5ef2aSThomas Huth     set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0);
2345fcf5ef2aSThomas Huth 
2346fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2347fcf5ef2aSThomas Huth 
2348fcf5ef2aSThomas Huth     if (ox_flag) {
2349efa73196SNikunj A Dadhania         cr |= CRF_SO;
2350fcf5ef2aSThomas Huth     }
2351fcf5ef2aSThomas Huth 
2352fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2353efa73196SNikunj A Dadhania         cr = CRF_SO;
2354fcf5ef2aSThomas Huth     }
2355fcf5ef2aSThomas Huth 
2356fcf5ef2aSThomas Huth     *r = ret;
2357fcf5ef2aSThomas Huth 
2358fcf5ef2aSThomas Huth     return cr;
2359fcf5ef2aSThomas Huth }
2360fcf5ef2aSThomas Huth 
2361fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2362fcf5ef2aSThomas Huth {
2363fcf5ef2aSThomas Huth     int i;
2364fcf5ef2aSThomas Huth     int cr = 0;
2365fcf5ef2aSThomas Huth     int invalid = 0;
2366fcf5ef2aSThomas Huth     int zone_digit = 0;
2367fcf5ef2aSThomas Huth     int zone_lead = ps ? 0xF : 0x3;
2368fcf5ef2aSThomas Huth     int digit = 0;
2369fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2370428115c3SMark Cave-Ayland     int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4;
2371fcf5ef2aSThomas Huth 
2372fcf5ef2aSThomas Huth     if (unlikely((sgnb < 0xA) && ps)) {
2373fcf5ef2aSThomas Huth         invalid = 1;
2374fcf5ef2aSThomas Huth     }
2375fcf5ef2aSThomas Huth 
2376fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2377428115c3SMark Cave-Ayland         zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead;
2378428115c3SMark Cave-Ayland         digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF;
2379fcf5ef2aSThomas Huth         if (unlikely(zone_digit != zone_lead || digit > 0x9)) {
2380fcf5ef2aSThomas Huth             invalid = 1;
2381fcf5ef2aSThomas Huth             break;
2382fcf5ef2aSThomas Huth         }
2383fcf5ef2aSThomas Huth 
2384fcf5ef2aSThomas Huth         bcd_put_digit(&ret, digit, i + 1);
2385fcf5ef2aSThomas Huth     }
2386fcf5ef2aSThomas Huth 
2387fcf5ef2aSThomas Huth     if ((ps && (sgnb == 0xB || sgnb == 0xD)) ||
2388fcf5ef2aSThomas Huth             (!ps && (sgnb & 0x4))) {
2389fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2390fcf5ef2aSThomas Huth     } else {
2391fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0);
2392fcf5ef2aSThomas Huth     }
2393fcf5ef2aSThomas Huth 
2394fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2395fcf5ef2aSThomas Huth 
2396fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2397efa73196SNikunj A Dadhania         cr = CRF_SO;
2398fcf5ef2aSThomas Huth     }
2399fcf5ef2aSThomas Huth 
2400fcf5ef2aSThomas Huth     *r = ret;
2401fcf5ef2aSThomas Huth 
2402fcf5ef2aSThomas Huth     return cr;
2403fcf5ef2aSThomas Huth }
2404fcf5ef2aSThomas Huth 
2405fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2406fcf5ef2aSThomas Huth {
2407fcf5ef2aSThomas Huth     int i;
2408fcf5ef2aSThomas Huth     int cr = 0;
2409fcf5ef2aSThomas Huth     uint8_t digit = 0;
2410fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2411fcf5ef2aSThomas Huth     int zone_lead = (ps) ? 0xF0 : 0x30;
2412fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2413fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2414fcf5ef2aSThomas Huth 
24153c385a93SMark Cave-Ayland     int ox_flag = ((b->VsrD(0) >> 4) != 0);
2416fcf5ef2aSThomas Huth 
2417fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2418fcf5ef2aSThomas Huth         digit = bcd_get_digit(b, i + 1, &invalid);
2419fcf5ef2aSThomas Huth 
2420fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2421fcf5ef2aSThomas Huth             break;
2422fcf5ef2aSThomas Huth         }
2423fcf5ef2aSThomas Huth 
2424428115c3SMark Cave-Ayland         ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit;
2425fcf5ef2aSThomas Huth     }
2426fcf5ef2aSThomas Huth 
2427fcf5ef2aSThomas Huth     if (ps) {
2428fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1);
2429fcf5ef2aSThomas Huth     } else {
2430fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1);
2431fcf5ef2aSThomas Huth     }
2432fcf5ef2aSThomas Huth 
2433fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2434fcf5ef2aSThomas Huth 
2435fcf5ef2aSThomas Huth     if (ox_flag) {
2436efa73196SNikunj A Dadhania         cr |= CRF_SO;
2437fcf5ef2aSThomas Huth     }
2438fcf5ef2aSThomas Huth 
2439fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2440efa73196SNikunj A Dadhania         cr = CRF_SO;
2441fcf5ef2aSThomas Huth     }
2442fcf5ef2aSThomas Huth 
2443fcf5ef2aSThomas Huth     *r = ret;
2444fcf5ef2aSThomas Huth 
2445fcf5ef2aSThomas Huth     return cr;
2446fcf5ef2aSThomas Huth }
2447fcf5ef2aSThomas Huth 
/**
 * Three-way comparison of two unsigned 128-bit integers, each supplied as
 * a (low, high) pair of unsigned 64-bit halves.
 *
 * Returns:
 * > 0 if ahi|alo > bhi|blo,
 * 0 if ahi|alo == bhi|blo,
 * < 0 if ahi|alo < bhi|blo
 */
static inline int ucmp128(uint64_t alo, uint64_t ahi,
                          uint64_t blo, uint64_t bhi)
{
    /* The high halves decide unless they are equal. */
    if (ahi != bhi) {
        return ahi > bhi ? 1 : -1;
    }

    if (alo != blo) {
        return alo > blo ? 1 : -1;
    }

    return 0;
}
2463a3d67f3eSLuis Pires 
2464a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2465a406c058SJose Ricardo Ziviani {
2466a406c058SJose Ricardo Ziviani     int i;
2467a3d67f3eSLuis Pires     int cr;
2468a406c058SJose Ricardo Ziviani     uint64_t lo_value;
2469a406c058SJose Ricardo Ziviani     uint64_t hi_value;
247040f3e79aSLuis Pires     uint64_t rem;
2471a406c058SJose Ricardo Ziviani     ppc_avr_t ret = { .u64 = { 0, 0 } };
2472a406c058SJose Ricardo Ziviani 
24733c385a93SMark Cave-Ayland     if (b->VsrSD(0) < 0) {
24743c385a93SMark Cave-Ayland         lo_value = -b->VsrSD(1);
24753c385a93SMark Cave-Ayland         hi_value = ~b->VsrD(0) + !lo_value;
2476a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, 0xD, 0);
2477a3d67f3eSLuis Pires 
2478a3d67f3eSLuis Pires         cr = CRF_LT;
2479a406c058SJose Ricardo Ziviani     } else {
24803c385a93SMark Cave-Ayland         lo_value = b->VsrD(1);
24813c385a93SMark Cave-Ayland         hi_value = b->VsrD(0);
2482a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0);
2483a3d67f3eSLuis Pires 
2484a3d67f3eSLuis Pires         if (hi_value == 0 && lo_value == 0) {
2485a3d67f3eSLuis Pires             cr = CRF_EQ;
2486a3d67f3eSLuis Pires         } else {
2487a3d67f3eSLuis Pires             cr = CRF_GT;
2488a3d67f3eSLuis Pires         }
2489a406c058SJose Ricardo Ziviani     }
2490a406c058SJose Ricardo Ziviani 
2491a3d67f3eSLuis Pires     /*
2492a3d67f3eSLuis Pires      * Check src limits: abs(src) <= 10^31 - 1
2493a3d67f3eSLuis Pires      *
2494a3d67f3eSLuis Pires      * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff
2495a3d67f3eSLuis Pires      */
2496a3d67f3eSLuis Pires     if (ucmp128(lo_value, hi_value,
2497a3d67f3eSLuis Pires                 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) {
2498a3d67f3eSLuis Pires         cr |= CRF_SO;
2499a3d67f3eSLuis Pires 
2500a3d67f3eSLuis Pires         /*
2501a3d67f3eSLuis Pires          * According to the ISA, if src wouldn't fit in the destination
2502a3d67f3eSLuis Pires          * register, the result is undefined.
2503a3d67f3eSLuis Pires          * In that case, we leave r unchanged.
2504a3d67f3eSLuis Pires          */
2505a3d67f3eSLuis Pires     } else {
250640f3e79aSLuis Pires         rem = divu128(&lo_value, &hi_value, 1000000000000000ULL);
2507a406c058SJose Ricardo Ziviani 
250840f3e79aSLuis Pires         for (i = 1; i < 16; rem /= 10, i++) {
250940f3e79aSLuis Pires             bcd_put_digit(&ret, rem % 10, i);
2510a406c058SJose Ricardo Ziviani         }
2511a406c058SJose Ricardo Ziviani 
2512a406c058SJose Ricardo Ziviani         for (; i < 32; lo_value /= 10, i++) {
2513a406c058SJose Ricardo Ziviani             bcd_put_digit(&ret, lo_value % 10, i);
2514a406c058SJose Ricardo Ziviani         }
2515a406c058SJose Ricardo Ziviani 
2516a406c058SJose Ricardo Ziviani         *r = ret;
2517a3d67f3eSLuis Pires     }
2518a406c058SJose Ricardo Ziviani 
2519a406c058SJose Ricardo Ziviani     return cr;
2520a406c058SJose Ricardo Ziviani }
2521a406c058SJose Ricardo Ziviani 
2522c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2523c85bc7ddSJose Ricardo Ziviani {
2524c85bc7ddSJose Ricardo Ziviani     uint8_t i;
2525c85bc7ddSJose Ricardo Ziviani     int cr;
2526c85bc7ddSJose Ricardo Ziviani     uint64_t carry;
2527c85bc7ddSJose Ricardo Ziviani     uint64_t unused;
2528c85bc7ddSJose Ricardo Ziviani     uint64_t lo_value;
2529c85bc7ddSJose Ricardo Ziviani     uint64_t hi_value = 0;
2530c85bc7ddSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2531c85bc7ddSJose Ricardo Ziviani     int invalid = (sgnb == 0);
2532c85bc7ddSJose Ricardo Ziviani 
2533c85bc7ddSJose Ricardo Ziviani     lo_value = bcd_get_digit(b, 31, &invalid);
2534c85bc7ddSJose Ricardo Ziviani     for (i = 30; i > 0; i--) {
2535c85bc7ddSJose Ricardo Ziviani         mulu64(&lo_value, &carry, lo_value, 10ULL);
2536c85bc7ddSJose Ricardo Ziviani         mulu64(&hi_value, &unused, hi_value, 10ULL);
2537c85bc7ddSJose Ricardo Ziviani         lo_value += bcd_get_digit(b, i, &invalid);
2538c85bc7ddSJose Ricardo Ziviani         hi_value += carry;
2539c85bc7ddSJose Ricardo Ziviani 
2540c85bc7ddSJose Ricardo Ziviani         if (unlikely(invalid)) {
2541c85bc7ddSJose Ricardo Ziviani             break;
2542c85bc7ddSJose Ricardo Ziviani         }
2543c85bc7ddSJose Ricardo Ziviani     }
2544c85bc7ddSJose Ricardo Ziviani 
2545c85bc7ddSJose Ricardo Ziviani     if (sgnb == -1) {
25463c385a93SMark Cave-Ayland         r->VsrSD(1) = -lo_value;
25473c385a93SMark Cave-Ayland         r->VsrSD(0) = ~hi_value + !r->VsrSD(1);
2548c85bc7ddSJose Ricardo Ziviani     } else {
25493c385a93SMark Cave-Ayland         r->VsrSD(1) = lo_value;
25503c385a93SMark Cave-Ayland         r->VsrSD(0) = hi_value;
2551c85bc7ddSJose Ricardo Ziviani     }
2552c85bc7ddSJose Ricardo Ziviani 
2553c85bc7ddSJose Ricardo Ziviani     cr = bcd_cmp_zero(b);
2554c85bc7ddSJose Ricardo Ziviani 
2555c85bc7ddSJose Ricardo Ziviani     if (unlikely(invalid)) {
2556c85bc7ddSJose Ricardo Ziviani         cr = CRF_SO;
2557c85bc7ddSJose Ricardo Ziviani     }
2558c85bc7ddSJose Ricardo Ziviani 
2559c85bc7ddSJose Ricardo Ziviani     return cr;
2560c85bc7ddSJose Ricardo Ziviani }
2561c85bc7ddSJose Ricardo Ziviani 
2562c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2563c3025c3bSJose Ricardo Ziviani {
2564c3025c3bSJose Ricardo Ziviani     int i;
2565c3025c3bSJose Ricardo Ziviani     int invalid = 0;
2566c3025c3bSJose Ricardo Ziviani 
2567c3025c3bSJose Ricardo Ziviani     if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) {
2568c3025c3bSJose Ricardo Ziviani         return CRF_SO;
2569c3025c3bSJose Ricardo Ziviani     }
2570c3025c3bSJose Ricardo Ziviani 
2571c3025c3bSJose Ricardo Ziviani     *r = *a;
2572428115c3SMark Cave-Ayland     bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0);
2573c3025c3bSJose Ricardo Ziviani 
2574c3025c3bSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2575c3025c3bSJose Ricardo Ziviani         bcd_get_digit(a, i, &invalid);
2576c3025c3bSJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2577c3025c3bSJose Ricardo Ziviani         if (unlikely(invalid)) {
2578c3025c3bSJose Ricardo Ziviani             return CRF_SO;
2579c3025c3bSJose Ricardo Ziviani         }
2580c3025c3bSJose Ricardo Ziviani     }
2581c3025c3bSJose Ricardo Ziviani 
2582c3025c3bSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2583c3025c3bSJose Ricardo Ziviani }
2584c3025c3bSJose Ricardo Ziviani 
2585466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2586466a3f9cSJose Ricardo Ziviani {
2587466a3f9cSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2588466a3f9cSJose Ricardo Ziviani 
2589466a3f9cSJose Ricardo Ziviani     *r = *b;
2590466a3f9cSJose Ricardo Ziviani     bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0);
2591466a3f9cSJose Ricardo Ziviani 
2592071663dfSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2593466a3f9cSJose Ricardo Ziviani         return CRF_SO;
2594466a3f9cSJose Ricardo Ziviani     }
2595466a3f9cSJose Ricardo Ziviani 
2596466a3f9cSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2597466a3f9cSJose Ricardo Ziviani }
2598466a3f9cSJose Ricardo Ziviani 
2599e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2600e04797f7SJose Ricardo Ziviani {
2601e04797f7SJose Ricardo Ziviani     int cr;
2602428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2603e04797f7SJose Ricardo Ziviani     bool ox_flag = false;
2604e04797f7SJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2605e04797f7SJose Ricardo Ziviani     ppc_avr_t ret = *b;
26063c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2607e04797f7SJose Ricardo Ziviani 
2608e04797f7SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2609e04797f7SJose Ricardo Ziviani         return CRF_SO;
2610e04797f7SJose Ricardo Ziviani     }
2611e04797f7SJose Ricardo Ziviani 
2612e04797f7SJose Ricardo Ziviani     if (unlikely(i > 31)) {
2613e04797f7SJose Ricardo Ziviani         i = 31;
2614e04797f7SJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2615e04797f7SJose Ricardo Ziviani         i = -31;
2616e04797f7SJose Ricardo Ziviani     }
2617e04797f7SJose Ricardo Ziviani 
2618e04797f7SJose Ricardo Ziviani     if (i > 0) {
26193c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2620e04797f7SJose Ricardo Ziviani     } else {
26213c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2622e04797f7SJose Ricardo Ziviani     }
2623e04797f7SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2624e04797f7SJose Ricardo Ziviani 
2625e04797f7SJose Ricardo Ziviani     *r = ret;
2626e04797f7SJose Ricardo Ziviani 
2627e04797f7SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2628e04797f7SJose Ricardo Ziviani     if (ox_flag) {
2629e04797f7SJose Ricardo Ziviani         cr |= CRF_SO;
2630e04797f7SJose Ricardo Ziviani     }
2631e04797f7SJose Ricardo Ziviani 
2632e04797f7SJose Ricardo Ziviani     return cr;
2633e04797f7SJose Ricardo Ziviani }
2634e04797f7SJose Ricardo Ziviani 
2635a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2636a49a95e9SJose Ricardo Ziviani {
2637a49a95e9SJose Ricardo Ziviani     int cr;
2638a49a95e9SJose Ricardo Ziviani     int i;
2639a49a95e9SJose Ricardo Ziviani     int invalid = 0;
2640a49a95e9SJose Ricardo Ziviani     bool ox_flag = false;
2641a49a95e9SJose Ricardo Ziviani     ppc_avr_t ret = *b;
2642a49a95e9SJose Ricardo Ziviani 
2643a49a95e9SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
2644a49a95e9SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2645a49a95e9SJose Ricardo Ziviani 
2646a49a95e9SJose Ricardo Ziviani         if (unlikely(invalid)) {
2647a49a95e9SJose Ricardo Ziviani             return CRF_SO;
2648a49a95e9SJose Ricardo Ziviani         }
2649a49a95e9SJose Ricardo Ziviani     }
2650a49a95e9SJose Ricardo Ziviani 
2651428115c3SMark Cave-Ayland     i = a->VsrSB(7);
2652a49a95e9SJose Ricardo Ziviani     if (i >= 32) {
2653a49a95e9SJose Ricardo Ziviani         ox_flag = true;
26543c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2655a49a95e9SJose Ricardo Ziviani     } else if (i <= -32) {
26563c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2657a49a95e9SJose Ricardo Ziviani     } else if (i > 0) {
26583c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2659a49a95e9SJose Ricardo Ziviani     } else {
26603c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2661a49a95e9SJose Ricardo Ziviani     }
2662a49a95e9SJose Ricardo Ziviani     *r = ret;
2663a49a95e9SJose Ricardo Ziviani 
2664a49a95e9SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2665a49a95e9SJose Ricardo Ziviani     if (ox_flag) {
2666a49a95e9SJose Ricardo Ziviani         cr |= CRF_SO;
2667a49a95e9SJose Ricardo Ziviani     }
2668a49a95e9SJose Ricardo Ziviani 
2669a49a95e9SJose Ricardo Ziviani     return cr;
2670a49a95e9SJose Ricardo Ziviani }
2671a49a95e9SJose Ricardo Ziviani 
2672a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2673a54238adSJose Ricardo Ziviani {
2674a54238adSJose Ricardo Ziviani     int cr;
2675a54238adSJose Ricardo Ziviani     int unused = 0;
2676a54238adSJose Ricardo Ziviani     int invalid = 0;
2677a54238adSJose Ricardo Ziviani     bool ox_flag = false;
2678a54238adSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2679a54238adSJose Ricardo Ziviani     ppc_avr_t ret = *b;
26803c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2681a54238adSJose Ricardo Ziviani 
2682428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2683428115c3SMark Cave-Ayland     ppc_avr_t bcd_one;
2684428115c3SMark Cave-Ayland 
2685428115c3SMark Cave-Ayland     bcd_one.VsrD(0) = 0;
2686428115c3SMark Cave-Ayland     bcd_one.VsrD(1) = 0x10;
2687a54238adSJose Ricardo Ziviani 
2688a54238adSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2689a54238adSJose Ricardo Ziviani         return CRF_SO;
2690a54238adSJose Ricardo Ziviani     }
2691a54238adSJose Ricardo Ziviani 
2692a54238adSJose Ricardo Ziviani     if (unlikely(i > 31)) {
2693a54238adSJose Ricardo Ziviani         i = 31;
2694a54238adSJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2695a54238adSJose Ricardo Ziviani         i = -31;
2696a54238adSJose Ricardo Ziviani     }
2697a54238adSJose Ricardo Ziviani 
2698a54238adSJose Ricardo Ziviani     if (i > 0) {
26993c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2700a54238adSJose Ricardo Ziviani     } else {
27013c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2702a54238adSJose Ricardo Ziviani 
2703a54238adSJose Ricardo Ziviani         if (bcd_get_digit(&ret, 0, &invalid) >= 5) {
2704a54238adSJose Ricardo Ziviani             bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused);
2705a54238adSJose Ricardo Ziviani         }
2706a54238adSJose Ricardo Ziviani     }
2707a54238adSJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2708a54238adSJose Ricardo Ziviani 
2709a54238adSJose Ricardo Ziviani     cr = bcd_cmp_zero(&ret);
2710a54238adSJose Ricardo Ziviani     if (ox_flag) {
2711a54238adSJose Ricardo Ziviani         cr |= CRF_SO;
2712a54238adSJose Ricardo Ziviani     }
2713a54238adSJose Ricardo Ziviani     *r = ret;
2714a54238adSJose Ricardo Ziviani 
2715a54238adSJose Ricardo Ziviani     return cr;
2716a54238adSJose Ricardo Ziviani }
2717a54238adSJose Ricardo Ziviani 
271831bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
271931bc4d11SJose Ricardo Ziviani {
272031bc4d11SJose Ricardo Ziviani     uint64_t mask;
272131bc4d11SJose Ricardo Ziviani     uint32_t ox_flag = 0;
2722428115c3SMark Cave-Ayland     int i = a->VsrSH(3) + 1;
272331bc4d11SJose Ricardo Ziviani     ppc_avr_t ret = *b;
272431bc4d11SJose Ricardo Ziviani 
272531bc4d11SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
272631bc4d11SJose Ricardo Ziviani         return CRF_SO;
272731bc4d11SJose Ricardo Ziviani     }
272831bc4d11SJose Ricardo Ziviani 
272931bc4d11SJose Ricardo Ziviani     if (i > 16 && i < 32) {
273031bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
27313c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
273231bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
273331bc4d11SJose Ricardo Ziviani         }
273431bc4d11SJose Ricardo Ziviani 
27353c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
273631bc4d11SJose Ricardo Ziviani     } else if (i >= 0 && i <= 16) {
273731bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
27383c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
273931bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
274031bc4d11SJose Ricardo Ziviani         }
274131bc4d11SJose Ricardo Ziviani 
27423c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
27433c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
274431bc4d11SJose Ricardo Ziviani     }
274531bc4d11SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0);
274631bc4d11SJose Ricardo Ziviani     *r = ret;
274731bc4d11SJose Ricardo Ziviani 
274831bc4d11SJose Ricardo Ziviani     return bcd_cmp_zero(&ret) | ox_flag;
274931bc4d11SJose Ricardo Ziviani }
275031bc4d11SJose Ricardo Ziviani 
27515c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
27525c32e2e4SJose Ricardo Ziviani {
27535c32e2e4SJose Ricardo Ziviani     int i;
27545c32e2e4SJose Ricardo Ziviani     uint64_t mask;
27555c32e2e4SJose Ricardo Ziviani     uint32_t ox_flag = 0;
27565c32e2e4SJose Ricardo Ziviani     int invalid = 0;
27575c32e2e4SJose Ricardo Ziviani     ppc_avr_t ret = *b;
27585c32e2e4SJose Ricardo Ziviani 
27595c32e2e4SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
27605c32e2e4SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
27615c32e2e4SJose Ricardo Ziviani 
27625c32e2e4SJose Ricardo Ziviani         if (unlikely(invalid)) {
27635c32e2e4SJose Ricardo Ziviani             return CRF_SO;
27645c32e2e4SJose Ricardo Ziviani         }
27655c32e2e4SJose Ricardo Ziviani     }
27665c32e2e4SJose Ricardo Ziviani 
2767428115c3SMark Cave-Ayland     i = a->VsrSH(3);
27685c32e2e4SJose Ricardo Ziviani     if (i > 16 && i < 33) {
27695c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
27703c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
27715c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
27725c32e2e4SJose Ricardo Ziviani         }
27735c32e2e4SJose Ricardo Ziviani 
27743c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
27755c32e2e4SJose Ricardo Ziviani     } else if (i > 0 && i <= 16) {
27765c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
27773c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
27785c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
27795c32e2e4SJose Ricardo Ziviani         }
27805c32e2e4SJose Ricardo Ziviani 
27813c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
27823c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
27835c32e2e4SJose Ricardo Ziviani     } else if (i == 0) {
27843c385a93SMark Cave-Ayland         if (ret.VsrD(0) || ret.VsrD(1)) {
27855c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
27865c32e2e4SJose Ricardo Ziviani         }
27873c385a93SMark Cave-Ayland         ret.VsrD(0) = ret.VsrD(1) = 0;
27885c32e2e4SJose Ricardo Ziviani     }
27895c32e2e4SJose Ricardo Ziviani 
27905c32e2e4SJose Ricardo Ziviani     *r = ret;
27913c385a93SMark Cave-Ayland     if (r->VsrD(0) == 0 && r->VsrD(1) == 0) {
27925c32e2e4SJose Ricardo Ziviani         return ox_flag | CRF_EQ;
27935c32e2e4SJose Ricardo Ziviani     }
27945c32e2e4SJose Ricardo Ziviani 
27955c32e2e4SJose Ricardo Ziviani     return ox_flag | CRF_GT;
27965c32e2e4SJose Ricardo Ziviani }
27975c32e2e4SJose Ricardo Ziviani 
2798fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a)
2799fcf5ef2aSThomas Huth {
2800fcf5ef2aSThomas Huth     int i;
2801fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
2802fcf5ef2aSThomas Huth         r->u8[i] = AES_sbox[a->u8[i]];
2803fcf5ef2aSThomas Huth     }
2804fcf5ef2aSThomas Huth }
2805fcf5ef2aSThomas Huth 
2806fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2807fcf5ef2aSThomas Huth {
2808fcf5ef2aSThomas Huth     ppc_avr_t result;
2809fcf5ef2aSThomas Huth     int i;
2810fcf5ef2aSThomas Huth 
2811fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
28122dea57dbSMark Cave-Ayland         result.VsrW(i) = b->VsrW(i) ^
28132dea57dbSMark Cave-Ayland             (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^
28142dea57dbSMark Cave-Ayland              AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^
28152dea57dbSMark Cave-Ayland              AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^
28162dea57dbSMark Cave-Ayland              AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]);
2817fcf5ef2aSThomas Huth     }
2818fcf5ef2aSThomas Huth     *r = result;
2819fcf5ef2aSThomas Huth }
2820fcf5ef2aSThomas Huth 
2821fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2822fcf5ef2aSThomas Huth {
2823fcf5ef2aSThomas Huth     ppc_avr_t result;
2824fcf5ef2aSThomas Huth     int i;
2825fcf5ef2aSThomas Huth 
2826fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
28272dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]);
2828fcf5ef2aSThomas Huth     }
2829fcf5ef2aSThomas Huth     *r = result;
2830fcf5ef2aSThomas Huth }
2831fcf5ef2aSThomas Huth 
2832fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2833fcf5ef2aSThomas Huth {
2834fcf5ef2aSThomas Huth     /* This differs from what is written in ISA V2.07.  The RTL is */
2835fcf5ef2aSThomas Huth     /* incorrect and will be fixed in V2.07B.                      */
2836fcf5ef2aSThomas Huth     int i;
2837fcf5ef2aSThomas Huth     ppc_avr_t tmp;
2838fcf5ef2aSThomas Huth 
2839fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
28402dea57dbSMark Cave-Ayland         tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])];
2841fcf5ef2aSThomas Huth     }
2842fcf5ef2aSThomas Huth 
2843fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
28442dea57dbSMark Cave-Ayland         r->VsrW(i) =
28452dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 0)][0] ^
28462dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 1)][1] ^
28472dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 2)][2] ^
28482dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 3)][3];
2849fcf5ef2aSThomas Huth     }
2850fcf5ef2aSThomas Huth }
2851fcf5ef2aSThomas Huth 
2852fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2853fcf5ef2aSThomas Huth {
2854fcf5ef2aSThomas Huth     ppc_avr_t result;
2855fcf5ef2aSThomas Huth     int i;
2856fcf5ef2aSThomas Huth 
2857fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
28582dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]);
2859fcf5ef2aSThomas Huth     }
2860fcf5ef2aSThomas Huth     *r = result;
2861fcf5ef2aSThomas Huth }
2862fcf5ef2aSThomas Huth 
2863fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
2864fcf5ef2aSThomas Huth {
2865fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
2866fcf5ef2aSThomas Huth     int six = st_six & 0xF;
2867fcf5ef2aSThomas Huth     int i;
2868fcf5ef2aSThomas Huth 
2869730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
2870fcf5ef2aSThomas Huth         if (st == 0) {
2871fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
28720ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 7) ^
28730ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 18) ^
2874730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 3);
2875fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
28760ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 17) ^
28770ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 19) ^
2878730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 10);
2879fcf5ef2aSThomas Huth             }
2880fcf5ef2aSThomas Huth         } else { /* st == 1 */
2881fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
28820ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 2) ^
28830ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 13) ^
28840ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 22);
2885fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
28860ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 6) ^
28870ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 11) ^
28880ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 25);
2889fcf5ef2aSThomas Huth             }
2890fcf5ef2aSThomas Huth         }
2891fcf5ef2aSThomas Huth     }
2892fcf5ef2aSThomas Huth }
2893fcf5ef2aSThomas Huth 
2894fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
2895fcf5ef2aSThomas Huth {
2896fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
2897fcf5ef2aSThomas Huth     int six = st_six & 0xF;
2898fcf5ef2aSThomas Huth     int i;
2899fcf5ef2aSThomas Huth 
2900730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
2901fcf5ef2aSThomas Huth         if (st == 0) {
2902fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
29030ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 1) ^
29040ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 8) ^
2905730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 7);
2906fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
29070ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 19) ^
29080ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 61) ^
2909730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 6);
2910fcf5ef2aSThomas Huth             }
2911fcf5ef2aSThomas Huth         } else { /* st == 1 */
2912fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
29130ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 28) ^
29140ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 34) ^
29150ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 39);
2916fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
29170ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 14) ^
29180ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 18) ^
29190ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 41);
2920fcf5ef2aSThomas Huth             }
2921fcf5ef2aSThomas Huth         }
2922fcf5ef2aSThomas Huth     }
2923fcf5ef2aSThomas Huth }
2924fcf5ef2aSThomas Huth 
2925fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2926fcf5ef2aSThomas Huth {
2927fcf5ef2aSThomas Huth     ppc_avr_t result;
2928fcf5ef2aSThomas Huth     int i;
2929fcf5ef2aSThomas Huth 
293060594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
293160594feaSMark Cave-Ayland         int indexA = c->VsrB(i) >> 4;
293260594feaSMark Cave-Ayland         int indexB = c->VsrB(i) & 0xF;
293360594feaSMark Cave-Ayland 
293460594feaSMark Cave-Ayland         result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB);
2935fcf5ef2aSThomas Huth     }
2936fcf5ef2aSThomas Huth     *r = result;
2937fcf5ef2aSThomas Huth }
2938fcf5ef2aSThomas Huth 
2939fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I
2940fcf5ef2aSThomas Huth 
2941fcf5ef2aSThomas Huth /*****************************************************************************/
2942fcf5ef2aSThomas Huth /* SPE extension helpers */
2943fcf5ef2aSThomas Huth /* Use a table to make this quicker */
/* hbrev[n] is the 4-bit value n with its bit order reversed. */
static const uint8_t hbrev[16] = {
    0x0, 0x8, 0x4, 0xC,
    0x2, 0xA, 0x6, 0xE,
    0x1, 0x9, 0x5, 0xD,
    0x3, 0xB, 0x7, 0xF,
};

/*
 * Reverse the bit order of one byte: each nibble is reversed through
 * hbrev[] and the two nibbles trade places.
 */
static inline uint8_t byte_reverse(uint8_t val)
{
    const uint8_t upper = val >> 4;
    const uint8_t lower = val & 0xF;

    return (hbrev[lower] << 4) | hbrev[upper];
}
2953fcf5ef2aSThomas Huth 
/*
 * Reverse the bit order of a 32-bit word: every byte is bit-reversed with
 * byte_reverse() and the four bytes are placed in the opposite order.
 *
 * byte_reverse() yields a uint8_t, which the integer promotions turn into
 * a signed int.  Each byte is therefore widened to uint32_t before it is
 * shifted, so that moving a byte with its top bit set into bits 24..31 is
 * an unsigned shift rather than a signed shift into the sign bit.
 */
static inline uint32_t word_reverse(uint32_t val)
{
    return (uint32_t)byte_reverse(val >> 24) |
        ((uint32_t)byte_reverse(val >> 16) << 8) |
        ((uint32_t)byte_reverse(val >> 8) << 16) |
        ((uint32_t)byte_reverse(val) << 24);
}
2959fcf5ef2aSThomas Huth 
2960fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */
2961fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2)
2962fcf5ef2aSThomas Huth {
2963fcf5ef2aSThomas Huth     uint32_t a, b, d, mask;
2964fcf5ef2aSThomas Huth 
2965fcf5ef2aSThomas Huth     mask = UINT32_MAX >> (32 - MASKBITS);
2966fcf5ef2aSThomas Huth     a = arg1 & mask;
2967fcf5ef2aSThomas Huth     b = arg2 & mask;
2968fcf5ef2aSThomas Huth     d = word_reverse(1 + word_reverse(a | ~b));
2969fcf5ef2aSThomas Huth     return (arg1 & ~mask) | (d & b);
2970fcf5ef2aSThomas Huth }
2971fcf5ef2aSThomas Huth 
/*
 * Count how many leading bits of @val are equal to its most significant
 * bit.  When bit 31 is set the value is inverted first, so that the run of
 * leading ones can be counted as leading zeros by clz32().
 */
uint32_t helper_cntlsw32(uint32_t val)
{
    const uint32_t probe = (val & 0x80000000) ? ~val : val;

    return clz32(probe);
}
2980fcf5ef2aSThomas Huth 
/* Return the result of clz32() for @val as a 32-bit value. */
uint32_t helper_cntlzw32(uint32_t val)
{
    const uint32_t leading = clz32(val);

    return leading;
}
2985fcf5ef2aSThomas Huth 
2986fcf5ef2aSThomas Huth /* 440 specific */
2987fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high,
2988fcf5ef2aSThomas Huth                           target_ulong low, uint32_t update_Rc)
2989fcf5ef2aSThomas Huth {
2990fcf5ef2aSThomas Huth     target_ulong mask;
2991fcf5ef2aSThomas Huth     int i;
2992fcf5ef2aSThomas Huth 
2993fcf5ef2aSThomas Huth     i = 1;
2994fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
2995fcf5ef2aSThomas Huth         if ((high & mask) == 0) {
2996fcf5ef2aSThomas Huth             if (update_Rc) {
2997fcf5ef2aSThomas Huth                 env->crf[0] = 0x4;
2998fcf5ef2aSThomas Huth             }
2999fcf5ef2aSThomas Huth             goto done;
3000fcf5ef2aSThomas Huth         }
3001fcf5ef2aSThomas Huth         i++;
3002fcf5ef2aSThomas Huth     }
3003fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
3004fcf5ef2aSThomas Huth         if ((low & mask) == 0) {
3005fcf5ef2aSThomas Huth             if (update_Rc) {
3006fcf5ef2aSThomas Huth                 env->crf[0] = 0x8;
3007fcf5ef2aSThomas Huth             }
3008fcf5ef2aSThomas Huth             goto done;
3009fcf5ef2aSThomas Huth         }
3010fcf5ef2aSThomas Huth         i++;
3011fcf5ef2aSThomas Huth     }
3012fcf5ef2aSThomas Huth     i = 8;
3013fcf5ef2aSThomas Huth     if (update_Rc) {
3014fcf5ef2aSThomas Huth         env->crf[0] = 0x2;
3015fcf5ef2aSThomas Huth     }
3016fcf5ef2aSThomas Huth  done:
3017fcf5ef2aSThomas Huth     env->xer = (env->xer & ~0x7F) | i;
3018fcf5ef2aSThomas Huth     if (update_Rc) {
3019fcf5ef2aSThomas Huth         env->crf[0] |= xer_so;
3020fcf5ef2aSThomas Huth     }
3021fcf5ef2aSThomas Huth     return i;
3022fcf5ef2aSThomas Huth }
3023