xref: /openbmc/qemu/target/ppc/int_helper.c (revision 788c63998ce6e17b7d7f2e30d28ee5979a6d6cec)
1fcf5ef2aSThomas Huth /*
2fcf5ef2aSThomas Huth  *  PowerPC integer and vector emulation helpers for QEMU.
3fcf5ef2aSThomas Huth  *
4fcf5ef2aSThomas Huth  *  Copyright (c) 2003-2007 Jocelyn Mayer
5fcf5ef2aSThomas Huth  *
6fcf5ef2aSThomas Huth  * This library is free software; you can redistribute it and/or
7fcf5ef2aSThomas Huth  * modify it under the terms of the GNU Lesser General Public
8fcf5ef2aSThomas Huth  * License as published by the Free Software Foundation; either
96bd039cdSChetan Pant  * version 2.1 of the License, or (at your option) any later version.
10fcf5ef2aSThomas Huth  *
11fcf5ef2aSThomas Huth  * This library is distributed in the hope that it will be useful,
12fcf5ef2aSThomas Huth  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13fcf5ef2aSThomas Huth  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14fcf5ef2aSThomas Huth  * Lesser General Public License for more details.
15fcf5ef2aSThomas Huth  *
16fcf5ef2aSThomas Huth  * You should have received a copy of the GNU Lesser General Public
17fcf5ef2aSThomas Huth  * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18fcf5ef2aSThomas Huth  */
19db725815SMarkus Armbruster 
20fcf5ef2aSThomas Huth #include "qemu/osdep.h"
21fcf5ef2aSThomas Huth #include "cpu.h"
22fcf5ef2aSThomas Huth #include "internal.h"
23fcf5ef2aSThomas Huth #include "qemu/host-utils.h"
24db725815SMarkus Armbruster #include "qemu/main-loop.h"
258a05fd9aSRichard Henderson #include "qemu/log.h"
26fcf5ef2aSThomas Huth #include "exec/helper-proto.h"
27fcf5ef2aSThomas Huth #include "crypto/aes.h"
2824f91e81SAlex Bennée #include "fpu/softfloat.h"
293f74b632SRichard Henderson #include "qapi/error.h"
303f74b632SRichard Henderson #include "qemu/guest-random.h"
31fcf5ef2aSThomas Huth 
32fcf5ef2aSThomas Huth #include "helper_regs.h"
33fcf5ef2aSThomas Huth /*****************************************************************************/
34fcf5ef2aSThomas Huth /* Fixed point operations helpers */
35fcf5ef2aSThomas Huth 
36f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov)
37f32899deSNikunj A Dadhania {
38f32899deSNikunj A Dadhania     if (unlikely(ov)) {
39f32899deSNikunj A Dadhania         env->so = env->ov = 1;
40f32899deSNikunj A Dadhania     } else {
41f32899deSNikunj A Dadhania         env->ov = 0;
42f32899deSNikunj A Dadhania     }
43f32899deSNikunj A Dadhania }
44f32899deSNikunj A Dadhania 
45fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb,
46fcf5ef2aSThomas Huth                            uint32_t oe)
47fcf5ef2aSThomas Huth {
48fcf5ef2aSThomas Huth     uint64_t rt = 0;
49fcf5ef2aSThomas Huth     int overflow = 0;
50fcf5ef2aSThomas Huth 
51fcf5ef2aSThomas Huth     uint64_t dividend = (uint64_t)ra << 32;
52fcf5ef2aSThomas Huth     uint64_t divisor = (uint32_t)rb;
53fcf5ef2aSThomas Huth 
54fcf5ef2aSThomas Huth     if (unlikely(divisor == 0)) {
55fcf5ef2aSThomas Huth         overflow = 1;
56fcf5ef2aSThomas Huth     } else {
57fcf5ef2aSThomas Huth         rt = dividend / divisor;
58fcf5ef2aSThomas Huth         overflow = rt > UINT32_MAX;
59fcf5ef2aSThomas Huth     }
60fcf5ef2aSThomas Huth 
61fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
62fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
63fcf5ef2aSThomas Huth     }
64fcf5ef2aSThomas Huth 
65fcf5ef2aSThomas Huth     if (oe) {
66f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
67fcf5ef2aSThomas Huth     }
68fcf5ef2aSThomas Huth 
69fcf5ef2aSThomas Huth     return (target_ulong)rt;
70fcf5ef2aSThomas Huth }
71fcf5ef2aSThomas Huth 
72fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb,
73fcf5ef2aSThomas Huth                           uint32_t oe)
74fcf5ef2aSThomas Huth {
75fcf5ef2aSThomas Huth     int64_t rt = 0;
76fcf5ef2aSThomas Huth     int overflow = 0;
77fcf5ef2aSThomas Huth 
78fcf5ef2aSThomas Huth     int64_t dividend = (int64_t)ra << 32;
79fcf5ef2aSThomas Huth     int64_t divisor = (int64_t)((int32_t)rb);
80fcf5ef2aSThomas Huth 
81fcf5ef2aSThomas Huth     if (unlikely((divisor == 0) ||
82fcf5ef2aSThomas Huth                  ((divisor == -1ull) && (dividend == INT64_MIN)))) {
83fcf5ef2aSThomas Huth         overflow = 1;
84fcf5ef2aSThomas Huth     } else {
85fcf5ef2aSThomas Huth         rt = dividend / divisor;
86fcf5ef2aSThomas Huth         overflow = rt != (int32_t)rt;
87fcf5ef2aSThomas Huth     }
88fcf5ef2aSThomas Huth 
89fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
90fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
91fcf5ef2aSThomas Huth     }
92fcf5ef2aSThomas Huth 
93fcf5ef2aSThomas Huth     if (oe) {
94f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
95fcf5ef2aSThomas Huth     }
96fcf5ef2aSThomas Huth 
97fcf5ef2aSThomas Huth     return (target_ulong)rt;
98fcf5ef2aSThomas Huth }
99fcf5ef2aSThomas Huth 
100fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
101fcf5ef2aSThomas Huth 
102fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe)
103fcf5ef2aSThomas Huth {
104fcf5ef2aSThomas Huth     uint64_t rt = 0;
105fcf5ef2aSThomas Huth     int overflow = 0;
106fcf5ef2aSThomas Huth 
1079276a31cSLuis Pires     if (unlikely(rb == 0 || ra >= rb)) {
1089276a31cSLuis Pires         overflow = 1;
109fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1109276a31cSLuis Pires     } else {
1119276a31cSLuis Pires         divu128(&rt, &ra, rb);
112fcf5ef2aSThomas Huth     }
113fcf5ef2aSThomas Huth 
114fcf5ef2aSThomas Huth     if (oe) {
115f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
116fcf5ef2aSThomas Huth     }
117fcf5ef2aSThomas Huth 
118fcf5ef2aSThomas Huth     return rt;
119fcf5ef2aSThomas Huth }
120fcf5ef2aSThomas Huth 
121fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe)
122fcf5ef2aSThomas Huth {
12340f3e79aSLuis Pires     uint64_t rt = 0;
124fcf5ef2aSThomas Huth     int64_t ra = (int64_t)rau;
125fcf5ef2aSThomas Huth     int64_t rb = (int64_t)rbu;
1269276a31cSLuis Pires     int overflow = 0;
127fcf5ef2aSThomas Huth 
1289276a31cSLuis Pires     if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) {
1299276a31cSLuis Pires         overflow = 1;
130fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1319276a31cSLuis Pires     } else {
1329276a31cSLuis Pires         divs128(&rt, &ra, rb);
133fcf5ef2aSThomas Huth     }
134fcf5ef2aSThomas Huth 
135fcf5ef2aSThomas Huth     if (oe) {
136f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
137fcf5ef2aSThomas Huth     }
138fcf5ef2aSThomas Huth 
139fcf5ef2aSThomas Huth     return rt;
140fcf5ef2aSThomas Huth }
141fcf5ef2aSThomas Huth 
142fcf5ef2aSThomas Huth #endif
143fcf5ef2aSThomas Huth 
144fcf5ef2aSThomas Huth 
145fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
146fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */
147fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff))
148fcf5ef2aSThomas Huth 
149b6cb41b2SDavid Gibson /*
150b6cb41b2SDavid Gibson  * subtract 1 from each byte, and with inverse, check if MSB is set at each
151fcf5ef2aSThomas Huth  * byte.
152fcf5ef2aSThomas Huth  * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80
153fcf5ef2aSThomas Huth  *      (0xFF & 0xFF) & 0x80 = 0x80 (zero found)
154fcf5ef2aSThomas Huth  */
155fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80))
156fcf5ef2aSThomas Huth 
157fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */
158fcf5ef2aSThomas Huth #define hasvalue(x, n)  (haszero((x) ^ pattern(n)))
159fcf5ef2aSThomas Huth 
160fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb)
161fcf5ef2aSThomas Huth {
162efa73196SNikunj A Dadhania     return hasvalue(rb, ra) ? CRF_GT : 0;
163fcf5ef2aSThomas Huth }
164fcf5ef2aSThomas Huth 
165fcf5ef2aSThomas Huth #undef pattern
166fcf5ef2aSThomas Huth #undef haszero
167fcf5ef2aSThomas Huth #undef hasvalue
168fcf5ef2aSThomas Huth 
169b6cb41b2SDavid Gibson /*
1703f74b632SRichard Henderson  * Return a random number.
171fcf5ef2aSThomas Huth  */
1723f74b632SRichard Henderson uint64_t helper_darn32(void)
173fcf5ef2aSThomas Huth {
1743f74b632SRichard Henderson     Error *err = NULL;
1753f74b632SRichard Henderson     uint32_t ret;
1763f74b632SRichard Henderson 
1773f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1783f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1793f74b632SRichard Henderson                       error_get_pretty(err));
1803f74b632SRichard Henderson         error_free(err);
181fcf5ef2aSThomas Huth         return -1;
182fcf5ef2aSThomas Huth     }
183fcf5ef2aSThomas Huth 
1843f74b632SRichard Henderson     return ret;
1853f74b632SRichard Henderson }
1863f74b632SRichard Henderson 
1873f74b632SRichard Henderson uint64_t helper_darn64(void)
188fcf5ef2aSThomas Huth {
1893f74b632SRichard Henderson     Error *err = NULL;
1903f74b632SRichard Henderson     uint64_t ret;
1913f74b632SRichard Henderson 
1923f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1933f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1943f74b632SRichard Henderson                       error_get_pretty(err));
1953f74b632SRichard Henderson         error_free(err);
196fcf5ef2aSThomas Huth         return -1;
197fcf5ef2aSThomas Huth     }
198fcf5ef2aSThomas Huth 
1993f74b632SRichard Henderson     return ret;
2003f74b632SRichard Henderson }
201fcf5ef2aSThomas Huth 
/*
 * Bit permute doubleword.
 *
 * Each of the eight bytes of 'rs' is used as a bit index into 'rb' (through
 * PPC_BIT()).  Result bit n is set when byte n of 'rs' (counting from the
 * least significant byte) is below 64 and selects a set bit of 'rb'; indexes
 * of 64 or more contribute 0.
 */
uint64_t helper_bpermd(uint64_t rs, uint64_t rb)
{
    uint64_t result = 0;
    int n;

    for (n = 0; n < 8; n++) {
        const int sel = (rs >> (n * 8)) & 0xFF;

        if (sel >= 64) {
            continue;
        }
        if (rb & PPC_BIT(sel)) {
            result |= (uint64_t)1 << n;
        }
    }

    return result;
}
217fcf5ef2aSThomas Huth 
218fcf5ef2aSThomas Huth #endif
219fcf5ef2aSThomas Huth 
220fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb)
221fcf5ef2aSThomas Huth {
222fcf5ef2aSThomas Huth     target_ulong mask = 0xff;
223fcf5ef2aSThomas Huth     target_ulong ra = 0;
224fcf5ef2aSThomas Huth     int i;
225fcf5ef2aSThomas Huth 
226fcf5ef2aSThomas Huth     for (i = 0; i < sizeof(target_ulong); i++) {
227fcf5ef2aSThomas Huth         if ((rs & mask) == (rb & mask)) {
228fcf5ef2aSThomas Huth             ra |= mask;
229fcf5ef2aSThomas Huth         }
230fcf5ef2aSThomas Huth         mask <<= 8;
231fcf5ef2aSThomas Huth     }
232fcf5ef2aSThomas Huth     return ra;
233fcf5ef2aSThomas Huth }
234fcf5ef2aSThomas Huth 
235fcf5ef2aSThomas Huth /* shift right arithmetic helper */
236fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value,
237fcf5ef2aSThomas Huth                          target_ulong shift)
238fcf5ef2aSThomas Huth {
239fcf5ef2aSThomas Huth     int32_t ret;
240fcf5ef2aSThomas Huth 
241fcf5ef2aSThomas Huth     if (likely(!(shift & 0x20))) {
242fcf5ef2aSThomas Huth         if (likely((uint32_t)shift != 0)) {
243fcf5ef2aSThomas Huth             shift &= 0x1f;
244fcf5ef2aSThomas Huth             ret = (int32_t)value >> shift;
245fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) {
246af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
247fcf5ef2aSThomas Huth             } else {
248af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
249fcf5ef2aSThomas Huth             }
250fcf5ef2aSThomas Huth         } else {
251fcf5ef2aSThomas Huth             ret = (int32_t)value;
252af1c259fSSandipan Das             env->ca32 = env->ca = 0;
253fcf5ef2aSThomas Huth         }
254fcf5ef2aSThomas Huth     } else {
255fcf5ef2aSThomas Huth         ret = (int32_t)value >> 31;
256af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
257fcf5ef2aSThomas Huth     }
258fcf5ef2aSThomas Huth     return (target_long)ret;
259fcf5ef2aSThomas Huth }
260fcf5ef2aSThomas Huth 
261fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
262fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value,
263fcf5ef2aSThomas Huth                          target_ulong shift)
264fcf5ef2aSThomas Huth {
265fcf5ef2aSThomas Huth     int64_t ret;
266fcf5ef2aSThomas Huth 
267fcf5ef2aSThomas Huth     if (likely(!(shift & 0x40))) {
268fcf5ef2aSThomas Huth         if (likely((uint64_t)shift != 0)) {
269fcf5ef2aSThomas Huth             shift &= 0x3f;
270fcf5ef2aSThomas Huth             ret = (int64_t)value >> shift;
271fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) {
272af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
273fcf5ef2aSThomas Huth             } else {
274af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
275fcf5ef2aSThomas Huth             }
276fcf5ef2aSThomas Huth         } else {
277fcf5ef2aSThomas Huth             ret = (int64_t)value;
278af1c259fSSandipan Das             env->ca32 = env->ca = 0;
279fcf5ef2aSThomas Huth         }
280fcf5ef2aSThomas Huth     } else {
281fcf5ef2aSThomas Huth         ret = (int64_t)value >> 63;
282af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
283fcf5ef2aSThomas Huth     }
284fcf5ef2aSThomas Huth     return ret;
285fcf5ef2aSThomas Huth }
286fcf5ef2aSThomas Huth #endif
287fcf5ef2aSThomas Huth 
288fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
289fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
290fcf5ef2aSThomas Huth {
29179770002SRichard Henderson     /* Note that we don't fold past bytes */
292fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
293fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
294fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
295fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
296fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
297fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
298fcf5ef2aSThomas Huth     return val;
299fcf5ef2aSThomas Huth }
300fcf5ef2aSThomas Huth 
301fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val)
302fcf5ef2aSThomas Huth {
30379770002SRichard Henderson     /* Note that we don't fold past words.  */
304fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
305fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
306fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
307fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
308fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
309fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
310fcf5ef2aSThomas Huth     val = (val & 0x00ff00ff00ff00ffULL) + ((val >>  8) &
311fcf5ef2aSThomas Huth                                            0x00ff00ff00ff00ffULL);
312fcf5ef2aSThomas Huth     val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) &
313fcf5ef2aSThomas Huth                                            0x0000ffff0000ffffULL);
314fcf5ef2aSThomas Huth     return val;
315fcf5ef2aSThomas Huth }
316fcf5ef2aSThomas Huth #else
317fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
318fcf5ef2aSThomas Huth {
31979770002SRichard Henderson     /* Note that we don't fold past bytes */
320fcf5ef2aSThomas Huth     val = (val & 0x55555555) + ((val >>  1) & 0x55555555);
321fcf5ef2aSThomas Huth     val = (val & 0x33333333) + ((val >>  2) & 0x33333333);
322fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f) + ((val >>  4) & 0x0f0f0f0f);
323fcf5ef2aSThomas Huth     return val;
324fcf5ef2aSThomas Huth }
325fcf5ef2aSThomas Huth #endif
326fcf5ef2aSThomas Huth 
/*
 * Centrifuge doubleword.
 *
 * The bits of 'src' whose corresponding 'mask' bit is 1 are gathered, in
 * their original order, into the low-order end of the result; the bits whose
 * mask bit is 0 are gathered, in order, into the high-order end.
 */
uint64_t helper_CFUGED(uint64_t src, uint64_t mask)
{
    /*
     * Instead of processing the mask bit-by-bit from the most significant to
     * the least significant bit, as described in PowerISA, we'll handle it in
     * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use
     * ctz or cto, we negate the mask at the end of the loop.
     */
    /*
     * The accumulators are always 64 bits wide, whatever the width of
     * target_ulong, because they hold ror64() results.
     */
    uint64_t m, left = 0, right = 0;
    unsigned int n, i = 64;
    bool bit = false; /* tracks if we are processing zeros or ones */

    /* With a uniform mask there is nothing to separate. */
    if (mask == 0 || mask == UINT64_MAX) {
        return src;
    }

    /* Processes the mask in blocks, from LSB to MSB */
    while (i) {
        /* Find how many bits we should take */
        n = ctz64(mask);
        if (n > i) {
            n = i;
        }

        /*
         * Extracts 'n' trailing bits of src and put them on the leading 'n'
         * bits of 'right' or 'left', pushing down the previously extracted
         * values. The shift is done on an unsigned 1 so that n == 63 does
         * not overflow a signed type.
         */
        m = (UINT64_C(1) << n) - 1;
        if (bit) {
            right = ror64(right | (src & m), n);
        } else {
            left = ror64(left | (src & m), n);
        }

        /*
         * Discards the processed bits from 'src' and 'mask'. Note that we are
         * removing 'n' trailing zeros from 'mask', but the logical shift will
         * add 'n' leading zeros back, so the population count of 'mask' is kept
         * the same.
         */
        src >>= n;
        mask >>= n;
        i -= n;
        bit = !bit;
        mask = ~mask;
    }

    /*
     * At the end, 'right' has been rotated by ctpop(mask) bits in total. To
     * put it back in place, shift it right by a further 64 - ctpop(mask)
     * bits. 'mask' is inverted at this point when 'bit' is set, in which case
     * its population count already is that complement.
     */
    if (bit) {
        n = ctpop64(mask);
    } else {
        n = 64 - ctpop64(mask);
    }

    return left | (right >> n);
}
38889ccd7dcSMatheus Ferst 
/*
 * Parallel bits deposit doubleword.
 *
 * Successive low-order bits of 'src' (bit 0, 1, 2, ...) are placed at the
 * positions of the set bits of 'mask', taken from the least significant set
 * bit upwards.  Result bits where 'mask' is 0 are 0.
 */
uint64_t helper_PDEPD(uint64_t src, uint64_t mask)
{
    uint64_t result = 0;
    int taken = 0;

    /* An all-ones mask maps every bit onto itself. */
    if (mask == -1) {
        return src;
    }

    while (mask != 0) {
        const int dst = ctz64(mask);

        result |= ((src >> taken) & 1) << dst;
        taken++;
        mask &= mask - 1; /* clear the lowest set bit */
    }

    return result;
}
4068bdb7606SMatheus Ferst 
/*
 * Parallel bits extract doubleword.
 *
 * The bits of 'src' at the positions of the set bits of 'mask', taken from
 * the least significant set bit upwards, are packed into successive
 * low-order bits (bit 0, 1, 2, ...) of the result.  The remaining result
 * bits are 0.
 */
uint64_t helper_PEXTD(uint64_t src, uint64_t mask)
{
    uint64_t result = 0;
    int packed = 0;

    /* An all-ones mask maps every bit onto itself. */
    if (mask == -1) {
        return src;
    }

    while (mask != 0) {
        const int from = ctz64(mask);

        result |= ((src >> from) & 1) << packed;
        packed++;
        mask &= mask - 1; /* clear the lowest set bit */
    }

    return result;
}
42421ba6e58SMatheus Ferst 
425fcf5ef2aSThomas Huth /*****************************************************************************/
426fcf5ef2aSThomas Huth /* PowerPC 601 specific instructions (POWER bridge) */
427fcf5ef2aSThomas Huth target_ulong helper_div(CPUPPCState *env, target_ulong arg1, target_ulong arg2)
428fcf5ef2aSThomas Huth {
429fcf5ef2aSThomas Huth     uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ];
430fcf5ef2aSThomas Huth 
431fcf5ef2aSThomas Huth     if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) ||
432fcf5ef2aSThomas Huth         (int32_t)arg2 == 0) {
433fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = 0;
434fcf5ef2aSThomas Huth         return INT32_MIN;
435fcf5ef2aSThomas Huth     } else {
436fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = tmp % arg2;
437fcf5ef2aSThomas Huth         return  tmp / (int32_t)arg2;
438fcf5ef2aSThomas Huth     }
439fcf5ef2aSThomas Huth }
440fcf5ef2aSThomas Huth 
441fcf5ef2aSThomas Huth target_ulong helper_divo(CPUPPCState *env, target_ulong arg1,
442fcf5ef2aSThomas Huth                          target_ulong arg2)
443fcf5ef2aSThomas Huth {
444fcf5ef2aSThomas Huth     uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ];
445fcf5ef2aSThomas Huth 
446fcf5ef2aSThomas Huth     if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) ||
447fcf5ef2aSThomas Huth         (int32_t)arg2 == 0) {
448fcf5ef2aSThomas Huth         env->so = env->ov = 1;
449fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = 0;
450fcf5ef2aSThomas Huth         return INT32_MIN;
451fcf5ef2aSThomas Huth     } else {
452fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = tmp % arg2;
453fcf5ef2aSThomas Huth         tmp /= (int32_t)arg2;
454fcf5ef2aSThomas Huth         if ((int32_t)tmp != tmp) {
455fcf5ef2aSThomas Huth             env->so = env->ov = 1;
456fcf5ef2aSThomas Huth         } else {
457fcf5ef2aSThomas Huth             env->ov = 0;
458fcf5ef2aSThomas Huth         }
459fcf5ef2aSThomas Huth         return tmp;
460fcf5ef2aSThomas Huth     }
461fcf5ef2aSThomas Huth }
462fcf5ef2aSThomas Huth 
463fcf5ef2aSThomas Huth target_ulong helper_divs(CPUPPCState *env, target_ulong arg1,
464fcf5ef2aSThomas Huth                          target_ulong arg2)
465fcf5ef2aSThomas Huth {
466fcf5ef2aSThomas Huth     if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) ||
467fcf5ef2aSThomas Huth         (int32_t)arg2 == 0) {
468fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = 0;
469fcf5ef2aSThomas Huth         return INT32_MIN;
470fcf5ef2aSThomas Huth     } else {
471fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2;
472fcf5ef2aSThomas Huth         return (int32_t)arg1 / (int32_t)arg2;
473fcf5ef2aSThomas Huth     }
474fcf5ef2aSThomas Huth }
475fcf5ef2aSThomas Huth 
476fcf5ef2aSThomas Huth target_ulong helper_divso(CPUPPCState *env, target_ulong arg1,
477fcf5ef2aSThomas Huth                           target_ulong arg2)
478fcf5ef2aSThomas Huth {
479fcf5ef2aSThomas Huth     if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) ||
480fcf5ef2aSThomas Huth         (int32_t)arg2 == 0) {
481fcf5ef2aSThomas Huth         env->so = env->ov = 1;
482fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = 0;
483fcf5ef2aSThomas Huth         return INT32_MIN;
484fcf5ef2aSThomas Huth     } else {
485fcf5ef2aSThomas Huth         env->ov = 0;
486fcf5ef2aSThomas Huth         env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2;
487fcf5ef2aSThomas Huth         return (int32_t)arg1 / (int32_t)arg2;
488fcf5ef2aSThomas Huth     }
489fcf5ef2aSThomas Huth }
490fcf5ef2aSThomas Huth 
491fcf5ef2aSThomas Huth /*****************************************************************************/
492fcf5ef2aSThomas Huth /* 602 specific instructions */
493fcf5ef2aSThomas Huth /* mfrom is the most crazy instruction ever seen, imho ! */
494fcf5ef2aSThomas Huth /* Real implementation uses a ROM table. Do the same */
495b6cb41b2SDavid Gibson /*
496b6cb41b2SDavid Gibson  * Extremely decomposed:
497fcf5ef2aSThomas Huth  *                      -arg / 256
498fcf5ef2aSThomas Huth  * return 256 * log10(10           + 1.0) + 0.5
499fcf5ef2aSThomas Huth  */
500fcf5ef2aSThomas Huth #if !defined(CONFIG_USER_ONLY)
501fcf5ef2aSThomas Huth target_ulong helper_602_mfrom(target_ulong arg)
502fcf5ef2aSThomas Huth {
503fcf5ef2aSThomas Huth     if (likely(arg < 602)) {
504139c1837SPaolo Bonzini #include "mfrom_table.c.inc"
505fcf5ef2aSThomas Huth         return mfrom_ROM_table[arg];
506fcf5ef2aSThomas Huth     } else {
507fcf5ef2aSThomas Huth         return 0;
508fcf5ef2aSThomas Huth     }
509fcf5ef2aSThomas Huth }
510fcf5ef2aSThomas Huth #endif
511fcf5ef2aSThomas Huth 
512fcf5ef2aSThomas Huth /*****************************************************************************/
513fcf5ef2aSThomas Huth /* Altivec extension helpers */
/*
 * Loop header that walks 'index' over every slot of r->element: ascending
 * when HOST_WORDS_BIGENDIAN is defined, descending otherwise.
 *
 * The macro expects a variable named 'r' in scope at the point of use, and
 * 'index' must be a signed variable for the descending form to terminate.
 */
#if !defined(HOST_WORDS_BIGENDIAN)
#define VECTOR_FOR_INORDER_I(index, element)                    \
    for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--)
#else
#define VECTOR_FOR_INORDER_I(index, element)                    \
    for (index = 0; index < ARRAY_SIZE(r->element); index++)
#endif
521fcf5ef2aSThomas Huth 
/*
 * Saturating conversion helpers.
 *
 * Each instantiation defines cvt<from><to>(x, sat), which narrows 'x' to
 * to_type.  A value outside [min, max] is clamped to the nearest bound and
 * *sat is set to 1; *sat is never cleared, so it accumulates over several
 * calls.  SATCVTU only checks the upper bound and is used for unsigned
 * sources.
 */
#define SATCVT(from, to, from_type, to_type, min, max)          \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x < (from_type)min) {                               \
            *sat = 1;                                           \
            return min;                                         \
        }                                                       \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }
#define SATCVTU(from, to, from_type, to_type, min, max)         \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }

/* signed -> narrower signed */
SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX)
SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX)
SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX)

/* unsigned -> narrower unsigned */
SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX)
SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX)
SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX)

/* signed -> narrower unsigned */
SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX)
SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX)
SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX)
#undef SATCVT
#undef SATCVTU
564fcf5ef2aSThomas Huth 
565dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr)
566fcf5ef2aSThomas Huth {
567c19940dbSBruno Larsen (billionai)     ppc_store_vscr(env, vscr);
568fcf5ef2aSThomas Huth }
569fcf5ef2aSThomas Huth 
570cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env)
571cc2b90d7SRichard Henderson {
572c19940dbSBruno Larsen (billionai)     return ppc_get_vscr(env);
573cc2b90d7SRichard Henderson }
574cc2b90d7SRichard Henderson 
5756175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env)
5766175f5a0SRichard Henderson {
5779b5b74daSRichard Henderson     /* The choice of non-zero value is arbitrary.  */
5789b5b74daSRichard Henderson     env->vscr_sat.u32[0] = 1;
5796175f5a0SRichard Henderson }
5806175f5a0SRichard Henderson 
581fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
582fcf5ef2aSThomas Huth {
583fcf5ef2aSThomas Huth     int i;
584fcf5ef2aSThomas Huth 
585fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
586fcf5ef2aSThomas Huth         r->u32[i] = ~a->u32[i] < b->u32[i];
587fcf5ef2aSThomas Huth     }
588fcf5ef2aSThomas Huth }
589fcf5ef2aSThomas Huth 
590fcf5ef2aSThomas Huth /* vprtybw */
591fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b)
592fcf5ef2aSThomas Huth {
593fcf5ef2aSThomas Huth     int i;
594fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
595fcf5ef2aSThomas Huth         uint64_t res = b->u32[i] ^ (b->u32[i] >> 16);
596fcf5ef2aSThomas Huth         res ^= res >> 8;
597fcf5ef2aSThomas Huth         r->u32[i] = res & 1;
598fcf5ef2aSThomas Huth     }
599fcf5ef2aSThomas Huth }
600fcf5ef2aSThomas Huth 
601fcf5ef2aSThomas Huth /* vprtybd */
602fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b)
603fcf5ef2aSThomas Huth {
604fcf5ef2aSThomas Huth     int i;
605fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
606fcf5ef2aSThomas Huth         uint64_t res = b->u64[i] ^ (b->u64[i] >> 32);
607fcf5ef2aSThomas Huth         res ^= res >> 16;
608fcf5ef2aSThomas Huth         res ^= res >> 8;
609fcf5ef2aSThomas Huth         r->u64[i] = res & 1;
610fcf5ef2aSThomas Huth     }
611fcf5ef2aSThomas Huth }
612fcf5ef2aSThomas Huth 
613fcf5ef2aSThomas Huth /* vprtybq */
614fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b)
615fcf5ef2aSThomas Huth {
616fcf5ef2aSThomas Huth     uint64_t res = b->u64[0] ^ b->u64[1];
617fcf5ef2aSThomas Huth     res ^= res >> 32;
618fcf5ef2aSThomas Huth     res ^= res >> 16;
619fcf5ef2aSThomas Huth     res ^= res >> 8;
6203c385a93SMark Cave-Ayland     r->VsrD(1) = res & 1;
6213c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
622fcf5ef2aSThomas Huth }
623fcf5ef2aSThomas Huth 
624fcf5ef2aSThomas Huth #define VARITHFP(suffix, func)                                          \
625fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
626fcf5ef2aSThomas Huth                           ppc_avr_t *b)                                 \
627fcf5ef2aSThomas Huth     {                                                                   \
628fcf5ef2aSThomas Huth         int i;                                                          \
629fcf5ef2aSThomas Huth                                                                         \
63005ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
63105ee3e8aSMark Cave-Ayland             r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status);   \
632fcf5ef2aSThomas Huth         }                                                               \
633fcf5ef2aSThomas Huth     }
634fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add)
635fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub)
636fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min)
637fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max)
638fcf5ef2aSThomas Huth #undef VARITHFP
639fcf5ef2aSThomas Huth 
640fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type)                                       \
641fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
642fcf5ef2aSThomas Huth                            ppc_avr_t *b, ppc_avr_t *c)                  \
643fcf5ef2aSThomas Huth     {                                                                   \
644fcf5ef2aSThomas Huth         int i;                                                          \
64505ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
64605ee3e8aSMark Cave-Ayland             r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \
647fcf5ef2aSThomas Huth                                        type, &env->vec_status);         \
648fcf5ef2aSThomas Huth         }                                                               \
649fcf5ef2aSThomas Huth     }
650fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0);
651fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c);
652fcf5ef2aSThomas Huth #undef VARITHFPFMA
653fcf5ef2aSThomas Huth 
654fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element)                          \
655fcf5ef2aSThomas Huth     {                                                                   \
656fcf5ef2aSThomas Huth         type result = (type)a->element[i] op (type)b->element[i];       \
657fcf5ef2aSThomas Huth         r->element[i] = cvt(result, &sat);                              \
658fcf5ef2aSThomas Huth     }
659fcf5ef2aSThomas Huth 
660fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element)                    \
661fb11ae7dSRichard Henderson     void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat,              \
662fb11ae7dSRichard Henderson                         ppc_avr_t *a, ppc_avr_t *b, uint32_t desc)      \
663fcf5ef2aSThomas Huth     {                                                                   \
664fcf5ef2aSThomas Huth         int sat = 0;                                                    \
665fcf5ef2aSThomas Huth         int i;                                                          \
666fcf5ef2aSThomas Huth                                                                         \
667fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
668fcf5ef2aSThomas Huth             VARITHSAT_CASE(optype, op, cvt, element);                   \
669fcf5ef2aSThomas Huth         }                                                               \
670fcf5ef2aSThomas Huth         if (sat) {                                                      \
671fb11ae7dSRichard Henderson             vscr_sat->u32[0] = 1;                                       \
672fcf5ef2aSThomas Huth         }                                                               \
673fcf5ef2aSThomas Huth     }
674fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt)          \
675fcf5ef2aSThomas Huth     VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element)      \
676fcf5ef2aSThomas Huth     VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element)
677fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt)        \
678fcf5ef2aSThomas Huth     VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element)      \
679fcf5ef2aSThomas Huth     VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element)
680fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb)
681fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh)
682fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw)
683fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub)
684fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh)
685fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw)
686fcf5ef2aSThomas Huth #undef VARITHSAT_CASE
687fcf5ef2aSThomas Huth #undef VARITHSAT_DO
688fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED
689fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED
690fcf5ef2aSThomas Huth 
691fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype)                                   \
692fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
693fcf5ef2aSThomas Huth     {                                                                   \
694fcf5ef2aSThomas Huth         int i;                                                          \
695fcf5ef2aSThomas Huth                                                                         \
696fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
697fcf5ef2aSThomas Huth             etype x = (etype)a->element[i] + (etype)b->element[i] + 1;  \
698fcf5ef2aSThomas Huth             r->element[i] = x >> 1;                                     \
699fcf5ef2aSThomas Huth         }                                                               \
700fcf5ef2aSThomas Huth     }
701fcf5ef2aSThomas Huth 
702fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element,       \
703fcf5ef2aSThomas Huth              unsigned_type)                                             \
704fcf5ef2aSThomas Huth     VAVG_DO(avgs##type, signed_element, signed_type)                    \
705fcf5ef2aSThomas Huth     VAVG_DO(avgu##type, unsigned_element, unsigned_type)
706fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t)
707fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t)
708fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t)
709fcf5ef2aSThomas Huth #undef VAVG_DO
710fcf5ef2aSThomas Huth #undef VAVG
711fcf5ef2aSThomas Huth 
712fcf5ef2aSThomas Huth #define VABSDU_DO(name, element)                                        \
713fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)           \
714fcf5ef2aSThomas Huth {                                                                       \
715fcf5ef2aSThomas Huth     int i;                                                              \
716fcf5ef2aSThomas Huth                                                                         \
717fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                      \
718fcf5ef2aSThomas Huth         r->element[i] = (a->element[i] > b->element[i]) ?               \
719fcf5ef2aSThomas Huth             (a->element[i] - b->element[i]) :                           \
720fcf5ef2aSThomas Huth             (b->element[i] - a->element[i]);                            \
721fcf5ef2aSThomas Huth     }                                                                   \
722fcf5ef2aSThomas Huth }
723fcf5ef2aSThomas Huth 
724b6cb41b2SDavid Gibson /*
725b6cb41b2SDavid Gibson  * VABSDU - Vector absolute difference unsigned
726fcf5ef2aSThomas Huth  *   name    - instruction mnemonic suffix (b: byte, h: halfword, w: word)
727fcf5ef2aSThomas Huth  *   element - element type to access from vector
728fcf5ef2aSThomas Huth  */
729fcf5ef2aSThomas Huth #define VABSDU(type, element)                   \
730fcf5ef2aSThomas Huth     VABSDU_DO(absdu##type, element)
731fcf5ef2aSThomas Huth VABSDU(b, u8)
732fcf5ef2aSThomas Huth VABSDU(h, u16)
733fcf5ef2aSThomas Huth VABSDU(w, u32)
734fcf5ef2aSThomas Huth #undef VABSDU_DO
735fcf5ef2aSThomas Huth #undef VABSDU
736fcf5ef2aSThomas Huth 
737fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element)                                       \
738fcf5ef2aSThomas Huth     void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r,             \
739fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
740fcf5ef2aSThomas Huth     {                                                                   \
741fcf5ef2aSThomas Huth         int i;                                                          \
742fcf5ef2aSThomas Huth                                                                         \
74305ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
744fcf5ef2aSThomas Huth             float32 t = cvt(b->element[i], &env->vec_status);           \
74505ee3e8aSMark Cave-Ayland             r->f32[i] = float32_scalbn(t, -uim, &env->vec_status);      \
746fcf5ef2aSThomas Huth         }                                                               \
747fcf5ef2aSThomas Huth     }
748fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32)
749fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32)
750fcf5ef2aSThomas Huth #undef VCF
751fcf5ef2aSThomas Huth 
752fcf5ef2aSThomas Huth #define VCMP_DO(suffix, compare, element, record)                       \
753fcf5ef2aSThomas Huth     void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r,            \
754fcf5ef2aSThomas Huth                              ppc_avr_t *a, ppc_avr_t *b)                \
755fcf5ef2aSThomas Huth     {                                                                   \
756fcf5ef2aSThomas Huth         uint64_t ones = (uint64_t)-1;                                   \
757fcf5ef2aSThomas Huth         uint64_t all = ones;                                            \
758fcf5ef2aSThomas Huth         uint64_t none = 0;                                              \
759fcf5ef2aSThomas Huth         int i;                                                          \
760fcf5ef2aSThomas Huth                                                                         \
761fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
762fcf5ef2aSThomas Huth             uint64_t result = (a->element[i] compare b->element[i] ?    \
763fcf5ef2aSThomas Huth                                ones : 0x0);                             \
764fcf5ef2aSThomas Huth             switch (sizeof(a->element[0])) {                            \
765fcf5ef2aSThomas Huth             case 8:                                                     \
766fcf5ef2aSThomas Huth                 r->u64[i] = result;                                     \
767fcf5ef2aSThomas Huth                 break;                                                  \
768fcf5ef2aSThomas Huth             case 4:                                                     \
769fcf5ef2aSThomas Huth                 r->u32[i] = result;                                     \
770fcf5ef2aSThomas Huth                 break;                                                  \
771fcf5ef2aSThomas Huth             case 2:                                                     \
772fcf5ef2aSThomas Huth                 r->u16[i] = result;                                     \
773fcf5ef2aSThomas Huth                 break;                                                  \
774fcf5ef2aSThomas Huth             case 1:                                                     \
775fcf5ef2aSThomas Huth                 r->u8[i] = result;                                      \
776fcf5ef2aSThomas Huth                 break;                                                  \
777fcf5ef2aSThomas Huth             }                                                           \
778fcf5ef2aSThomas Huth             all &= result;                                              \
779fcf5ef2aSThomas Huth             none |= result;                                             \
780fcf5ef2aSThomas Huth         }                                                               \
781fcf5ef2aSThomas Huth         if (record) {                                                   \
782fcf5ef2aSThomas Huth             env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1);       \
783fcf5ef2aSThomas Huth         }                                                               \
784fcf5ef2aSThomas Huth     }
785fcf5ef2aSThomas Huth #define VCMP(suffix, compare, element)          \
786fcf5ef2aSThomas Huth     VCMP_DO(suffix, compare, element, 0)        \
787fcf5ef2aSThomas Huth     VCMP_DO(suffix##_dot, compare, element, 1)
788fcf5ef2aSThomas Huth VCMP(equb, ==, u8)
789fcf5ef2aSThomas Huth VCMP(equh, ==, u16)
790fcf5ef2aSThomas Huth VCMP(equw, ==, u32)
791fcf5ef2aSThomas Huth VCMP(equd, ==, u64)
792fcf5ef2aSThomas Huth VCMP(gtub, >, u8)
793fcf5ef2aSThomas Huth VCMP(gtuh, >, u16)
794fcf5ef2aSThomas Huth VCMP(gtuw, >, u32)
795fcf5ef2aSThomas Huth VCMP(gtud, >, u64)
796fcf5ef2aSThomas Huth VCMP(gtsb, >, s8)
797fcf5ef2aSThomas Huth VCMP(gtsh, >, s16)
798fcf5ef2aSThomas Huth VCMP(gtsw, >, s32)
799fcf5ef2aSThomas Huth VCMP(gtsd, >, s64)
800fcf5ef2aSThomas Huth #undef VCMP_DO
801fcf5ef2aSThomas Huth #undef VCMP
802fcf5ef2aSThomas Huth 
803fcf5ef2aSThomas Huth #define VCMPNE_DO(suffix, element, etype, cmpzero, record)              \
804fcf5ef2aSThomas Huth void helper_vcmpne##suffix(CPUPPCState *env, ppc_avr_t *r,              \
805fcf5ef2aSThomas Huth                             ppc_avr_t *a, ppc_avr_t *b)                 \
806fcf5ef2aSThomas Huth {                                                                       \
807fcf5ef2aSThomas Huth     etype ones = (etype)-1;                                             \
808fcf5ef2aSThomas Huth     etype all = ones;                                                   \
809fcf5ef2aSThomas Huth     etype result, none = 0;                                             \
810fcf5ef2aSThomas Huth     int i;                                                              \
811fcf5ef2aSThomas Huth                                                                         \
812fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                      \
813fcf5ef2aSThomas Huth         if (cmpzero) {                                                  \
814fcf5ef2aSThomas Huth             result = ((a->element[i] == 0)                              \
815fcf5ef2aSThomas Huth                            || (b->element[i] == 0)                      \
816fcf5ef2aSThomas Huth                            || (a->element[i] != b->element[i]) ?        \
817fcf5ef2aSThomas Huth                            ones : 0x0);                                 \
818fcf5ef2aSThomas Huth         } else {                                                        \
819fcf5ef2aSThomas Huth             result = (a->element[i] != b->element[i]) ? ones : 0x0;     \
820fcf5ef2aSThomas Huth         }                                                               \
821fcf5ef2aSThomas Huth         r->element[i] = result;                                         \
822fcf5ef2aSThomas Huth         all &= result;                                                  \
823fcf5ef2aSThomas Huth         none |= result;                                                 \
824fcf5ef2aSThomas Huth     }                                                                   \
825fcf5ef2aSThomas Huth     if (record) {                                                       \
826fcf5ef2aSThomas Huth         env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1);           \
827fcf5ef2aSThomas Huth     }                                                                   \
828fcf5ef2aSThomas Huth }
829fcf5ef2aSThomas Huth 
830b6cb41b2SDavid Gibson /*
831b6cb41b2SDavid Gibson  * VCMPNEZ - Vector compare not equal to zero
832fcf5ef2aSThomas Huth  *   suffix  - instruction mnemonic suffix (b: byte, h: halfword, w: word)
833fcf5ef2aSThomas Huth  *   element - element type to access from vector
834fcf5ef2aSThomas Huth  */
835fcf5ef2aSThomas Huth #define VCMPNE(suffix, element, etype, cmpzero)         \
836fcf5ef2aSThomas Huth     VCMPNE_DO(suffix, element, etype, cmpzero, 0)       \
837fcf5ef2aSThomas Huth     VCMPNE_DO(suffix##_dot, element, etype, cmpzero, 1)
838fcf5ef2aSThomas Huth VCMPNE(zb, u8, uint8_t, 1)
839fcf5ef2aSThomas Huth VCMPNE(zh, u16, uint16_t, 1)
840fcf5ef2aSThomas Huth VCMPNE(zw, u32, uint32_t, 1)
841fcf5ef2aSThomas Huth VCMPNE(b, u8, uint8_t, 0)
842fcf5ef2aSThomas Huth VCMPNE(h, u16, uint16_t, 0)
843fcf5ef2aSThomas Huth VCMPNE(w, u32, uint32_t, 0)
844fcf5ef2aSThomas Huth #undef VCMPNE_DO
845fcf5ef2aSThomas Huth #undef VCMPNE
846fcf5ef2aSThomas Huth 
847fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record)                       \
848fcf5ef2aSThomas Huth     void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r,            \
849fcf5ef2aSThomas Huth                              ppc_avr_t *a, ppc_avr_t *b)                \
850fcf5ef2aSThomas Huth     {                                                                   \
851fcf5ef2aSThomas Huth         uint32_t ones = (uint32_t)-1;                                   \
852fcf5ef2aSThomas Huth         uint32_t all = ones;                                            \
853fcf5ef2aSThomas Huth         uint32_t none = 0;                                              \
854fcf5ef2aSThomas Huth         int i;                                                          \
855fcf5ef2aSThomas Huth                                                                         \
85605ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
857fcf5ef2aSThomas Huth             uint32_t result;                                            \
85871bfd65cSRichard Henderson             FloatRelation rel =                                         \
85971bfd65cSRichard Henderson                 float32_compare_quiet(a->f32[i], b->f32[i],             \
860fcf5ef2aSThomas Huth                                       &env->vec_status);                \
861fcf5ef2aSThomas Huth             if (rel == float_relation_unordered) {                      \
862fcf5ef2aSThomas Huth                 result = 0;                                             \
863fcf5ef2aSThomas Huth             } else if (rel compare order) {                             \
864fcf5ef2aSThomas Huth                 result = ones;                                          \
865fcf5ef2aSThomas Huth             } else {                                                    \
866fcf5ef2aSThomas Huth                 result = 0;                                             \
867fcf5ef2aSThomas Huth             }                                                           \
868fcf5ef2aSThomas Huth             r->u32[i] = result;                                         \
869fcf5ef2aSThomas Huth             all &= result;                                              \
870fcf5ef2aSThomas Huth             none |= result;                                             \
871fcf5ef2aSThomas Huth         }                                                               \
872fcf5ef2aSThomas Huth         if (record) {                                                   \
873fcf5ef2aSThomas Huth             env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1);       \
874fcf5ef2aSThomas Huth         }                                                               \
875fcf5ef2aSThomas Huth     }
876fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order)          \
877fcf5ef2aSThomas Huth     VCMPFP_DO(suffix, compare, order, 0)        \
878fcf5ef2aSThomas Huth     VCMPFP_DO(suffix##_dot, compare, order, 1)
879fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal)
880fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less)
881fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater)
882fcf5ef2aSThomas Huth #undef VCMPFP_DO
883fcf5ef2aSThomas Huth #undef VCMPFP
884fcf5ef2aSThomas Huth 
885fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r,
886fcf5ef2aSThomas Huth                                     ppc_avr_t *a, ppc_avr_t *b, int record)
887fcf5ef2aSThomas Huth {
888fcf5ef2aSThomas Huth     int i;
889fcf5ef2aSThomas Huth     int all_in = 0;
890fcf5ef2aSThomas Huth 
89105ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
89271bfd65cSRichard Henderson         FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i],
89305ee3e8aSMark Cave-Ayland                                                      &env->vec_status);
894fcf5ef2aSThomas Huth         if (le_rel == float_relation_unordered) {
895fcf5ef2aSThomas Huth             r->u32[i] = 0xc0000000;
896fcf5ef2aSThomas Huth             all_in = 1;
897fcf5ef2aSThomas Huth         } else {
89805ee3e8aSMark Cave-Ayland             float32 bneg = float32_chs(b->f32[i]);
89971bfd65cSRichard Henderson             FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg,
90005ee3e8aSMark Cave-Ayland                                                          &env->vec_status);
901fcf5ef2aSThomas Huth             int le = le_rel != float_relation_greater;
902fcf5ef2aSThomas Huth             int ge = ge_rel != float_relation_less;
903fcf5ef2aSThomas Huth 
904fcf5ef2aSThomas Huth             r->u32[i] = ((!le) << 31) | ((!ge) << 30);
905fcf5ef2aSThomas Huth             all_in |= (!le | !ge);
906fcf5ef2aSThomas Huth         }
907fcf5ef2aSThomas Huth     }
908fcf5ef2aSThomas Huth     if (record) {
909fcf5ef2aSThomas Huth         env->crf[6] = (all_in == 0) << 1;
910fcf5ef2aSThomas Huth     }
911fcf5ef2aSThomas Huth }
912fcf5ef2aSThomas Huth 
913fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
914fcf5ef2aSThomas Huth {
915fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 0);
916fcf5ef2aSThomas Huth }
917fcf5ef2aSThomas Huth 
918fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
919fcf5ef2aSThomas Huth                         ppc_avr_t *b)
920fcf5ef2aSThomas Huth {
921fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 1);
922fcf5ef2aSThomas Huth }
923fcf5ef2aSThomas Huth 
924fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element)                                    \
925fcf5ef2aSThomas Huth     void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r,             \
926fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
927fcf5ef2aSThomas Huth     {                                                                   \
928fcf5ef2aSThomas Huth         int i;                                                          \
929fcf5ef2aSThomas Huth         int sat = 0;                                                    \
930fcf5ef2aSThomas Huth         float_status s = env->vec_status;                               \
931fcf5ef2aSThomas Huth                                                                         \
932fcf5ef2aSThomas Huth         set_float_rounding_mode(float_round_to_zero, &s);               \
93305ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
93405ee3e8aSMark Cave-Ayland             if (float32_is_any_nan(b->f32[i])) {                        \
935fcf5ef2aSThomas Huth                 r->element[i] = 0;                                      \
936fcf5ef2aSThomas Huth             } else {                                                    \
93705ee3e8aSMark Cave-Ayland                 float64 t = float32_to_float64(b->f32[i], &s);          \
938fcf5ef2aSThomas Huth                 int64_t j;                                              \
939fcf5ef2aSThomas Huth                                                                         \
940fcf5ef2aSThomas Huth                 t = float64_scalbn(t, uim, &s);                         \
941fcf5ef2aSThomas Huth                 j = float64_to_int64(t, &s);                            \
942fcf5ef2aSThomas Huth                 r->element[i] = satcvt(j, &sat);                        \
943fcf5ef2aSThomas Huth             }                                                           \
944fcf5ef2aSThomas Huth         }                                                               \
945fcf5ef2aSThomas Huth         if (sat) {                                                      \
9466175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
947fcf5ef2aSThomas Huth         }                                                               \
948fcf5ef2aSThomas Huth     }
949fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32)
950fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32)
951fcf5ef2aSThomas Huth #undef VCT
952fcf5ef2aSThomas Huth 
953fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r)
954fcf5ef2aSThomas Huth {
955fcf5ef2aSThomas Huth     target_ulong count = 0;
956fcf5ef2aSThomas Huth     int i;
95760594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
95860594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
959fcf5ef2aSThomas Huth             break;
960fcf5ef2aSThomas Huth         }
961fcf5ef2aSThomas Huth         count++;
962fcf5ef2aSThomas Huth     }
963fcf5ef2aSThomas Huth     return count;
964fcf5ef2aSThomas Huth }
965fcf5ef2aSThomas Huth 
966fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r)
967fcf5ef2aSThomas Huth {
968fcf5ef2aSThomas Huth     target_ulong count = 0;
969fcf5ef2aSThomas Huth     int i;
970fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
97160594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
972fcf5ef2aSThomas Huth             break;
973fcf5ef2aSThomas Huth         }
974fcf5ef2aSThomas Huth         count++;
975fcf5ef2aSThomas Huth     }
976fcf5ef2aSThomas Huth     return count;
977fcf5ef2aSThomas Huth }
978fcf5ef2aSThomas Huth 
979fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
980fcf5ef2aSThomas Huth                       ppc_avr_t *b, ppc_avr_t *c)
981fcf5ef2aSThomas Huth {
982fcf5ef2aSThomas Huth     int sat = 0;
983fcf5ef2aSThomas Huth     int i;
984fcf5ef2aSThomas Huth 
985fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
986fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
987fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
988fcf5ef2aSThomas Huth 
989fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
990fcf5ef2aSThomas Huth     }
991fcf5ef2aSThomas Huth 
992fcf5ef2aSThomas Huth     if (sat) {
9936175f5a0SRichard Henderson         set_vscr_sat(env);
994fcf5ef2aSThomas Huth     }
995fcf5ef2aSThomas Huth }
996fcf5ef2aSThomas Huth 
997fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
998fcf5ef2aSThomas Huth                        ppc_avr_t *b, ppc_avr_t *c)
999fcf5ef2aSThomas Huth {
1000fcf5ef2aSThomas Huth     int sat = 0;
1001fcf5ef2aSThomas Huth     int i;
1002fcf5ef2aSThomas Huth 
1003fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
1004fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i] + 0x00004000;
1005fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
1006fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
1007fcf5ef2aSThomas Huth     }
1008fcf5ef2aSThomas Huth 
1009fcf5ef2aSThomas Huth     if (sat) {
10106175f5a0SRichard Henderson         set_vscr_sat(env);
1011fcf5ef2aSThomas Huth     }
1012fcf5ef2aSThomas Huth }
1013fcf5ef2aSThomas Huth 
1014fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1015fcf5ef2aSThomas Huth {
1016fcf5ef2aSThomas Huth     int i;
1017fcf5ef2aSThomas Huth 
1018fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
1019fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
1020fcf5ef2aSThomas Huth         r->s16[i] = (int16_t) (prod + c->s16[i]);
1021fcf5ef2aSThomas Huth     }
1022fcf5ef2aSThomas Huth }
1023fcf5ef2aSThomas Huth 
1024d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs)                                  \
1025fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)            \
1026fcf5ef2aSThomas Huth     {                                                                        \
1027fcf5ef2aSThomas Huth         ppc_avr_t result;                                                    \
1028d81c2040SMark Cave-Ayland         int i, half = ARRAY_SIZE(r->element) / 2;                            \
1029fcf5ef2aSThomas Huth                                                                              \
1030d81c2040SMark Cave-Ayland         for (i = 0; i < half; i++) {                                         \
1031d81c2040SMark Cave-Ayland             result.access(i * 2 + 0) = a->access(i + ofs);                   \
1032d81c2040SMark Cave-Ayland             result.access(i * 2 + 1) = b->access(i + ofs);                   \
1033fcf5ef2aSThomas Huth         }                                                                    \
1034fcf5ef2aSThomas Huth         *r = result;                                                         \
1035fcf5ef2aSThomas Huth     }
1036d81c2040SMark Cave-Ayland 
1037d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access)          \
1038d81c2040SMark Cave-Ayland     VMRG_DO(mrgl##suffix, element, access, half)   \
1039d81c2040SMark Cave-Ayland     VMRG_DO(mrgh##suffix, element, access, 0)
1040d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB)
1041d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH)
1042d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW)
1043fcf5ef2aSThomas Huth #undef VMRG_DO
1044fcf5ef2aSThomas Huth #undef VMRG
1045fcf5ef2aSThomas Huth 
1046fcf5ef2aSThomas Huth void helper_vmsummbm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1047fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1048fcf5ef2aSThomas Huth {
1049fcf5ef2aSThomas Huth     int32_t prod[16];
1050fcf5ef2aSThomas Huth     int i;
1051fcf5ef2aSThomas Huth 
1052fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s8); i++) {
1053fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s8[i] * b->u8[i];
1054fcf5ef2aSThomas Huth     }
1055fcf5ef2aSThomas Huth 
1056fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1057fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] +
1058fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
1059fcf5ef2aSThomas Huth     }
1060fcf5ef2aSThomas Huth }
1061fcf5ef2aSThomas Huth 
1062fcf5ef2aSThomas Huth void helper_vmsumshm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1063fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1064fcf5ef2aSThomas Huth {
1065fcf5ef2aSThomas Huth     int32_t prod[8];
1066fcf5ef2aSThomas Huth     int i;
1067fcf5ef2aSThomas Huth 
1068fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
1069fcf5ef2aSThomas Huth         prod[i] = a->s16[i] * b->s16[i];
1070fcf5ef2aSThomas Huth     }
1071fcf5ef2aSThomas Huth 
1072fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1073fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1];
1074fcf5ef2aSThomas Huth     }
1075fcf5ef2aSThomas Huth }
1076fcf5ef2aSThomas Huth 
1077fcf5ef2aSThomas Huth void helper_vmsumshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1078fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1079fcf5ef2aSThomas Huth {
1080fcf5ef2aSThomas Huth     int32_t prod[8];
1081fcf5ef2aSThomas Huth     int i;
1082fcf5ef2aSThomas Huth     int sat = 0;
1083fcf5ef2aSThomas Huth 
1084fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
1085fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s16[i] * b->s16[i];
1086fcf5ef2aSThomas Huth     }
1087fcf5ef2aSThomas Huth 
1088fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1089fcf5ef2aSThomas Huth         int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1];
1090fcf5ef2aSThomas Huth 
1091fcf5ef2aSThomas Huth         r->u32[i] = cvtsdsw(t, &sat);
1092fcf5ef2aSThomas Huth     }
1093fcf5ef2aSThomas Huth 
1094fcf5ef2aSThomas Huth     if (sat) {
10956175f5a0SRichard Henderson         set_vscr_sat(env);
1096fcf5ef2aSThomas Huth     }
1097fcf5ef2aSThomas Huth }
1098fcf5ef2aSThomas Huth 
1099fcf5ef2aSThomas Huth void helper_vmsumubm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1100fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1101fcf5ef2aSThomas Huth {
1102fcf5ef2aSThomas Huth     uint16_t prod[16];
1103fcf5ef2aSThomas Huth     int i;
1104fcf5ef2aSThomas Huth 
1105fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
1106fcf5ef2aSThomas Huth         prod[i] = a->u8[i] * b->u8[i];
1107fcf5ef2aSThomas Huth     }
1108fcf5ef2aSThomas Huth 
1109fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
1110fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] +
1111fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
1112fcf5ef2aSThomas Huth     }
1113fcf5ef2aSThomas Huth }
1114fcf5ef2aSThomas Huth 
1115fcf5ef2aSThomas Huth void helper_vmsumuhm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1116fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1117fcf5ef2aSThomas Huth {
1118fcf5ef2aSThomas Huth     uint32_t prod[8];
1119fcf5ef2aSThomas Huth     int i;
1120fcf5ef2aSThomas Huth 
1121fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
1122fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
1123fcf5ef2aSThomas Huth     }
1124fcf5ef2aSThomas Huth 
1125fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
1126fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1];
1127fcf5ef2aSThomas Huth     }
1128fcf5ef2aSThomas Huth }
1129fcf5ef2aSThomas Huth 
1130fcf5ef2aSThomas Huth void helper_vmsumuhs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1131fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1132fcf5ef2aSThomas Huth {
1133fcf5ef2aSThomas Huth     uint32_t prod[8];
1134fcf5ef2aSThomas Huth     int i;
1135fcf5ef2aSThomas Huth     int sat = 0;
1136fcf5ef2aSThomas Huth 
1137fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
1138fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
1139fcf5ef2aSThomas Huth     }
1140fcf5ef2aSThomas Huth 
1141fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1142fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1];
1143fcf5ef2aSThomas Huth 
1144fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
1145fcf5ef2aSThomas Huth     }
1146fcf5ef2aSThomas Huth 
1147fcf5ef2aSThomas Huth     if (sat) {
11486175f5a0SRichard Henderson         set_vscr_sat(env);
1149fcf5ef2aSThomas Huth     }
1150fcf5ef2aSThomas Huth }
1151fcf5ef2aSThomas Huth 
11524fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast)   \
1153fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
1154fcf5ef2aSThomas Huth     {                                                                   \
1155fcf5ef2aSThomas Huth         int i;                                                          \
1156fcf5ef2aSThomas Huth                                                                         \
11574fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
11584fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i) *           \
11594fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i);            \
1160fcf5ef2aSThomas Huth         }                                                               \
1161fcf5ef2aSThomas Huth     }
11624fbc89edSMark Cave-Ayland 
11634fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast)   \
11644fbc89edSMark Cave-Ayland     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
11654fbc89edSMark Cave-Ayland     {                                                                   \
11664fbc89edSMark Cave-Ayland         int i;                                                          \
11674fbc89edSMark Cave-Ayland                                                                         \
11684fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
11694fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) *       \
11704fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i + 1);        \
11714fbc89edSMark Cave-Ayland         }                                                               \
11724fbc89edSMark Cave-Ayland     }
11734fbc89edSMark Cave-Ayland 
11744fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast)       \
11754fbc89edSMark Cave-Ayland     VMUL_DO_EVN(mule##suffix, mul_element, mul_access, prod_access, cast)  \
11764fbc89edSMark Cave-Ayland     VMUL_DO_ODD(mulo##suffix, mul_element, mul_access, prod_access, cast)
11774fbc89edSMark Cave-Ayland VMUL(sb, s8, VsrSB, VsrSH, int16_t)
11784fbc89edSMark Cave-Ayland VMUL(sh, s16, VsrSH, VsrSW, int32_t)
11794fbc89edSMark Cave-Ayland VMUL(sw, s32, VsrSW, VsrSD, int64_t)
11804fbc89edSMark Cave-Ayland VMUL(ub, u8, VsrB, VsrH, uint16_t)
11814fbc89edSMark Cave-Ayland VMUL(uh, u16, VsrH, VsrW, uint32_t)
11824fbc89edSMark Cave-Ayland VMUL(uw, u32, VsrW, VsrD, uint64_t)
11834fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN
11844fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD
1185fcf5ef2aSThomas Huth #undef VMUL
1186fcf5ef2aSThomas Huth 
1187f3e0d864SLijun Pan void helper_vmulhsw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1188f3e0d864SLijun Pan {
1189f3e0d864SLijun Pan     int i;
1190f3e0d864SLijun Pan 
1191f3e0d864SLijun Pan     for (i = 0; i < 4; i++) {
1192f3e0d864SLijun Pan         r->s32[i] = (int32_t)(((int64_t)a->s32[i] * (int64_t)b->s32[i]) >> 32);
1193f3e0d864SLijun Pan     }
1194f3e0d864SLijun Pan }
1195f3e0d864SLijun Pan 
1196f3e0d864SLijun Pan void helper_vmulhuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1197f3e0d864SLijun Pan {
1198f3e0d864SLijun Pan     int i;
1199f3e0d864SLijun Pan 
1200f3e0d864SLijun Pan     for (i = 0; i < 4; i++) {
1201f3e0d864SLijun Pan         r->u32[i] = (uint32_t)(((uint64_t)a->u32[i] *
1202f3e0d864SLijun Pan                                (uint64_t)b->u32[i]) >> 32);
1203f3e0d864SLijun Pan     }
1204f3e0d864SLijun Pan }
1205f3e0d864SLijun Pan 
1206c4b8b49dSLijun Pan void helper_vmulhsd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1207c4b8b49dSLijun Pan {
1208c4b8b49dSLijun Pan     uint64_t discard;
1209c4b8b49dSLijun Pan 
1210c4b8b49dSLijun Pan     muls64(&discard, &r->u64[0], a->s64[0], b->s64[0]);
1211c4b8b49dSLijun Pan     muls64(&discard, &r->u64[1], a->s64[1], b->s64[1]);
1212c4b8b49dSLijun Pan }
1213c4b8b49dSLijun Pan 
1214c4b8b49dSLijun Pan void helper_vmulhud(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1215c4b8b49dSLijun Pan {
1216c4b8b49dSLijun Pan     uint64_t discard;
1217c4b8b49dSLijun Pan 
1218c4b8b49dSLijun Pan     mulu64(&discard, &r->u64[0], a->u64[0], b->u64[0]);
1219c4b8b49dSLijun Pan     mulu64(&discard, &r->u64[1], a->u64[1], b->u64[1]);
1220c4b8b49dSLijun Pan }
1221c4b8b49dSLijun Pan 
1222fcf5ef2aSThomas Huth void helper_vperm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b,
1223fcf5ef2aSThomas Huth                   ppc_avr_t *c)
1224fcf5ef2aSThomas Huth {
1225fcf5ef2aSThomas Huth     ppc_avr_t result;
1226fcf5ef2aSThomas Huth     int i;
1227fcf5ef2aSThomas Huth 
122860594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
122960594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1230fcf5ef2aSThomas Huth         int index = s & 0xf;
1231fcf5ef2aSThomas Huth 
1232fcf5ef2aSThomas Huth         if (s & 0x10) {
123360594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1234fcf5ef2aSThomas Huth         } else {
123560594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1236fcf5ef2aSThomas Huth         }
1237fcf5ef2aSThomas Huth     }
1238fcf5ef2aSThomas Huth     *r = result;
1239fcf5ef2aSThomas Huth }
1240fcf5ef2aSThomas Huth 
1241fcf5ef2aSThomas Huth void helper_vpermr(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b,
1242fcf5ef2aSThomas Huth                   ppc_avr_t *c)
1243fcf5ef2aSThomas Huth {
1244fcf5ef2aSThomas Huth     ppc_avr_t result;
1245fcf5ef2aSThomas Huth     int i;
1246fcf5ef2aSThomas Huth 
124760594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
124860594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1249fcf5ef2aSThomas Huth         int index = 15 - (s & 0xf);
1250fcf5ef2aSThomas Huth 
1251fcf5ef2aSThomas Huth         if (s & 0x10) {
125260594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1253fcf5ef2aSThomas Huth         } else {
125460594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1255fcf5ef2aSThomas Huth         }
1256fcf5ef2aSThomas Huth     }
1257fcf5ef2aSThomas Huth     *r = result;
1258fcf5ef2aSThomas Huth }
1259fcf5ef2aSThomas Huth 
/*
 * Host-endian accessors used by the vbpermd/vbpermq helpers.
 *
 *  VBPERMQ_INDEX(avr, i)       byte i of the vector, counted from the
 *                              most significant end
 *  VBPERMD_INDEX(i)            host u64[] slot of doubleword i
 *  VBPERMQ_DW(index)           host u64[] slot holding bit `index`
 *                              (bit 0x40 selects the doubleword)
 *  EXTRACT_BIT(avr, i, index)  bit `index` of doubleword i, with bit 0
 *                              being the most significant bit
 *
 * The u64 values are in host byte order, so counting a bit from the most
 * significant end is always "63 - index"; only the array slot depends on
 * the host endianness.  All macro arguments are parenthesised so that
 * expressions can be passed safely.
 */
#if defined(HOST_WORDS_BIGENDIAN)
#define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)])
#define VBPERMD_INDEX(i) (i)
#define VBPERMQ_DW(index) (((index) & 0x40) != 0)
#define EXTRACT_BIT(avr, i, index) \
        (extract64((avr)->u64[(i)], 63 - (index), 1))
#else
#define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)])
#define VBPERMD_INDEX(i) (1 - (i))
#define VBPERMQ_DW(index) (((index) & 0x40) == 0)
#define EXTRACT_BIT(avr, i, index) \
        (extract64((avr)->u64[1 - (i)], 63 - (index), 1))
#endif
1272fcf5ef2aSThomas Huth 
1273fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1274fcf5ef2aSThomas Huth {
1275fcf5ef2aSThomas Huth     int i, j;
1276fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
1277fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1278fcf5ef2aSThomas Huth         for (j = 0; j < 8; j++) {
1279fcf5ef2aSThomas Huth             int index = VBPERMQ_INDEX(b, (i * 8) + j);
1280fcf5ef2aSThomas Huth             if (index < 64 && EXTRACT_BIT(a, i, index)) {
1281fcf5ef2aSThomas Huth                 result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j);
1282fcf5ef2aSThomas Huth             }
1283fcf5ef2aSThomas Huth         }
1284fcf5ef2aSThomas Huth     }
1285fcf5ef2aSThomas Huth     *r = result;
1286fcf5ef2aSThomas Huth }
1287fcf5ef2aSThomas Huth 
1288fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1289fcf5ef2aSThomas Huth {
1290fcf5ef2aSThomas Huth     int i;
1291fcf5ef2aSThomas Huth     uint64_t perm = 0;
1292fcf5ef2aSThomas Huth 
1293fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
1294fcf5ef2aSThomas Huth         int index = VBPERMQ_INDEX(b, i);
1295fcf5ef2aSThomas Huth 
1296fcf5ef2aSThomas Huth         if (index < 128) {
1297fcf5ef2aSThomas Huth             uint64_t mask = (1ull << (63 - (index & 0x3F)));
1298fcf5ef2aSThomas Huth             if (a->u64[VBPERMQ_DW(index)] & mask) {
1299fcf5ef2aSThomas Huth                 perm |= (0x8000 >> i);
1300fcf5ef2aSThomas Huth             }
1301fcf5ef2aSThomas Huth         }
1302fcf5ef2aSThomas Huth     }
1303fcf5ef2aSThomas Huth 
13043c385a93SMark Cave-Ayland     r->VsrD(0) = perm;
13053c385a93SMark Cave-Ayland     r->VsrD(1) = 0;
1306fcf5ef2aSThomas Huth }
1307fcf5ef2aSThomas Huth 
1308fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX
1309fcf5ef2aSThomas Huth #undef VBPERMQ_DW
1310fcf5ef2aSThomas Huth 
1311fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp)                   \
1312fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)  \
1313fcf5ef2aSThomas Huth {                                                             \
1314fcf5ef2aSThomas Huth     int i, j;                                                 \
1315fcf5ef2aSThomas Huth     trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])];    \
1316fcf5ef2aSThomas Huth                                                               \
1317fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, srcfld) {                         \
1318fcf5ef2aSThomas Huth         prod[i] = 0;                                          \
1319fcf5ef2aSThomas Huth         for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) {      \
1320fcf5ef2aSThomas Huth             if (a->srcfld[i] & (1ull << j)) {                 \
1321fcf5ef2aSThomas Huth                 prod[i] ^= ((trgtyp)b->srcfld[i] << j);       \
1322fcf5ef2aSThomas Huth             }                                                 \
1323fcf5ef2aSThomas Huth         }                                                     \
1324fcf5ef2aSThomas Huth     }                                                         \
1325fcf5ef2aSThomas Huth                                                               \
1326fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, trgfld) {                         \
1327fcf5ef2aSThomas Huth         r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1];         \
1328fcf5ef2aSThomas Huth     }                                                         \
1329fcf5ef2aSThomas Huth }
1330fcf5ef2aSThomas Huth 
1331fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t)
1332fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t)
1333fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t)
1334fcf5ef2aSThomas Huth 
1335fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1336fcf5ef2aSThomas Huth {
1337fcf5ef2aSThomas Huth 
1338fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1339fcf5ef2aSThomas Huth     int i, j;
1340fcf5ef2aSThomas Huth     __uint128_t prod[2];
1341fcf5ef2aSThomas Huth 
1342fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1343fcf5ef2aSThomas Huth         prod[i] = 0;
1344fcf5ef2aSThomas Huth         for (j = 0; j < 64; j++) {
1345fcf5ef2aSThomas Huth             if (a->u64[i] & (1ull << j)) {
1346fcf5ef2aSThomas Huth                 prod[i] ^= (((__uint128_t)b->u64[i]) << j);
1347fcf5ef2aSThomas Huth             }
1348fcf5ef2aSThomas Huth         }
1349fcf5ef2aSThomas Huth     }
1350fcf5ef2aSThomas Huth 
1351fcf5ef2aSThomas Huth     r->u128 = prod[0] ^ prod[1];
1352fcf5ef2aSThomas Huth 
1353fcf5ef2aSThomas Huth #else
1354fcf5ef2aSThomas Huth     int i, j;
1355fcf5ef2aSThomas Huth     ppc_avr_t prod[2];
1356fcf5ef2aSThomas Huth 
1357fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
13583c385a93SMark Cave-Ayland         prod[i].VsrD(1) = prod[i].VsrD(0) = 0;
1359fcf5ef2aSThomas Huth         for (j = 0; j < 64; j++) {
1360fcf5ef2aSThomas Huth             if (a->u64[i] & (1ull << j)) {
1361fcf5ef2aSThomas Huth                 ppc_avr_t bshift;
1362fcf5ef2aSThomas Huth                 if (j == 0) {
13633c385a93SMark Cave-Ayland                     bshift.VsrD(0) = 0;
13643c385a93SMark Cave-Ayland                     bshift.VsrD(1) = b->u64[i];
1365fcf5ef2aSThomas Huth                 } else {
13663c385a93SMark Cave-Ayland                     bshift.VsrD(0) = b->u64[i] >> (64 - j);
13673c385a93SMark Cave-Ayland                     bshift.VsrD(1) = b->u64[i] << j;
1368fcf5ef2aSThomas Huth                 }
13693c385a93SMark Cave-Ayland                 prod[i].VsrD(1) ^= bshift.VsrD(1);
13703c385a93SMark Cave-Ayland                 prod[i].VsrD(0) ^= bshift.VsrD(0);
1371fcf5ef2aSThomas Huth             }
1372fcf5ef2aSThomas Huth         }
1373fcf5ef2aSThomas Huth     }
1374fcf5ef2aSThomas Huth 
13753c385a93SMark Cave-Ayland     r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1);
13763c385a93SMark Cave-Ayland     r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0);
1377fcf5ef2aSThomas Huth #endif
1378fcf5ef2aSThomas Huth }
1379fcf5ef2aSThomas Huth 
1380fcf5ef2aSThomas Huth 
1381fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1382fcf5ef2aSThomas Huth #define PKBIG 1
1383fcf5ef2aSThomas Huth #else
1384fcf5ef2aSThomas Huth #define PKBIG 0
1385fcf5ef2aSThomas Huth #endif
1386fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1387fcf5ef2aSThomas Huth {
1388fcf5ef2aSThomas Huth     int i, j;
1389fcf5ef2aSThomas Huth     ppc_avr_t result;
1390fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1391fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { a, b };
1392fcf5ef2aSThomas Huth #else
1393fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { b, a };
1394fcf5ef2aSThomas Huth #endif
1395fcf5ef2aSThomas Huth 
1396fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1397fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(j, u32) {
1398fcf5ef2aSThomas Huth             uint32_t e = x[i]->u32[j];
1399fcf5ef2aSThomas Huth 
1400fcf5ef2aSThomas Huth             result.u16[4 * i + j] = (((e >> 9) & 0xfc00) |
1401fcf5ef2aSThomas Huth                                      ((e >> 6) & 0x3e0) |
1402fcf5ef2aSThomas Huth                                      ((e >> 3) & 0x1f));
1403fcf5ef2aSThomas Huth         }
1404fcf5ef2aSThomas Huth     }
1405fcf5ef2aSThomas Huth     *r = result;
1406fcf5ef2aSThomas Huth }
1407fcf5ef2aSThomas Huth 
1408fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat)                               \
1409fcf5ef2aSThomas Huth     void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r,             \
1410fcf5ef2aSThomas Huth                             ppc_avr_t *a, ppc_avr_t *b)                 \
1411fcf5ef2aSThomas Huth     {                                                                   \
1412fcf5ef2aSThomas Huth         int i;                                                          \
1413fcf5ef2aSThomas Huth         int sat = 0;                                                    \
1414fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1415fcf5ef2aSThomas Huth         ppc_avr_t *a0 = PKBIG ? a : b;                                  \
1416fcf5ef2aSThomas Huth         ppc_avr_t *a1 = PKBIG ? b : a;                                  \
1417fcf5ef2aSThomas Huth                                                                         \
1418fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(i, from) {                                 \
1419fcf5ef2aSThomas Huth             result.to[i] = cvt(a0->from[i], &sat);                      \
1420fcf5ef2aSThomas Huth             result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\
1421fcf5ef2aSThomas Huth         }                                                               \
1422fcf5ef2aSThomas Huth         *r = result;                                                    \
1423fcf5ef2aSThomas Huth         if (dosat && sat) {                                             \
14246175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
1425fcf5ef2aSThomas Huth         }                                                               \
1426fcf5ef2aSThomas Huth     }
1427fcf5ef2aSThomas Huth #define I(x, y) (x)
1428fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1)
1429fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1)
1430fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1)
1431fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1)
1432fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1)
1433fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1)
1434fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1)
1435fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1)
1436fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1)
1437fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0)
1438fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0)
1439fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0)
1440fcf5ef2aSThomas Huth #undef I
1441fcf5ef2aSThomas Huth #undef VPK
1442fcf5ef2aSThomas Huth #undef PKBIG
1443fcf5ef2aSThomas Huth 
1444fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1445fcf5ef2aSThomas Huth {
1446fcf5ef2aSThomas Huth     int i;
1447fcf5ef2aSThomas Huth 
144805ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
144905ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status);
1450fcf5ef2aSThomas Huth     }
1451fcf5ef2aSThomas Huth }
1452fcf5ef2aSThomas Huth 
1453fcf5ef2aSThomas Huth #define VRFI(suffix, rounding)                                  \
1454fcf5ef2aSThomas Huth     void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r,    \
1455fcf5ef2aSThomas Huth                              ppc_avr_t *b)                      \
1456fcf5ef2aSThomas Huth     {                                                           \
1457fcf5ef2aSThomas Huth         int i;                                                  \
1458fcf5ef2aSThomas Huth         float_status s = env->vec_status;                       \
1459fcf5ef2aSThomas Huth                                                                 \
1460fcf5ef2aSThomas Huth         set_float_rounding_mode(rounding, &s);                  \
146105ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {              \
146205ee3e8aSMark Cave-Ayland             r->f32[i] = float32_round_to_int (b->f32[i], &s);   \
1463fcf5ef2aSThomas Huth         }                                                       \
1464fcf5ef2aSThomas Huth     }
1465fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even)
1466fcf5ef2aSThomas Huth VRFI(m, float_round_down)
1467fcf5ef2aSThomas Huth VRFI(p, float_round_up)
1468fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero)
1469fcf5ef2aSThomas Huth #undef VRFI
1470fcf5ef2aSThomas Huth 
1471fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1472fcf5ef2aSThomas Huth {
1473fcf5ef2aSThomas Huth     int i;
1474fcf5ef2aSThomas Huth 
147505ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
147605ee3e8aSMark Cave-Ayland         float32 t = float32_sqrt(b->f32[i], &env->vec_status);
1477fcf5ef2aSThomas Huth 
147805ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, t, &env->vec_status);
1479fcf5ef2aSThomas Huth     }
1480fcf5ef2aSThomas Huth }
1481fcf5ef2aSThomas Huth 
1482fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert)                            \
1483fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)          \
1484fcf5ef2aSThomas Huth {                                                                     \
1485fcf5ef2aSThomas Huth     int i;                                                            \
1486fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                    \
1487fcf5ef2aSThomas Huth         uint##size##_t src1 = a->element[i];                          \
1488fcf5ef2aSThomas Huth         uint##size##_t src2 = b->element[i];                          \
1489fcf5ef2aSThomas Huth         uint##size##_t src3 = r->element[i];                          \
1490fcf5ef2aSThomas Huth         uint##size##_t begin, end, shift, mask, rot_val;              \
1491fcf5ef2aSThomas Huth                                                                       \
1492fcf5ef2aSThomas Huth         shift = extract##size(src2, 0, 6);                            \
1493fcf5ef2aSThomas Huth         end   = extract##size(src2, 8, 6);                            \
1494fcf5ef2aSThomas Huth         begin = extract##size(src2, 16, 6);                           \
1495fcf5ef2aSThomas Huth         rot_val = rol##size(src1, shift);                             \
1496fcf5ef2aSThomas Huth         mask = mask_u##size(begin, end);                              \
1497fcf5ef2aSThomas Huth         if (insert) {                                                 \
1498fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask) | (src3 & ~mask);        \
1499fcf5ef2aSThomas Huth         } else {                                                      \
1500fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask);                         \
1501fcf5ef2aSThomas Huth         }                                                             \
1502fcf5ef2aSThomas Huth     }                                                                 \
1503fcf5ef2aSThomas Huth }
1504fcf5ef2aSThomas Huth 
1505fcf5ef2aSThomas Huth VRLMI(vrldmi, 64, u64, 1);
1506fcf5ef2aSThomas Huth VRLMI(vrlwmi, 32, u32, 1);
1507fcf5ef2aSThomas Huth VRLMI(vrldnm, 64, u64, 0);
1508fcf5ef2aSThomas Huth VRLMI(vrlwnm, 32, u32, 0);
1509fcf5ef2aSThomas Huth 
1510fcf5ef2aSThomas Huth void helper_vsel(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b,
1511fcf5ef2aSThomas Huth                  ppc_avr_t *c)
1512fcf5ef2aSThomas Huth {
1513fcf5ef2aSThomas Huth     r->u64[0] = (a->u64[0] & ~c->u64[0]) | (b->u64[0] & c->u64[0]);
1514fcf5ef2aSThomas Huth     r->u64[1] = (a->u64[1] & ~c->u64[1]) | (b->u64[1] & c->u64[1]);
1515fcf5ef2aSThomas Huth }
1516fcf5ef2aSThomas Huth 
1517fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1518fcf5ef2aSThomas Huth {
1519fcf5ef2aSThomas Huth     int i;
1520fcf5ef2aSThomas Huth 
152105ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
152205ee3e8aSMark Cave-Ayland         r->f32[i] = float32_exp2(b->f32[i], &env->vec_status);
1523fcf5ef2aSThomas Huth     }
1524fcf5ef2aSThomas Huth }
1525fcf5ef2aSThomas Huth 
1526fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1527fcf5ef2aSThomas Huth {
1528fcf5ef2aSThomas Huth     int i;
1529fcf5ef2aSThomas Huth 
153005ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
153105ee3e8aSMark Cave-Ayland         r->f32[i] = float32_log2(b->f32[i], &env->vec_status);
1532fcf5ef2aSThomas Huth     }
1533fcf5ef2aSThomas Huth }
1534fcf5ef2aSThomas Huth 
153560caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left)                            \
153660caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b)  \
153760caf221SAvinesh Kumar {                                                               \
1538f297c4c6SMatheus Ferst     int index = (a & 0xf) * 8;                                  \
153960caf221SAvinesh Kumar     if (left) {                                                 \
1540f297c4c6SMatheus Ferst         index = 128 - index - size;                             \
154160caf221SAvinesh Kumar     }                                                           \
154260caf221SAvinesh Kumar     return int128_getlo(int128_rshift(b->s128, index)) &        \
154360caf221SAvinesh Kumar         MAKE_64BIT_MASK(0, size);                               \
154460caf221SAvinesh Kumar }
154560caf221SAvinesh Kumar VEXTU_X_DO(vextublx,  8, 1)
154660caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1)
154760caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1)
154860caf221SAvinesh Kumar VEXTU_X_DO(vextubrx,  8, 0)
154960caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0)
155060caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0)
155160caf221SAvinesh Kumar #undef VEXTU_X_DO
155260caf221SAvinesh Kumar 
1553fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1554fcf5ef2aSThomas Huth {
1555fcf5ef2aSThomas Huth     int i;
1556fcf5ef2aSThomas Huth     unsigned int shift, bytes, size;
1557fcf5ef2aSThomas Huth 
1558fcf5ef2aSThomas Huth     size = ARRAY_SIZE(r->u8);
1559fcf5ef2aSThomas Huth     for (i = 0; i < size; i++) {
156063be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;             /* extract shift value */
156163be02fcSAnton Blanchard         bytes = (a->VsrB(i) << 8) +           /* extract adjacent bytes */
156263be02fcSAnton Blanchard             (((i + 1) < size) ? a->VsrB(i + 1) : 0);
156363be02fcSAnton Blanchard         r->VsrB(i) = (bytes << shift) >> 8;   /* shift and store result */
1564fcf5ef2aSThomas Huth     }
1565fcf5ef2aSThomas Huth }
1566fcf5ef2aSThomas Huth 
1567fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1568fcf5ef2aSThomas Huth {
1569fcf5ef2aSThomas Huth     int i;
1570fcf5ef2aSThomas Huth     unsigned int shift, bytes;
1571fcf5ef2aSThomas Huth 
1572b6cb41b2SDavid Gibson     /*
1573b6cb41b2SDavid Gibson      * Use reverse order, as destination and source register can be
1574b6cb41b2SDavid Gibson      * same. Its being modified in place saving temporary, reverse
1575b6cb41b2SDavid Gibson      * order will guarantee that computed result is not fed back.
1576fcf5ef2aSThomas Huth      */
1577fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
157863be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;               /* extract shift value */
157963be02fcSAnton Blanchard         bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i);
1580fcf5ef2aSThomas Huth                                                 /* extract adjacent bytes */
158163be02fcSAnton Blanchard         r->VsrB(i) = (bytes >> shift) & 0xFF;   /* shift and store result */
1582fcf5ef2aSThomas Huth     }
1583fcf5ef2aSThomas Huth }
1584fcf5ef2aSThomas Huth 
1585fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift)
1586fcf5ef2aSThomas Huth {
1587fcf5ef2aSThomas Huth     int sh = shift & 0xf;
1588fcf5ef2aSThomas Huth     int i;
1589fcf5ef2aSThomas Huth     ppc_avr_t result;
1590fcf5ef2aSThomas Huth 
1591fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
1592fcf5ef2aSThomas Huth         int index = sh + i;
1593fcf5ef2aSThomas Huth         if (index > 0xf) {
159460594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index - 0x10);
1595fcf5ef2aSThomas Huth         } else {
159660594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1597fcf5ef2aSThomas Huth         }
1598fcf5ef2aSThomas Huth     }
1599fcf5ef2aSThomas Huth     *r = result;
1600fcf5ef2aSThomas Huth }
1601fcf5ef2aSThomas Huth 
1602fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1603fcf5ef2aSThomas Huth {
16043c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1605fcf5ef2aSThomas Huth 
1606fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1607fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1608fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1609fcf5ef2aSThomas Huth #else
1610fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1611fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1612fcf5ef2aSThomas Huth #endif
1613fcf5ef2aSThomas Huth }
1614fcf5ef2aSThomas Huth 
1615fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
16162cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[IDX])
16172cc12af3SMatheus Ferst #else
16182cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[15 - (IDX)] - (SIZE) + 1)
16192cc12af3SMatheus Ferst #endif
16202cc12af3SMatheus Ferst 
16212cc12af3SMatheus Ferst #define VINSX(SUFFIX, TYPE) \
16222cc12af3SMatheus Ferst void glue(glue(helper_VINS, SUFFIX), LX)(CPUPPCState *env, ppc_avr_t *t,       \
16232cc12af3SMatheus Ferst                                          uint64_t val, target_ulong index)     \
16242cc12af3SMatheus Ferst {                                                                              \
16252cc12af3SMatheus Ferst     const int maxidx = ARRAY_SIZE(t->u8) - sizeof(TYPE);                       \
16262cc12af3SMatheus Ferst     target_long idx = index;                                                   \
16272cc12af3SMatheus Ferst                                                                                \
16282cc12af3SMatheus Ferst     if (idx < 0 || idx > maxidx) {                                             \
16292cc12af3SMatheus Ferst         idx =  idx < 0 ? sizeof(TYPE) - idx : idx;                             \
16302cc12af3SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR,                                         \
16312cc12af3SMatheus Ferst             "Invalid index for Vector Insert Element after 0x" TARGET_FMT_lx   \
16322cc12af3SMatheus Ferst             ", RA = " TARGET_FMT_ld " > %d\n", env->nip, idx, maxidx);         \
16332cc12af3SMatheus Ferst     } else {                                                                   \
16342cc12af3SMatheus Ferst         TYPE src = val;                                                        \
16352cc12af3SMatheus Ferst         memcpy(ELEM_ADDR(t, idx, sizeof(TYPE)), &src, sizeof(TYPE));           \
16362cc12af3SMatheus Ferst     }                                                                          \
16372cc12af3SMatheus Ferst }
16382cc12af3SMatheus Ferst VINSX(B, uint8_t)
16392cc12af3SMatheus Ferst VINSX(H, uint16_t)
16402cc12af3SMatheus Ferst VINSX(W, uint32_t)
16412cc12af3SMatheus Ferst VINSX(D, uint64_t)
16422cc12af3SMatheus Ferst #undef ELEM_ADDR
16432cc12af3SMatheus Ferst #undef VINSX
1644fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
164528110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
164628110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
164728110b72SMatheus Ferst                    target_ulong index)                                         \
164828110b72SMatheus Ferst {                                                                              \
164928110b72SMatheus Ferst     const target_long idx = index;                                             \
165028110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *a, *b };                                             \
165128110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
165228110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
165328110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2 - SIZE], (void *)tmp + idx, SIZE); \
165428110b72SMatheus Ferst     } else {                                                                   \
165528110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
165628110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
165728110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
165828110b72SMatheus Ferst     }                                                                          \
165928110b72SMatheus Ferst }
166028110b72SMatheus Ferst #else
166128110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
166228110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
166328110b72SMatheus Ferst                    target_ulong index)                                         \
166428110b72SMatheus Ferst {                                                                              \
166528110b72SMatheus Ferst     const target_long idx = index;                                             \
166628110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *b, *a };                                             \
166728110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
166828110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
166928110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2],                                  \
167028110b72SMatheus Ferst                (void *)tmp + sizeof(tmp) - SIZE - idx, SIZE);                  \
167128110b72SMatheus Ferst     } else {                                                                   \
167228110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
167328110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
167428110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
167528110b72SMatheus Ferst     }                                                                          \
167628110b72SMatheus Ferst }
167728110b72SMatheus Ferst #endif
167828110b72SMatheus Ferst VEXTDVLX(VEXTDUBVLX, 1)
167928110b72SMatheus Ferst VEXTDVLX(VEXTDUHVLX, 2)
168028110b72SMatheus Ferst VEXTDVLX(VEXTDUWVLX, 4)
168128110b72SMatheus Ferst VEXTDVLX(VEXTDDVLX, 8)
168228110b72SMatheus Ferst #undef VEXTDVLX
168328110b72SMatheus Ferst #if defined(HOST_WORDS_BIGENDIAN)
1684fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1685fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1686fcf5ef2aSThomas Huth     {                                                                        \
1687fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1688fcf5ef2aSThomas Huth         memmove(&r->u8[8 - es], &b->u8[index], es);                          \
1689fcf5ef2aSThomas Huth         memset(&r->u8[8], 0, 8);                                             \
1690fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8 - es);                                        \
1691fcf5ef2aSThomas Huth     }
1692fcf5ef2aSThomas Huth #else
1693fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1694fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1695fcf5ef2aSThomas Huth     {                                                                        \
1696fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1697fcf5ef2aSThomas Huth         uint32_t s = (16 - index) - es;                                      \
1698fcf5ef2aSThomas Huth         memmove(&r->u8[8], &b->u8[s], es);                                   \
1699fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8);                                             \
1700fcf5ef2aSThomas Huth         memset(&r->u8[8 + es], 0, 8 - es);                                   \
1701fcf5ef2aSThomas Huth     }
1702fcf5ef2aSThomas Huth #endif
1703fcf5ef2aSThomas Huth VEXTRACT(ub, u8)
1704fcf5ef2aSThomas Huth VEXTRACT(uh, u16)
1705fcf5ef2aSThomas Huth VEXTRACT(uw, u32)
1706fcf5ef2aSThomas Huth VEXTRACT(d, u64)
1707fcf5ef2aSThomas Huth #undef VEXTRACT
1708fcf5ef2aSThomas Huth 
17095ba5335dSMark Cave-Ayland void helper_xxextractuw(CPUPPCState *env, ppc_vsr_t *xt,
17105ba5335dSMark Cave-Ayland                         ppc_vsr_t *xb, uint32_t index)
17118ad901e5SNikunj A Dadhania {
171203b32c09SMark Cave-Ayland     ppc_vsr_t t = { };
17138ad901e5SNikunj A Dadhania     size_t es = sizeof(uint32_t);
17148ad901e5SNikunj A Dadhania     uint32_t ext_index;
17158ad901e5SNikunj A Dadhania     int i;
17168ad901e5SNikunj A Dadhania 
17178ad901e5SNikunj A Dadhania     ext_index = index;
17188ad901e5SNikunj A Dadhania     for (i = 0; i < es; i++, ext_index++) {
171903b32c09SMark Cave-Ayland         t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16);
17208ad901e5SNikunj A Dadhania     }
17218ad901e5SNikunj A Dadhania 
172203b32c09SMark Cave-Ayland     *xt = t;
17238ad901e5SNikunj A Dadhania }
17248ad901e5SNikunj A Dadhania 
17255ba5335dSMark Cave-Ayland void helper_xxinsertw(CPUPPCState *env, ppc_vsr_t *xt,
17265ba5335dSMark Cave-Ayland                       ppc_vsr_t *xb, uint32_t index)
17273398b742SNikunj A Dadhania {
172803b32c09SMark Cave-Ayland     ppc_vsr_t t = *xt;
17293398b742SNikunj A Dadhania     size_t es = sizeof(uint32_t);
17303398b742SNikunj A Dadhania     int ins_index, i = 0;
17313398b742SNikunj A Dadhania 
17323398b742SNikunj A Dadhania     ins_index = index;
17333398b742SNikunj A Dadhania     for (i = 0; i < es && ins_index < 16; i++, ins_index++) {
173403b32c09SMark Cave-Ayland         t.VsrB(ins_index) = xb->VsrB(8 - es + i);
17353398b742SNikunj A Dadhania     }
17363398b742SNikunj A Dadhania 
173703b32c09SMark Cave-Ayland     *xt = t;
17383398b742SNikunj A Dadhania }
17393398b742SNikunj A Dadhania 
1740*788c6399SMatheus Ferst #define XXBLEND(name, sz) \
1741*788c6399SMatheus Ferst void glue(helper_XXBLENDV, name)(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b,  \
1742*788c6399SMatheus Ferst                                  ppc_avr_t *c, uint32_t desc)               \
1743*788c6399SMatheus Ferst {                                                                           \
1744*788c6399SMatheus Ferst     for (int i = 0; i < ARRAY_SIZE(t->glue(u, sz)); i++) {                  \
1745*788c6399SMatheus Ferst         t->glue(u, sz)[i] = (c->glue(s, sz)[i] >> (sz - 1)) ?               \
1746*788c6399SMatheus Ferst             b->glue(u, sz)[i] : a->glue(u, sz)[i];                          \
1747*788c6399SMatheus Ferst     }                                                                       \
1748*788c6399SMatheus Ferst }
1749*788c6399SMatheus Ferst XXBLEND(B, 8)
1750*788c6399SMatheus Ferst XXBLEND(H, 16)
1751*788c6399SMatheus Ferst XXBLEND(W, 32)
1752*788c6399SMatheus Ferst XXBLEND(D, 64)
1753*788c6399SMatheus Ferst #undef XXBLEND
1754*788c6399SMatheus Ferst 
1755634c5835SMark Cave-Ayland #define VEXT_SIGNED(name, element, cast)                            \
1756fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b)                      \
1757fcf5ef2aSThomas Huth {                                                                   \
1758fcf5ef2aSThomas Huth     int i;                                                          \
175960594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
1760634c5835SMark Cave-Ayland         r->element[i] = (cast)b->element[i];                        \
1761fcf5ef2aSThomas Huth     }                                                               \
1762fcf5ef2aSThomas Huth }
1763634c5835SMark Cave-Ayland VEXT_SIGNED(vextsb2w, s32, int8_t)
1764634c5835SMark Cave-Ayland VEXT_SIGNED(vextsb2d, s64, int8_t)
1765634c5835SMark Cave-Ayland VEXT_SIGNED(vextsh2w, s32, int16_t)
1766634c5835SMark Cave-Ayland VEXT_SIGNED(vextsh2d, s64, int16_t)
1767634c5835SMark Cave-Ayland VEXT_SIGNED(vextsw2d, s64, int32_t)
1768fcf5ef2aSThomas Huth #undef VEXT_SIGNED
1769fcf5ef2aSThomas Huth 
1770fcf5ef2aSThomas Huth #define VNEG(name, element)                                         \
1771fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b)                      \
1772fcf5ef2aSThomas Huth {                                                                   \
1773fcf5ef2aSThomas Huth     int i;                                                          \
177460594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
1775fcf5ef2aSThomas Huth         r->element[i] = -b->element[i];                             \
1776fcf5ef2aSThomas Huth     }                                                               \
1777fcf5ef2aSThomas Huth }
1778fcf5ef2aSThomas Huth VNEG(vnegw, s32)
1779fcf5ef2aSThomas Huth VNEG(vnegd, s64)
1780fcf5ef2aSThomas Huth #undef VNEG
1781fcf5ef2aSThomas Huth 
1782fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1783fcf5ef2aSThomas Huth {
17843c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1785fcf5ef2aSThomas Huth 
1786fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1787fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1788fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1789fcf5ef2aSThomas Huth #else
1790fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1791fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1792fcf5ef2aSThomas Huth #endif
1793fcf5ef2aSThomas Huth }
1794fcf5ef2aSThomas Huth 
1795fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1796fcf5ef2aSThomas Huth {
1797fcf5ef2aSThomas Huth     int i;
1798fcf5ef2aSThomas Huth 
1799fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
1800fcf5ef2aSThomas Huth         r->u32[i] = a->u32[i] >= b->u32[i];
1801fcf5ef2aSThomas Huth     }
1802fcf5ef2aSThomas Huth }
1803fcf5ef2aSThomas Huth 
1804fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1805fcf5ef2aSThomas Huth {
1806fcf5ef2aSThomas Huth     int64_t t;
1807fcf5ef2aSThomas Huth     int i, upper;
1808fcf5ef2aSThomas Huth     ppc_avr_t result;
1809fcf5ef2aSThomas Huth     int sat = 0;
1810fcf5ef2aSThomas Huth 
1811fcf5ef2aSThomas Huth     upper = ARRAY_SIZE(r->s32) - 1;
181260594feaSMark Cave-Ayland     t = (int64_t)b->VsrSW(upper);
1813fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
181460594feaSMark Cave-Ayland         t += a->VsrSW(i);
181560594feaSMark Cave-Ayland         result.VsrSW(i) = 0;
1816fcf5ef2aSThomas Huth     }
181760594feaSMark Cave-Ayland     result.VsrSW(upper) = cvtsdsw(t, &sat);
1818fcf5ef2aSThomas Huth     *r = result;
1819fcf5ef2aSThomas Huth 
1820fcf5ef2aSThomas Huth     if (sat) {
18216175f5a0SRichard Henderson         set_vscr_sat(env);
1822fcf5ef2aSThomas Huth     }
1823fcf5ef2aSThomas Huth }
1824fcf5ef2aSThomas Huth 
1825fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1826fcf5ef2aSThomas Huth {
1827fcf5ef2aSThomas Huth     int i, j, upper;
1828fcf5ef2aSThomas Huth     ppc_avr_t result;
1829fcf5ef2aSThomas Huth     int sat = 0;
1830fcf5ef2aSThomas Huth 
1831fcf5ef2aSThomas Huth     upper = 1;
1832fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
183360594feaSMark Cave-Ayland         int64_t t = (int64_t)b->VsrSW(upper + i * 2);
1834fcf5ef2aSThomas Huth 
18357fa0ddc1SAnton Blanchard         result.VsrD(i) = 0;
1836fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u64); j++) {
183760594feaSMark Cave-Ayland             t += a->VsrSW(2 * i + j);
1838fcf5ef2aSThomas Huth         }
183960594feaSMark Cave-Ayland         result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat);
1840fcf5ef2aSThomas Huth     }
1841fcf5ef2aSThomas Huth 
1842fcf5ef2aSThomas Huth     *r = result;
1843fcf5ef2aSThomas Huth     if (sat) {
18446175f5a0SRichard Henderson         set_vscr_sat(env);
1845fcf5ef2aSThomas Huth     }
1846fcf5ef2aSThomas Huth }
1847fcf5ef2aSThomas Huth 
1848fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1849fcf5ef2aSThomas Huth {
1850fcf5ef2aSThomas Huth     int i, j;
1851fcf5ef2aSThomas Huth     int sat = 0;
1852fcf5ef2aSThomas Huth 
1853fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1854fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1855fcf5ef2aSThomas Huth 
1856fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->s32); j++) {
1857fcf5ef2aSThomas Huth             t += a->s8[4 * i + j];
1858fcf5ef2aSThomas Huth         }
1859fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1860fcf5ef2aSThomas Huth     }
1861fcf5ef2aSThomas Huth 
1862fcf5ef2aSThomas Huth     if (sat) {
18636175f5a0SRichard Henderson         set_vscr_sat(env);
1864fcf5ef2aSThomas Huth     }
1865fcf5ef2aSThomas Huth }
1866fcf5ef2aSThomas Huth 
1867fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1868fcf5ef2aSThomas Huth {
1869fcf5ef2aSThomas Huth     int sat = 0;
1870fcf5ef2aSThomas Huth     int i;
1871fcf5ef2aSThomas Huth 
1872fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1873fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1874fcf5ef2aSThomas Huth 
1875fcf5ef2aSThomas Huth         t += a->s16[2 * i] + a->s16[2 * i + 1];
1876fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1877fcf5ef2aSThomas Huth     }
1878fcf5ef2aSThomas Huth 
1879fcf5ef2aSThomas Huth     if (sat) {
18806175f5a0SRichard Henderson         set_vscr_sat(env);
1881fcf5ef2aSThomas Huth     }
1882fcf5ef2aSThomas Huth }
1883fcf5ef2aSThomas Huth 
1884fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1885fcf5ef2aSThomas Huth {
1886fcf5ef2aSThomas Huth     int i, j;
1887fcf5ef2aSThomas Huth     int sat = 0;
1888fcf5ef2aSThomas Huth 
1889fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
1890fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)b->u32[i];
1891fcf5ef2aSThomas Huth 
1892fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u32); j++) {
1893fcf5ef2aSThomas Huth             t += a->u8[4 * i + j];
1894fcf5ef2aSThomas Huth         }
1895fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
1896fcf5ef2aSThomas Huth     }
1897fcf5ef2aSThomas Huth 
1898fcf5ef2aSThomas Huth     if (sat) {
18996175f5a0SRichard Henderson         set_vscr_sat(env);
1900fcf5ef2aSThomas Huth     }
1901fcf5ef2aSThomas Huth }
1902fcf5ef2aSThomas Huth 
1903fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN)
1904fcf5ef2aSThomas Huth #define UPKHI 1
1905fcf5ef2aSThomas Huth #define UPKLO 0
1906fcf5ef2aSThomas Huth #else
1907fcf5ef2aSThomas Huth #define UPKHI 0
1908fcf5ef2aSThomas Huth #define UPKLO 1
1909fcf5ef2aSThomas Huth #endif
1910fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi)                                              \
1911fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
1912fcf5ef2aSThomas Huth     {                                                                   \
1913fcf5ef2aSThomas Huth         int i;                                                          \
1914fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1915fcf5ef2aSThomas Huth                                                                         \
1916fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->u32); i++) {                      \
1917fcf5ef2aSThomas Huth             uint16_t e = b->u16[hi ? i : i + 4];                        \
1918fcf5ef2aSThomas Huth             uint8_t a = (e >> 15) ? 0xff : 0;                           \
1919fcf5ef2aSThomas Huth             uint8_t r = (e >> 10) & 0x1f;                               \
1920fcf5ef2aSThomas Huth             uint8_t g = (e >> 5) & 0x1f;                                \
1921fcf5ef2aSThomas Huth             uint8_t b = e & 0x1f;                                       \
1922fcf5ef2aSThomas Huth                                                                         \
1923fcf5ef2aSThomas Huth             result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b;       \
1924fcf5ef2aSThomas Huth         }                                                               \
1925fcf5ef2aSThomas Huth         *r = result;                                                    \
1926fcf5ef2aSThomas Huth     }
1927fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO)
1928fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI)
1929fcf5ef2aSThomas Huth #undef VUPKPX
1930fcf5ef2aSThomas Huth 
1931fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi)                              \
1932fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
1933fcf5ef2aSThomas Huth     {                                                                   \
1934fcf5ef2aSThomas Huth         int i;                                                          \
1935fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1936fcf5ef2aSThomas Huth                                                                         \
1937fcf5ef2aSThomas Huth         if (hi) {                                                       \
1938fcf5ef2aSThomas Huth             for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) {             \
1939fcf5ef2aSThomas Huth                 result.unpacked[i] = b->packee[i];                      \
1940fcf5ef2aSThomas Huth             }                                                           \
1941fcf5ef2aSThomas Huth         } else {                                                        \
1942fcf5ef2aSThomas Huth             for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \
1943fcf5ef2aSThomas Huth                  i++) {                                                 \
1944fcf5ef2aSThomas Huth                 result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \
1945fcf5ef2aSThomas Huth             }                                                           \
1946fcf5ef2aSThomas Huth         }                                                               \
1947fcf5ef2aSThomas Huth         *r = result;                                                    \
1948fcf5ef2aSThomas Huth     }
1949fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI)
1950fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI)
1951fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI)
1952fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO)
1953fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO)
1954fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO)
1955fcf5ef2aSThomas Huth #undef VUPK
1956fcf5ef2aSThomas Huth #undef UPKHI
1957fcf5ef2aSThomas Huth #undef UPKLO
1958fcf5ef2aSThomas Huth 
1959fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element)                                      \
1960fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *b)                     \
1961fcf5ef2aSThomas Huth     {                                                                   \
1962fcf5ef2aSThomas Huth         int i;                                                          \
1963fcf5ef2aSThomas Huth                                                                         \
196460594feaSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
1965fcf5ef2aSThomas Huth             r->element[i] = name(b->element[i]);                        \
1966fcf5ef2aSThomas Huth         }                                                               \
1967fcf5ef2aSThomas Huth     }
1968fcf5ef2aSThomas Huth 
1969fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8)
1970fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16)
1971fcf5ef2aSThomas Huth 
1972fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8)
1973fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16)
1974fcf5ef2aSThomas Huth 
1975fcf5ef2aSThomas Huth #undef clzb
1976fcf5ef2aSThomas Huth #undef clzh
1977fcf5ef2aSThomas Huth 
1978fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8)
1979fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16)
1980fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v))
1981fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v))
1982fcf5ef2aSThomas Huth 
1983fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8)
1984fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16)
1985fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32)
1986fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64)
1987fcf5ef2aSThomas Huth 
1988fcf5ef2aSThomas Huth #undef ctzb
1989fcf5ef2aSThomas Huth #undef ctzh
1990fcf5ef2aSThomas Huth #undef ctzw
1991fcf5ef2aSThomas Huth #undef ctzd
1992fcf5ef2aSThomas Huth 
1993fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v)
1994fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v)
1995fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v)
1996fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v)
1997fcf5ef2aSThomas Huth 
1998fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8)
1999fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16)
2000fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32)
2001fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64)
2002fcf5ef2aSThomas Huth 
2003fcf5ef2aSThomas Huth #undef popcntb
2004fcf5ef2aSThomas Huth #undef popcnth
2005fcf5ef2aSThomas Huth #undef popcntw
2006fcf5ef2aSThomas Huth #undef popcntd
2007fcf5ef2aSThomas Huth 
2008fcf5ef2aSThomas Huth #undef VGENERIC_DO
2009fcf5ef2aSThomas Huth 
/*
 * Initializer for a ppc_avr_t with one u64 element set to 1 and the other to
 * 0; the element that holds the 1 is chosen by host endianness.
 */
#ifdef HOST_WORDS_BIGENDIAN
#define QW_ONE { .u64 = { 0, 1 } }
#else
#define QW_ONE { .u64 = { 1, 0 } }
#endif
2015fcf5ef2aSThomas Huth 
2016fcf5ef2aSThomas Huth #ifndef CONFIG_INT128
2017fcf5ef2aSThomas Huth 
2018fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a)
2019fcf5ef2aSThomas Huth {
2020fcf5ef2aSThomas Huth     t->u64[0] = ~a.u64[0];
2021fcf5ef2aSThomas Huth     t->u64[1] = ~a.u64[1];
2022fcf5ef2aSThomas Huth }
2023fcf5ef2aSThomas Huth 
2024fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b)
2025fcf5ef2aSThomas Huth {
20263c385a93SMark Cave-Ayland     if (a.VsrD(0) < b.VsrD(0)) {
2027fcf5ef2aSThomas Huth         return -1;
20283c385a93SMark Cave-Ayland     } else if (a.VsrD(0) > b.VsrD(0)) {
2029fcf5ef2aSThomas Huth         return 1;
20303c385a93SMark Cave-Ayland     } else if (a.VsrD(1) < b.VsrD(1)) {
2031fcf5ef2aSThomas Huth         return -1;
20323c385a93SMark Cave-Ayland     } else if (a.VsrD(1) > b.VsrD(1)) {
2033fcf5ef2aSThomas Huth         return 1;
2034fcf5ef2aSThomas Huth     } else {
2035fcf5ef2aSThomas Huth         return 0;
2036fcf5ef2aSThomas Huth     }
2037fcf5ef2aSThomas Huth }
2038fcf5ef2aSThomas Huth 
2039fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b)
2040fcf5ef2aSThomas Huth {
20413c385a93SMark Cave-Ayland     t->VsrD(1) = a.VsrD(1) + b.VsrD(1);
20423c385a93SMark Cave-Ayland     t->VsrD(0) = a.VsrD(0) + b.VsrD(0) +
20433c385a93SMark Cave-Ayland                      (~a.VsrD(1) < b.VsrD(1));
2044fcf5ef2aSThomas Huth }
2045fcf5ef2aSThomas Huth 
2046fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b)
2047fcf5ef2aSThomas Huth {
2048fcf5ef2aSThomas Huth     ppc_avr_t not_a;
20493c385a93SMark Cave-Ayland     t->VsrD(1) = a.VsrD(1) + b.VsrD(1);
20503c385a93SMark Cave-Ayland     t->VsrD(0) = a.VsrD(0) + b.VsrD(0) +
20513c385a93SMark Cave-Ayland                      (~a.VsrD(1) < b.VsrD(1));
2052fcf5ef2aSThomas Huth     avr_qw_not(&not_a, a);
2053fcf5ef2aSThomas Huth     return avr_qw_cmpu(not_a, b) < 0;
2054fcf5ef2aSThomas Huth }
2055fcf5ef2aSThomas Huth 
2056fcf5ef2aSThomas Huth #endif
2057fcf5ef2aSThomas Huth 
2058fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2059fcf5ef2aSThomas Huth {
2060fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2061fcf5ef2aSThomas Huth     r->u128 = a->u128 + b->u128;
2062fcf5ef2aSThomas Huth #else
2063fcf5ef2aSThomas Huth     avr_qw_add(r, *a, *b);
2064fcf5ef2aSThomas Huth #endif
2065fcf5ef2aSThomas Huth }
2066fcf5ef2aSThomas Huth 
2067fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2068fcf5ef2aSThomas Huth {
2069fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2070fcf5ef2aSThomas Huth     r->u128 = a->u128 + b->u128 + (c->u128 & 1);
2071fcf5ef2aSThomas Huth #else
2072fcf5ef2aSThomas Huth 
20733c385a93SMark Cave-Ayland     if (c->VsrD(1) & 1) {
2074fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2075fcf5ef2aSThomas Huth 
20763c385a93SMark Cave-Ayland         tmp.VsrD(0) = 0;
20773c385a93SMark Cave-Ayland         tmp.VsrD(1) = c->VsrD(1) & 1;
2078fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
2079fcf5ef2aSThomas Huth         avr_qw_add(r, tmp, *b);
2080fcf5ef2aSThomas Huth     } else {
2081fcf5ef2aSThomas Huth         avr_qw_add(r, *a, *b);
2082fcf5ef2aSThomas Huth     }
2083fcf5ef2aSThomas Huth #endif
2084fcf5ef2aSThomas Huth }
2085fcf5ef2aSThomas Huth 
2086fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2087fcf5ef2aSThomas Huth {
2088fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2089fcf5ef2aSThomas Huth     r->u128 = (~a->u128 < b->u128);
2090fcf5ef2aSThomas Huth #else
2091fcf5ef2aSThomas Huth     ppc_avr_t not_a;
2092fcf5ef2aSThomas Huth 
2093fcf5ef2aSThomas Huth     avr_qw_not(&not_a, *a);
2094fcf5ef2aSThomas Huth 
20953c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
20963c385a93SMark Cave-Ayland     r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0);
2097fcf5ef2aSThomas Huth #endif
2098fcf5ef2aSThomas Huth }
2099fcf5ef2aSThomas Huth 
2100fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2101fcf5ef2aSThomas Huth {
2102fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2103fcf5ef2aSThomas Huth     int carry_out = (~a->u128 < b->u128);
2104fcf5ef2aSThomas Huth     if (!carry_out && (c->u128 & 1)) {
2105fcf5ef2aSThomas Huth         carry_out = ((a->u128 + b->u128 + 1) == 0) &&
2106fcf5ef2aSThomas Huth                     ((a->u128 != 0) || (b->u128 != 0));
2107fcf5ef2aSThomas Huth     }
2108fcf5ef2aSThomas Huth     r->u128 = carry_out;
2109fcf5ef2aSThomas Huth #else
2110fcf5ef2aSThomas Huth 
21113c385a93SMark Cave-Ayland     int carry_in = c->VsrD(1) & 1;
2112fcf5ef2aSThomas Huth     int carry_out = 0;
2113fcf5ef2aSThomas Huth     ppc_avr_t tmp;
2114fcf5ef2aSThomas Huth 
2115fcf5ef2aSThomas Huth     carry_out = avr_qw_addc(&tmp, *a, *b);
2116fcf5ef2aSThomas Huth 
2117fcf5ef2aSThomas Huth     if (!carry_out && carry_in) {
2118fcf5ef2aSThomas Huth         ppc_avr_t one = QW_ONE;
2119fcf5ef2aSThomas Huth         carry_out = avr_qw_addc(&tmp, tmp, one);
2120fcf5ef2aSThomas Huth     }
21213c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
21223c385a93SMark Cave-Ayland     r->VsrD(1) = carry_out;
2123fcf5ef2aSThomas Huth #endif
2124fcf5ef2aSThomas Huth }
2125fcf5ef2aSThomas Huth 
2126fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2127fcf5ef2aSThomas Huth {
2128fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2129fcf5ef2aSThomas Huth     r->u128 = a->u128 - b->u128;
2130fcf5ef2aSThomas Huth #else
2131fcf5ef2aSThomas Huth     ppc_avr_t tmp;
2132fcf5ef2aSThomas Huth     ppc_avr_t one = QW_ONE;
2133fcf5ef2aSThomas Huth 
2134fcf5ef2aSThomas Huth     avr_qw_not(&tmp, *b);
2135fcf5ef2aSThomas Huth     avr_qw_add(&tmp, *a, tmp);
2136fcf5ef2aSThomas Huth     avr_qw_add(r, tmp, one);
2137fcf5ef2aSThomas Huth #endif
2138fcf5ef2aSThomas Huth }
2139fcf5ef2aSThomas Huth 
2140fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2141fcf5ef2aSThomas Huth {
2142fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2143fcf5ef2aSThomas Huth     r->u128 = a->u128 + ~b->u128 + (c->u128 & 1);
2144fcf5ef2aSThomas Huth #else
2145fcf5ef2aSThomas Huth     ppc_avr_t tmp, sum;
2146fcf5ef2aSThomas Huth 
2147fcf5ef2aSThomas Huth     avr_qw_not(&tmp, *b);
2148fcf5ef2aSThomas Huth     avr_qw_add(&sum, *a, tmp);
2149fcf5ef2aSThomas Huth 
21503c385a93SMark Cave-Ayland     tmp.VsrD(0) = 0;
21513c385a93SMark Cave-Ayland     tmp.VsrD(1) = c->VsrD(1) & 1;
2152fcf5ef2aSThomas Huth     avr_qw_add(r, sum, tmp);
2153fcf5ef2aSThomas Huth #endif
2154fcf5ef2aSThomas Huth }
2155fcf5ef2aSThomas Huth 
2156fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2157fcf5ef2aSThomas Huth {
2158fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2159fcf5ef2aSThomas Huth     r->u128 = (~a->u128 < ~b->u128) ||
2160fcf5ef2aSThomas Huth                  (a->u128 + ~b->u128 == (__uint128_t)-1);
2161fcf5ef2aSThomas Huth #else
2162fcf5ef2aSThomas Huth     int carry = (avr_qw_cmpu(*a, *b) > 0);
2163fcf5ef2aSThomas Huth     if (!carry) {
2164fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2165fcf5ef2aSThomas Huth         avr_qw_not(&tmp, *b);
2166fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
21673c385a93SMark Cave-Ayland         carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull));
2168fcf5ef2aSThomas Huth     }
21693c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
21703c385a93SMark Cave-Ayland     r->VsrD(1) = carry;
2171fcf5ef2aSThomas Huth #endif
2172fcf5ef2aSThomas Huth }
2173fcf5ef2aSThomas Huth 
2174fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2175fcf5ef2aSThomas Huth {
2176fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2177fcf5ef2aSThomas Huth     r->u128 =
2178fcf5ef2aSThomas Huth         (~a->u128 < ~b->u128) ||
2179fcf5ef2aSThomas Huth         ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1));
2180fcf5ef2aSThomas Huth #else
21813c385a93SMark Cave-Ayland     int carry_in = c->VsrD(1) & 1;
2182fcf5ef2aSThomas Huth     int carry_out = (avr_qw_cmpu(*a, *b) > 0);
2183fcf5ef2aSThomas Huth     if (!carry_out && carry_in) {
2184fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2185fcf5ef2aSThomas Huth         avr_qw_not(&tmp, *b);
2186fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
21873c385a93SMark Cave-Ayland         carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull));
2188fcf5ef2aSThomas Huth     }
2189fcf5ef2aSThomas Huth 
21903c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
21913c385a93SMark Cave-Ayland     r->VsrD(1) = carry_out;
2192fcf5ef2aSThomas Huth #endif
2193fcf5ef2aSThomas Huth }
2194fcf5ef2aSThomas Huth 
/*
 * Sign codes stored in digit position 0 (the low nibble of VsrB(15)) of
 * a signed packed BCD value.  bcd_get_sgn() accepts 0xA, 0xC, 0xE and
 * 0xF as positive and 0xB and 0xD as negative; bcd_preferred_sgn() only
 * ever produces the "PREF" codes.
 */
#define BCD_PLUS_PREF_1 0xC
#define BCD_PLUS_PREF_2 0xF
#define BCD_PLUS_ALT_1  0xA
#define BCD_NEG_PREF    0xD
#define BCD_NEG_ALT     0xB
#define BCD_PLUS_ALT_2  0xE
/* Sign halfwords of the national format: 0x2B / 0x2D ('+' / '-' in ASCII). */
#define NATIONAL_PLUS   0x2B
#define NATIONAL_NEG    0x2D

/* VsrB() index of the byte holding nibble n: two nibbles per byte, nibble 0 in byte 15. */
#define BCD_DIG_BYTE(n) (15 - ((n) / 2))
2205fcf5ef2aSThomas Huth 
2206fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd)
2207fcf5ef2aSThomas Huth {
2208428115c3SMark Cave-Ayland     switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) {
2209fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_1:
2210fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_2:
2211fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_1:
2212fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_2:
2213fcf5ef2aSThomas Huth     {
2214fcf5ef2aSThomas Huth         return 1;
2215fcf5ef2aSThomas Huth     }
2216fcf5ef2aSThomas Huth 
2217fcf5ef2aSThomas Huth     case BCD_NEG_PREF:
2218fcf5ef2aSThomas Huth     case BCD_NEG_ALT:
2219fcf5ef2aSThomas Huth     {
2220fcf5ef2aSThomas Huth         return -1;
2221fcf5ef2aSThomas Huth     }
2222fcf5ef2aSThomas Huth 
2223fcf5ef2aSThomas Huth     default:
2224fcf5ef2aSThomas Huth     {
2225fcf5ef2aSThomas Huth         return 0;
2226fcf5ef2aSThomas Huth     }
2227fcf5ef2aSThomas Huth     }
2228fcf5ef2aSThomas Huth }
2229fcf5ef2aSThomas Huth 
2230fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps)
2231fcf5ef2aSThomas Huth {
2232fcf5ef2aSThomas Huth     if (sgn >= 0) {
2233fcf5ef2aSThomas Huth         return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2;
2234fcf5ef2aSThomas Huth     } else {
2235fcf5ef2aSThomas Huth         return BCD_NEG_PREF;
2236fcf5ef2aSThomas Huth     }
2237fcf5ef2aSThomas Huth }
2238fcf5ef2aSThomas Huth 
2239fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid)
2240fcf5ef2aSThomas Huth {
2241fcf5ef2aSThomas Huth     uint8_t result;
2242fcf5ef2aSThomas Huth     if (n & 1) {
2243428115c3SMark Cave-Ayland         result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4;
2244fcf5ef2aSThomas Huth     } else {
2245428115c3SMark Cave-Ayland        result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF;
2246fcf5ef2aSThomas Huth     }
2247fcf5ef2aSThomas Huth 
2248fcf5ef2aSThomas Huth     if (unlikely(result > 9)) {
2249fcf5ef2aSThomas Huth         *invalid = true;
2250fcf5ef2aSThomas Huth     }
2251fcf5ef2aSThomas Huth     return result;
2252fcf5ef2aSThomas Huth }
2253fcf5ef2aSThomas Huth 
2254fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n)
2255fcf5ef2aSThomas Huth {
2256fcf5ef2aSThomas Huth     if (n & 1) {
2257428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F;
2258428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4);
2259fcf5ef2aSThomas Huth     } else {
2260428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0;
2261428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= digit;
2262fcf5ef2aSThomas Huth     }
2263fcf5ef2aSThomas Huth }
2264fcf5ef2aSThomas Huth 
2265071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd)
2266071663dfSJose Ricardo Ziviani {
2267071663dfSJose Ricardo Ziviani     int i;
2268071663dfSJose Ricardo Ziviani     int invalid = 0;
2269071663dfSJose Ricardo Ziviani 
2270071663dfSJose Ricardo Ziviani     if (bcd_get_sgn(bcd) == 0) {
2271071663dfSJose Ricardo Ziviani         return false;
2272071663dfSJose Ricardo Ziviani     }
2273071663dfSJose Ricardo Ziviani 
2274071663dfSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2275071663dfSJose Ricardo Ziviani         bcd_get_digit(bcd, i, &invalid);
2276071663dfSJose Ricardo Ziviani         if (unlikely(invalid)) {
2277071663dfSJose Ricardo Ziviani             return false;
2278071663dfSJose Ricardo Ziviani         }
2279071663dfSJose Ricardo Ziviani     }
2280071663dfSJose Ricardo Ziviani     return true;
2281071663dfSJose Ricardo Ziviani }
2282071663dfSJose Ricardo Ziviani 
2283fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd)
2284fcf5ef2aSThomas Huth {
22853c385a93SMark Cave-Ayland     if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) {
2286efa73196SNikunj A Dadhania         return CRF_EQ;
2287fcf5ef2aSThomas Huth     } else {
2288efa73196SNikunj A Dadhania         return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT;
2289fcf5ef2aSThomas Huth     }
2290fcf5ef2aSThomas Huth }
2291fcf5ef2aSThomas Huth 
2292fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n)
2293fcf5ef2aSThomas Huth {
229460594feaSMark Cave-Ayland     return reg->VsrH(7 - n);
2295fcf5ef2aSThomas Huth }
2296fcf5ef2aSThomas Huth 
2297fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n)
2298fcf5ef2aSThomas Huth {
229960594feaSMark Cave-Ayland     reg->VsrH(7 - n) = val;
2300fcf5ef2aSThomas Huth }
2301fcf5ef2aSThomas Huth 
2302fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b)
2303fcf5ef2aSThomas Huth {
2304fcf5ef2aSThomas Huth     int i;
2305fcf5ef2aSThomas Huth     int invalid = 0;
2306fcf5ef2aSThomas Huth     for (i = 31; i > 0; i--) {
2307fcf5ef2aSThomas Huth         uint8_t dig_a = bcd_get_digit(a, i, &invalid);
2308fcf5ef2aSThomas Huth         uint8_t dig_b = bcd_get_digit(b, i, &invalid);
2309fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2310fcf5ef2aSThomas Huth             return 0; /* doesn't matter */
2311fcf5ef2aSThomas Huth         } else if (dig_a > dig_b) {
2312fcf5ef2aSThomas Huth             return 1;
2313fcf5ef2aSThomas Huth         } else if (dig_a < dig_b) {
2314fcf5ef2aSThomas Huth             return -1;
2315fcf5ef2aSThomas Huth         }
2316fcf5ef2aSThomas Huth     }
2317fcf5ef2aSThomas Huth 
2318fcf5ef2aSThomas Huth     return 0;
2319fcf5ef2aSThomas Huth }
2320fcf5ef2aSThomas Huth 
2321936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2322fcf5ef2aSThomas Huth                        int *overflow)
2323fcf5ef2aSThomas Huth {
2324fcf5ef2aSThomas Huth     int carry = 0;
2325fcf5ef2aSThomas Huth     int i;
2326936fda4dSFabiano Rosas     int is_zero = 1;
2327936fda4dSFabiano Rosas 
2328fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2329fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) +
2330fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2331936fda4dSFabiano Rosas         is_zero &= (digit == 0);
2332fcf5ef2aSThomas Huth         if (digit > 9) {
2333fcf5ef2aSThomas Huth             carry = 1;
2334fcf5ef2aSThomas Huth             digit -= 10;
2335fcf5ef2aSThomas Huth         } else {
2336fcf5ef2aSThomas Huth             carry = 0;
2337fcf5ef2aSThomas Huth         }
2338fcf5ef2aSThomas Huth 
2339fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2340fcf5ef2aSThomas Huth     }
2341fcf5ef2aSThomas Huth 
2342fcf5ef2aSThomas Huth     *overflow = carry;
2343936fda4dSFabiano Rosas     return is_zero;
2344fcf5ef2aSThomas Huth }
2345fcf5ef2aSThomas Huth 
2346d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2347fcf5ef2aSThomas Huth                        int *overflow)
2348fcf5ef2aSThomas Huth {
2349fcf5ef2aSThomas Huth     int carry = 0;
2350fcf5ef2aSThomas Huth     int i;
2351d03b174aSYasmin Beatriz 
2352fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2353fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) -
2354fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2355fcf5ef2aSThomas Huth         if (digit & 0x80) {
2356fcf5ef2aSThomas Huth             carry = -1;
2357fcf5ef2aSThomas Huth             digit += 10;
2358fcf5ef2aSThomas Huth         } else {
2359fcf5ef2aSThomas Huth             carry = 0;
2360fcf5ef2aSThomas Huth         }
2361fcf5ef2aSThomas Huth 
2362fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2363fcf5ef2aSThomas Huth     }
2364fcf5ef2aSThomas Huth 
2365fcf5ef2aSThomas Huth     *overflow = carry;
2366fcf5ef2aSThomas Huth }
2367fcf5ef2aSThomas Huth 
2368fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2369fcf5ef2aSThomas Huth {
2370fcf5ef2aSThomas Huth 
2371fcf5ef2aSThomas Huth     int sgna = bcd_get_sgn(a);
2372fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2373fcf5ef2aSThomas Huth     int invalid = (sgna == 0) || (sgnb == 0);
2374fcf5ef2aSThomas Huth     int overflow = 0;
2375936fda4dSFabiano Rosas     int zero = 0;
2376fcf5ef2aSThomas Huth     uint32_t cr = 0;
2377fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
2378fcf5ef2aSThomas Huth 
2379fcf5ef2aSThomas Huth     if (!invalid) {
2380fcf5ef2aSThomas Huth         if (sgna == sgnb) {
2381428115c3SMark Cave-Ayland             result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2382936fda4dSFabiano Rosas             zero = bcd_add_mag(&result, a, b, &invalid, &overflow);
2383936fda4dSFabiano Rosas             cr = (sgna > 0) ? CRF_GT : CRF_LT;
2384fcf5ef2aSThomas Huth         } else {
2385d03b174aSYasmin Beatriz             int magnitude = bcd_cmp_mag(a, b);
2386d03b174aSYasmin Beatriz             if (magnitude > 0) {
2387428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2388d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, a, b, &invalid, &overflow);
2389d03b174aSYasmin Beatriz                 cr = (sgna > 0) ? CRF_GT : CRF_LT;
2390d03b174aSYasmin Beatriz             } else if (magnitude < 0) {
2391428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps);
2392d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, b, a, &invalid, &overflow);
2393efa73196SNikunj A Dadhania                 cr = (sgnb > 0) ? CRF_GT : CRF_LT;
2394d03b174aSYasmin Beatriz             } else {
2395428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps);
2396d03b174aSYasmin Beatriz                 cr = CRF_EQ;
2397d03b174aSYasmin Beatriz             }
2398fcf5ef2aSThomas Huth         }
2399fcf5ef2aSThomas Huth     }
2400fcf5ef2aSThomas Huth 
2401fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
24023c385a93SMark Cave-Ayland         result.VsrD(0) = result.VsrD(1) = -1;
2403efa73196SNikunj A Dadhania         cr = CRF_SO;
2404fcf5ef2aSThomas Huth     } else if (overflow) {
2405efa73196SNikunj A Dadhania         cr |= CRF_SO;
2406936fda4dSFabiano Rosas     } else if (zero) {
2407936fda4dSFabiano Rosas         cr |= CRF_EQ;
2408fcf5ef2aSThomas Huth     }
2409fcf5ef2aSThomas Huth 
2410fcf5ef2aSThomas Huth     *r = result;
2411fcf5ef2aSThomas Huth 
2412fcf5ef2aSThomas Huth     return cr;
2413fcf5ef2aSThomas Huth }
2414fcf5ef2aSThomas Huth 
2415fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2416fcf5ef2aSThomas Huth {
2417fcf5ef2aSThomas Huth     ppc_avr_t bcopy = *b;
2418fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2419fcf5ef2aSThomas Huth     if (sgnb < 0) {
2420fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0);
2421fcf5ef2aSThomas Huth     } else if (sgnb > 0) {
2422fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_NEG_PREF, 0);
2423fcf5ef2aSThomas Huth     }
2424fcf5ef2aSThomas Huth     /* else invalid ... defer to bcdadd code for proper handling */
2425fcf5ef2aSThomas Huth 
2426fcf5ef2aSThomas Huth     return helper_bcdadd(r, a, &bcopy, ps);
2427fcf5ef2aSThomas Huth }
2428fcf5ef2aSThomas Huth 
2429fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2430fcf5ef2aSThomas Huth {
2431fcf5ef2aSThomas Huth     int i;
2432fcf5ef2aSThomas Huth     int cr = 0;
2433fcf5ef2aSThomas Huth     uint16_t national = 0;
2434fcf5ef2aSThomas Huth     uint16_t sgnb = get_national_digit(b, 0);
2435fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2436fcf5ef2aSThomas Huth     int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG);
2437fcf5ef2aSThomas Huth 
2438fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2439fcf5ef2aSThomas Huth         national = get_national_digit(b, i);
2440fcf5ef2aSThomas Huth         if (unlikely(national < 0x30 || national > 0x39)) {
2441fcf5ef2aSThomas Huth             invalid = 1;
2442fcf5ef2aSThomas Huth             break;
2443fcf5ef2aSThomas Huth         }
2444fcf5ef2aSThomas Huth 
2445fcf5ef2aSThomas Huth         bcd_put_digit(&ret, national & 0xf, i);
2446fcf5ef2aSThomas Huth     }
2447fcf5ef2aSThomas Huth 
2448fcf5ef2aSThomas Huth     if (sgnb == NATIONAL_PLUS) {
2449fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0);
2450fcf5ef2aSThomas Huth     } else {
2451fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2452fcf5ef2aSThomas Huth     }
2453fcf5ef2aSThomas Huth 
2454fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2455fcf5ef2aSThomas Huth 
2456fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2457efa73196SNikunj A Dadhania         cr = CRF_SO;
2458fcf5ef2aSThomas Huth     }
2459fcf5ef2aSThomas Huth 
2460fcf5ef2aSThomas Huth     *r = ret;
2461fcf5ef2aSThomas Huth 
2462fcf5ef2aSThomas Huth     return cr;
2463fcf5ef2aSThomas Huth }
2464fcf5ef2aSThomas Huth 
2465fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2466fcf5ef2aSThomas Huth {
2467fcf5ef2aSThomas Huth     int i;
2468fcf5ef2aSThomas Huth     int cr = 0;
2469fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2470fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2471fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2472fcf5ef2aSThomas Huth 
24733c385a93SMark Cave-Ayland     int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0);
2474fcf5ef2aSThomas Huth 
2475fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2476fcf5ef2aSThomas Huth         set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i);
2477fcf5ef2aSThomas Huth 
2478fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2479fcf5ef2aSThomas Huth             break;
2480fcf5ef2aSThomas Huth         }
2481fcf5ef2aSThomas Huth     }
2482fcf5ef2aSThomas Huth     set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0);
2483fcf5ef2aSThomas Huth 
2484fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2485fcf5ef2aSThomas Huth 
2486fcf5ef2aSThomas Huth     if (ox_flag) {
2487efa73196SNikunj A Dadhania         cr |= CRF_SO;
2488fcf5ef2aSThomas Huth     }
2489fcf5ef2aSThomas Huth 
2490fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2491efa73196SNikunj A Dadhania         cr = CRF_SO;
2492fcf5ef2aSThomas Huth     }
2493fcf5ef2aSThomas Huth 
2494fcf5ef2aSThomas Huth     *r = ret;
2495fcf5ef2aSThomas Huth 
2496fcf5ef2aSThomas Huth     return cr;
2497fcf5ef2aSThomas Huth }
2498fcf5ef2aSThomas Huth 
2499fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2500fcf5ef2aSThomas Huth {
2501fcf5ef2aSThomas Huth     int i;
2502fcf5ef2aSThomas Huth     int cr = 0;
2503fcf5ef2aSThomas Huth     int invalid = 0;
2504fcf5ef2aSThomas Huth     int zone_digit = 0;
2505fcf5ef2aSThomas Huth     int zone_lead = ps ? 0xF : 0x3;
2506fcf5ef2aSThomas Huth     int digit = 0;
2507fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2508428115c3SMark Cave-Ayland     int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4;
2509fcf5ef2aSThomas Huth 
2510fcf5ef2aSThomas Huth     if (unlikely((sgnb < 0xA) && ps)) {
2511fcf5ef2aSThomas Huth         invalid = 1;
2512fcf5ef2aSThomas Huth     }
2513fcf5ef2aSThomas Huth 
2514fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2515428115c3SMark Cave-Ayland         zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead;
2516428115c3SMark Cave-Ayland         digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF;
2517fcf5ef2aSThomas Huth         if (unlikely(zone_digit != zone_lead || digit > 0x9)) {
2518fcf5ef2aSThomas Huth             invalid = 1;
2519fcf5ef2aSThomas Huth             break;
2520fcf5ef2aSThomas Huth         }
2521fcf5ef2aSThomas Huth 
2522fcf5ef2aSThomas Huth         bcd_put_digit(&ret, digit, i + 1);
2523fcf5ef2aSThomas Huth     }
2524fcf5ef2aSThomas Huth 
2525fcf5ef2aSThomas Huth     if ((ps && (sgnb == 0xB || sgnb == 0xD)) ||
2526fcf5ef2aSThomas Huth             (!ps && (sgnb & 0x4))) {
2527fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2528fcf5ef2aSThomas Huth     } else {
2529fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0);
2530fcf5ef2aSThomas Huth     }
2531fcf5ef2aSThomas Huth 
2532fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2533fcf5ef2aSThomas Huth 
2534fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2535efa73196SNikunj A Dadhania         cr = CRF_SO;
2536fcf5ef2aSThomas Huth     }
2537fcf5ef2aSThomas Huth 
2538fcf5ef2aSThomas Huth     *r = ret;
2539fcf5ef2aSThomas Huth 
2540fcf5ef2aSThomas Huth     return cr;
2541fcf5ef2aSThomas Huth }
2542fcf5ef2aSThomas Huth 
2543fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2544fcf5ef2aSThomas Huth {
2545fcf5ef2aSThomas Huth     int i;
2546fcf5ef2aSThomas Huth     int cr = 0;
2547fcf5ef2aSThomas Huth     uint8_t digit = 0;
2548fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2549fcf5ef2aSThomas Huth     int zone_lead = (ps) ? 0xF0 : 0x30;
2550fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2551fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2552fcf5ef2aSThomas Huth 
25533c385a93SMark Cave-Ayland     int ox_flag = ((b->VsrD(0) >> 4) != 0);
2554fcf5ef2aSThomas Huth 
2555fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2556fcf5ef2aSThomas Huth         digit = bcd_get_digit(b, i + 1, &invalid);
2557fcf5ef2aSThomas Huth 
2558fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2559fcf5ef2aSThomas Huth             break;
2560fcf5ef2aSThomas Huth         }
2561fcf5ef2aSThomas Huth 
2562428115c3SMark Cave-Ayland         ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit;
2563fcf5ef2aSThomas Huth     }
2564fcf5ef2aSThomas Huth 
2565fcf5ef2aSThomas Huth     if (ps) {
2566fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1);
2567fcf5ef2aSThomas Huth     } else {
2568fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1);
2569fcf5ef2aSThomas Huth     }
2570fcf5ef2aSThomas Huth 
2571fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2572fcf5ef2aSThomas Huth 
2573fcf5ef2aSThomas Huth     if (ox_flag) {
2574efa73196SNikunj A Dadhania         cr |= CRF_SO;
2575fcf5ef2aSThomas Huth     }
2576fcf5ef2aSThomas Huth 
2577fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2578efa73196SNikunj A Dadhania         cr = CRF_SO;
2579fcf5ef2aSThomas Huth     }
2580fcf5ef2aSThomas Huth 
2581fcf5ef2aSThomas Huth     *r = ret;
2582fcf5ef2aSThomas Huth 
2583fcf5ef2aSThomas Huth     return cr;
2584fcf5ef2aSThomas Huth }
2585fcf5ef2aSThomas Huth 
/**
 * Three-way comparison of two unsigned 128-bit integers, each supplied
 * as a (low, high) pair of 64-bit halves.
 *
 * Returns:
 * > 0 if ahi|alo > bhi|blo,
 * 0 if ahi|alo == bhi|blo,
 * < 0 if ahi|alo < bhi|blo
 */
static inline int ucmp128(uint64_t alo, uint64_t ahi,
                          uint64_t blo, uint64_t bhi)
{
    /* The high halves decide unless they are equal. */
    if (ahi != bhi) {
        return (ahi > bhi) ? 1 : -1;
    }
    if (alo != blo) {
        return (alo > blo) ? 1 : -1;
    }
    return 0;
}
2601a3d67f3eSLuis Pires 
2602a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2603a406c058SJose Ricardo Ziviani {
2604a406c058SJose Ricardo Ziviani     int i;
2605a3d67f3eSLuis Pires     int cr;
2606a406c058SJose Ricardo Ziviani     uint64_t lo_value;
2607a406c058SJose Ricardo Ziviani     uint64_t hi_value;
260840f3e79aSLuis Pires     uint64_t rem;
2609a406c058SJose Ricardo Ziviani     ppc_avr_t ret = { .u64 = { 0, 0 } };
2610a406c058SJose Ricardo Ziviani 
26113c385a93SMark Cave-Ayland     if (b->VsrSD(0) < 0) {
26123c385a93SMark Cave-Ayland         lo_value = -b->VsrSD(1);
26133c385a93SMark Cave-Ayland         hi_value = ~b->VsrD(0) + !lo_value;
2614a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, 0xD, 0);
2615a3d67f3eSLuis Pires 
2616a3d67f3eSLuis Pires         cr = CRF_LT;
2617a406c058SJose Ricardo Ziviani     } else {
26183c385a93SMark Cave-Ayland         lo_value = b->VsrD(1);
26193c385a93SMark Cave-Ayland         hi_value = b->VsrD(0);
2620a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0);
2621a3d67f3eSLuis Pires 
2622a3d67f3eSLuis Pires         if (hi_value == 0 && lo_value == 0) {
2623a3d67f3eSLuis Pires             cr = CRF_EQ;
2624a3d67f3eSLuis Pires         } else {
2625a3d67f3eSLuis Pires             cr = CRF_GT;
2626a3d67f3eSLuis Pires         }
2627a406c058SJose Ricardo Ziviani     }
2628a406c058SJose Ricardo Ziviani 
2629a3d67f3eSLuis Pires     /*
2630a3d67f3eSLuis Pires      * Check src limits: abs(src) <= 10^31 - 1
2631a3d67f3eSLuis Pires      *
2632a3d67f3eSLuis Pires      * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff
2633a3d67f3eSLuis Pires      */
2634a3d67f3eSLuis Pires     if (ucmp128(lo_value, hi_value,
2635a3d67f3eSLuis Pires                 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) {
2636a3d67f3eSLuis Pires         cr |= CRF_SO;
2637a3d67f3eSLuis Pires 
2638a3d67f3eSLuis Pires         /*
2639a3d67f3eSLuis Pires          * According to the ISA, if src wouldn't fit in the destination
2640a3d67f3eSLuis Pires          * register, the result is undefined.
2641a3d67f3eSLuis Pires          * In that case, we leave r unchanged.
2642a3d67f3eSLuis Pires          */
2643a3d67f3eSLuis Pires     } else {
264440f3e79aSLuis Pires         rem = divu128(&lo_value, &hi_value, 1000000000000000ULL);
2645a406c058SJose Ricardo Ziviani 
264640f3e79aSLuis Pires         for (i = 1; i < 16; rem /= 10, i++) {
264740f3e79aSLuis Pires             bcd_put_digit(&ret, rem % 10, i);
2648a406c058SJose Ricardo Ziviani         }
2649a406c058SJose Ricardo Ziviani 
2650a406c058SJose Ricardo Ziviani         for (; i < 32; lo_value /= 10, i++) {
2651a406c058SJose Ricardo Ziviani             bcd_put_digit(&ret, lo_value % 10, i);
2652a406c058SJose Ricardo Ziviani         }
2653a406c058SJose Ricardo Ziviani 
2654a406c058SJose Ricardo Ziviani         *r = ret;
2655a3d67f3eSLuis Pires     }
2656a406c058SJose Ricardo Ziviani 
2657a406c058SJose Ricardo Ziviani     return cr;
2658a406c058SJose Ricardo Ziviani }
2659a406c058SJose Ricardo Ziviani 
2660c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2661c85bc7ddSJose Ricardo Ziviani {
2662c85bc7ddSJose Ricardo Ziviani     uint8_t i;
2663c85bc7ddSJose Ricardo Ziviani     int cr;
2664c85bc7ddSJose Ricardo Ziviani     uint64_t carry;
2665c85bc7ddSJose Ricardo Ziviani     uint64_t unused;
2666c85bc7ddSJose Ricardo Ziviani     uint64_t lo_value;
2667c85bc7ddSJose Ricardo Ziviani     uint64_t hi_value = 0;
2668c85bc7ddSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2669c85bc7ddSJose Ricardo Ziviani     int invalid = (sgnb == 0);
2670c85bc7ddSJose Ricardo Ziviani 
2671c85bc7ddSJose Ricardo Ziviani     lo_value = bcd_get_digit(b, 31, &invalid);
2672c85bc7ddSJose Ricardo Ziviani     for (i = 30; i > 0; i--) {
2673c85bc7ddSJose Ricardo Ziviani         mulu64(&lo_value, &carry, lo_value, 10ULL);
2674c85bc7ddSJose Ricardo Ziviani         mulu64(&hi_value, &unused, hi_value, 10ULL);
2675c85bc7ddSJose Ricardo Ziviani         lo_value += bcd_get_digit(b, i, &invalid);
2676c85bc7ddSJose Ricardo Ziviani         hi_value += carry;
2677c85bc7ddSJose Ricardo Ziviani 
2678c85bc7ddSJose Ricardo Ziviani         if (unlikely(invalid)) {
2679c85bc7ddSJose Ricardo Ziviani             break;
2680c85bc7ddSJose Ricardo Ziviani         }
2681c85bc7ddSJose Ricardo Ziviani     }
2682c85bc7ddSJose Ricardo Ziviani 
2683c85bc7ddSJose Ricardo Ziviani     if (sgnb == -1) {
26843c385a93SMark Cave-Ayland         r->VsrSD(1) = -lo_value;
26853c385a93SMark Cave-Ayland         r->VsrSD(0) = ~hi_value + !r->VsrSD(1);
2686c85bc7ddSJose Ricardo Ziviani     } else {
26873c385a93SMark Cave-Ayland         r->VsrSD(1) = lo_value;
26883c385a93SMark Cave-Ayland         r->VsrSD(0) = hi_value;
2689c85bc7ddSJose Ricardo Ziviani     }
2690c85bc7ddSJose Ricardo Ziviani 
2691c85bc7ddSJose Ricardo Ziviani     cr = bcd_cmp_zero(b);
2692c85bc7ddSJose Ricardo Ziviani 
2693c85bc7ddSJose Ricardo Ziviani     if (unlikely(invalid)) {
2694c85bc7ddSJose Ricardo Ziviani         cr = CRF_SO;
2695c85bc7ddSJose Ricardo Ziviani     }
2696c85bc7ddSJose Ricardo Ziviani 
2697c85bc7ddSJose Ricardo Ziviani     return cr;
2698c85bc7ddSJose Ricardo Ziviani }
2699c85bc7ddSJose Ricardo Ziviani 
2700c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2701c3025c3bSJose Ricardo Ziviani {
2702c3025c3bSJose Ricardo Ziviani     int i;
2703c3025c3bSJose Ricardo Ziviani     int invalid = 0;
2704c3025c3bSJose Ricardo Ziviani 
2705c3025c3bSJose Ricardo Ziviani     if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) {
2706c3025c3bSJose Ricardo Ziviani         return CRF_SO;
2707c3025c3bSJose Ricardo Ziviani     }
2708c3025c3bSJose Ricardo Ziviani 
2709c3025c3bSJose Ricardo Ziviani     *r = *a;
2710428115c3SMark Cave-Ayland     bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0);
2711c3025c3bSJose Ricardo Ziviani 
2712c3025c3bSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2713c3025c3bSJose Ricardo Ziviani         bcd_get_digit(a, i, &invalid);
2714c3025c3bSJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2715c3025c3bSJose Ricardo Ziviani         if (unlikely(invalid)) {
2716c3025c3bSJose Ricardo Ziviani             return CRF_SO;
2717c3025c3bSJose Ricardo Ziviani         }
2718c3025c3bSJose Ricardo Ziviani     }
2719c3025c3bSJose Ricardo Ziviani 
2720c3025c3bSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2721c3025c3bSJose Ricardo Ziviani }
2722c3025c3bSJose Ricardo Ziviani 
2723466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2724466a3f9cSJose Ricardo Ziviani {
2725466a3f9cSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2726466a3f9cSJose Ricardo Ziviani 
2727466a3f9cSJose Ricardo Ziviani     *r = *b;
2728466a3f9cSJose Ricardo Ziviani     bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0);
2729466a3f9cSJose Ricardo Ziviani 
2730071663dfSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2731466a3f9cSJose Ricardo Ziviani         return CRF_SO;
2732466a3f9cSJose Ricardo Ziviani     }
2733466a3f9cSJose Ricardo Ziviani 
2734466a3f9cSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2735466a3f9cSJose Ricardo Ziviani }
2736466a3f9cSJose Ricardo Ziviani 
2737e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2738e04797f7SJose Ricardo Ziviani {
2739e04797f7SJose Ricardo Ziviani     int cr;
2740428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2741e04797f7SJose Ricardo Ziviani     bool ox_flag = false;
2742e04797f7SJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2743e04797f7SJose Ricardo Ziviani     ppc_avr_t ret = *b;
27443c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2745e04797f7SJose Ricardo Ziviani 
2746e04797f7SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2747e04797f7SJose Ricardo Ziviani         return CRF_SO;
2748e04797f7SJose Ricardo Ziviani     }
2749e04797f7SJose Ricardo Ziviani 
2750e04797f7SJose Ricardo Ziviani     if (unlikely(i > 31)) {
2751e04797f7SJose Ricardo Ziviani         i = 31;
2752e04797f7SJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2753e04797f7SJose Ricardo Ziviani         i = -31;
2754e04797f7SJose Ricardo Ziviani     }
2755e04797f7SJose Ricardo Ziviani 
2756e04797f7SJose Ricardo Ziviani     if (i > 0) {
27573c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2758e04797f7SJose Ricardo Ziviani     } else {
27593c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2760e04797f7SJose Ricardo Ziviani     }
2761e04797f7SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2762e04797f7SJose Ricardo Ziviani 
2763e04797f7SJose Ricardo Ziviani     *r = ret;
2764e04797f7SJose Ricardo Ziviani 
2765e04797f7SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2766e04797f7SJose Ricardo Ziviani     if (ox_flag) {
2767e04797f7SJose Ricardo Ziviani         cr |= CRF_SO;
2768e04797f7SJose Ricardo Ziviani     }
2769e04797f7SJose Ricardo Ziviani 
2770e04797f7SJose Ricardo Ziviani     return cr;
2771e04797f7SJose Ricardo Ziviani }
2772e04797f7SJose Ricardo Ziviani 
2773a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2774a49a95e9SJose Ricardo Ziviani {
2775a49a95e9SJose Ricardo Ziviani     int cr;
2776a49a95e9SJose Ricardo Ziviani     int i;
2777a49a95e9SJose Ricardo Ziviani     int invalid = 0;
2778a49a95e9SJose Ricardo Ziviani     bool ox_flag = false;
2779a49a95e9SJose Ricardo Ziviani     ppc_avr_t ret = *b;
2780a49a95e9SJose Ricardo Ziviani 
2781a49a95e9SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
2782a49a95e9SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2783a49a95e9SJose Ricardo Ziviani 
2784a49a95e9SJose Ricardo Ziviani         if (unlikely(invalid)) {
2785a49a95e9SJose Ricardo Ziviani             return CRF_SO;
2786a49a95e9SJose Ricardo Ziviani         }
2787a49a95e9SJose Ricardo Ziviani     }
2788a49a95e9SJose Ricardo Ziviani 
2789428115c3SMark Cave-Ayland     i = a->VsrSB(7);
2790a49a95e9SJose Ricardo Ziviani     if (i >= 32) {
2791a49a95e9SJose Ricardo Ziviani         ox_flag = true;
27923c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2793a49a95e9SJose Ricardo Ziviani     } else if (i <= -32) {
27943c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2795a49a95e9SJose Ricardo Ziviani     } else if (i > 0) {
27963c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2797a49a95e9SJose Ricardo Ziviani     } else {
27983c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2799a49a95e9SJose Ricardo Ziviani     }
2800a49a95e9SJose Ricardo Ziviani     *r = ret;
2801a49a95e9SJose Ricardo Ziviani 
2802a49a95e9SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2803a49a95e9SJose Ricardo Ziviani     if (ox_flag) {
2804a49a95e9SJose Ricardo Ziviani         cr |= CRF_SO;
2805a49a95e9SJose Ricardo Ziviani     }
2806a49a95e9SJose Ricardo Ziviani 
2807a49a95e9SJose Ricardo Ziviani     return cr;
2808a49a95e9SJose Ricardo Ziviani }
2809a49a95e9SJose Ricardo Ziviani 
2810a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2811a54238adSJose Ricardo Ziviani {
2812a54238adSJose Ricardo Ziviani     int cr;
2813a54238adSJose Ricardo Ziviani     int unused = 0;
2814a54238adSJose Ricardo Ziviani     int invalid = 0;
2815a54238adSJose Ricardo Ziviani     bool ox_flag = false;
2816a54238adSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2817a54238adSJose Ricardo Ziviani     ppc_avr_t ret = *b;
28183c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2819a54238adSJose Ricardo Ziviani 
2820428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2821428115c3SMark Cave-Ayland     ppc_avr_t bcd_one;
2822428115c3SMark Cave-Ayland 
2823428115c3SMark Cave-Ayland     bcd_one.VsrD(0) = 0;
2824428115c3SMark Cave-Ayland     bcd_one.VsrD(1) = 0x10;
2825a54238adSJose Ricardo Ziviani 
2826a54238adSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2827a54238adSJose Ricardo Ziviani         return CRF_SO;
2828a54238adSJose Ricardo Ziviani     }
2829a54238adSJose Ricardo Ziviani 
2830a54238adSJose Ricardo Ziviani     if (unlikely(i > 31)) {
2831a54238adSJose Ricardo Ziviani         i = 31;
2832a54238adSJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2833a54238adSJose Ricardo Ziviani         i = -31;
2834a54238adSJose Ricardo Ziviani     }
2835a54238adSJose Ricardo Ziviani 
2836a54238adSJose Ricardo Ziviani     if (i > 0) {
28373c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2838a54238adSJose Ricardo Ziviani     } else {
28393c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2840a54238adSJose Ricardo Ziviani 
2841a54238adSJose Ricardo Ziviani         if (bcd_get_digit(&ret, 0, &invalid) >= 5) {
2842a54238adSJose Ricardo Ziviani             bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused);
2843a54238adSJose Ricardo Ziviani         }
2844a54238adSJose Ricardo Ziviani     }
2845a54238adSJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2846a54238adSJose Ricardo Ziviani 
2847a54238adSJose Ricardo Ziviani     cr = bcd_cmp_zero(&ret);
2848a54238adSJose Ricardo Ziviani     if (ox_flag) {
2849a54238adSJose Ricardo Ziviani         cr |= CRF_SO;
2850a54238adSJose Ricardo Ziviani     }
2851a54238adSJose Ricardo Ziviani     *r = ret;
2852a54238adSJose Ricardo Ziviani 
2853a54238adSJose Ricardo Ziviani     return cr;
2854a54238adSJose Ricardo Ziviani }
2855a54238adSJose Ricardo Ziviani 
285631bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
285731bc4d11SJose Ricardo Ziviani {
285831bc4d11SJose Ricardo Ziviani     uint64_t mask;
285931bc4d11SJose Ricardo Ziviani     uint32_t ox_flag = 0;
2860428115c3SMark Cave-Ayland     int i = a->VsrSH(3) + 1;
286131bc4d11SJose Ricardo Ziviani     ppc_avr_t ret = *b;
286231bc4d11SJose Ricardo Ziviani 
286331bc4d11SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
286431bc4d11SJose Ricardo Ziviani         return CRF_SO;
286531bc4d11SJose Ricardo Ziviani     }
286631bc4d11SJose Ricardo Ziviani 
286731bc4d11SJose Ricardo Ziviani     if (i > 16 && i < 32) {
286831bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
28693c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
287031bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
287131bc4d11SJose Ricardo Ziviani         }
287231bc4d11SJose Ricardo Ziviani 
28733c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
287431bc4d11SJose Ricardo Ziviani     } else if (i >= 0 && i <= 16) {
287531bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
28763c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
287731bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
287831bc4d11SJose Ricardo Ziviani         }
287931bc4d11SJose Ricardo Ziviani 
28803c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
28813c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
288231bc4d11SJose Ricardo Ziviani     }
288331bc4d11SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0);
288431bc4d11SJose Ricardo Ziviani     *r = ret;
288531bc4d11SJose Ricardo Ziviani 
288631bc4d11SJose Ricardo Ziviani     return bcd_cmp_zero(&ret) | ox_flag;
288731bc4d11SJose Ricardo Ziviani }
288831bc4d11SJose Ricardo Ziviani 
28895c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
28905c32e2e4SJose Ricardo Ziviani {
28915c32e2e4SJose Ricardo Ziviani     int i;
28925c32e2e4SJose Ricardo Ziviani     uint64_t mask;
28935c32e2e4SJose Ricardo Ziviani     uint32_t ox_flag = 0;
28945c32e2e4SJose Ricardo Ziviani     int invalid = 0;
28955c32e2e4SJose Ricardo Ziviani     ppc_avr_t ret = *b;
28965c32e2e4SJose Ricardo Ziviani 
28975c32e2e4SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
28985c32e2e4SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
28995c32e2e4SJose Ricardo Ziviani 
29005c32e2e4SJose Ricardo Ziviani         if (unlikely(invalid)) {
29015c32e2e4SJose Ricardo Ziviani             return CRF_SO;
29025c32e2e4SJose Ricardo Ziviani         }
29035c32e2e4SJose Ricardo Ziviani     }
29045c32e2e4SJose Ricardo Ziviani 
2905428115c3SMark Cave-Ayland     i = a->VsrSH(3);
29065c32e2e4SJose Ricardo Ziviani     if (i > 16 && i < 33) {
29075c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
29083c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
29095c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
29105c32e2e4SJose Ricardo Ziviani         }
29115c32e2e4SJose Ricardo Ziviani 
29123c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
29135c32e2e4SJose Ricardo Ziviani     } else if (i > 0 && i <= 16) {
29145c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
29153c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
29165c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
29175c32e2e4SJose Ricardo Ziviani         }
29185c32e2e4SJose Ricardo Ziviani 
29193c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
29203c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
29215c32e2e4SJose Ricardo Ziviani     } else if (i == 0) {
29223c385a93SMark Cave-Ayland         if (ret.VsrD(0) || ret.VsrD(1)) {
29235c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
29245c32e2e4SJose Ricardo Ziviani         }
29253c385a93SMark Cave-Ayland         ret.VsrD(0) = ret.VsrD(1) = 0;
29265c32e2e4SJose Ricardo Ziviani     }
29275c32e2e4SJose Ricardo Ziviani 
29285c32e2e4SJose Ricardo Ziviani     *r = ret;
29293c385a93SMark Cave-Ayland     if (r->VsrD(0) == 0 && r->VsrD(1) == 0) {
29305c32e2e4SJose Ricardo Ziviani         return ox_flag | CRF_EQ;
29315c32e2e4SJose Ricardo Ziviani     }
29325c32e2e4SJose Ricardo Ziviani 
29335c32e2e4SJose Ricardo Ziviani     return ox_flag | CRF_GT;
29345c32e2e4SJose Ricardo Ziviani }
29355c32e2e4SJose Ricardo Ziviani 
2936fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a)
2937fcf5ef2aSThomas Huth {
2938fcf5ef2aSThomas Huth     int i;
2939fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
2940fcf5ef2aSThomas Huth         r->u8[i] = AES_sbox[a->u8[i]];
2941fcf5ef2aSThomas Huth     }
2942fcf5ef2aSThomas Huth }
2943fcf5ef2aSThomas Huth 
2944fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2945fcf5ef2aSThomas Huth {
2946fcf5ef2aSThomas Huth     ppc_avr_t result;
2947fcf5ef2aSThomas Huth     int i;
2948fcf5ef2aSThomas Huth 
2949fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
29502dea57dbSMark Cave-Ayland         result.VsrW(i) = b->VsrW(i) ^
29512dea57dbSMark Cave-Ayland             (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^
29522dea57dbSMark Cave-Ayland              AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^
29532dea57dbSMark Cave-Ayland              AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^
29542dea57dbSMark Cave-Ayland              AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]);
2955fcf5ef2aSThomas Huth     }
2956fcf5ef2aSThomas Huth     *r = result;
2957fcf5ef2aSThomas Huth }
2958fcf5ef2aSThomas Huth 
2959fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2960fcf5ef2aSThomas Huth {
2961fcf5ef2aSThomas Huth     ppc_avr_t result;
2962fcf5ef2aSThomas Huth     int i;
2963fcf5ef2aSThomas Huth 
2964fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
29652dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]);
2966fcf5ef2aSThomas Huth     }
2967fcf5ef2aSThomas Huth     *r = result;
2968fcf5ef2aSThomas Huth }
2969fcf5ef2aSThomas Huth 
2970fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2971fcf5ef2aSThomas Huth {
2972fcf5ef2aSThomas Huth     /* This differs from what is written in ISA V2.07.  The RTL is */
2973fcf5ef2aSThomas Huth     /* incorrect and will be fixed in V2.07B.                      */
2974fcf5ef2aSThomas Huth     int i;
2975fcf5ef2aSThomas Huth     ppc_avr_t tmp;
2976fcf5ef2aSThomas Huth 
2977fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
29782dea57dbSMark Cave-Ayland         tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])];
2979fcf5ef2aSThomas Huth     }
2980fcf5ef2aSThomas Huth 
2981fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
29822dea57dbSMark Cave-Ayland         r->VsrW(i) =
29832dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 0)][0] ^
29842dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 1)][1] ^
29852dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 2)][2] ^
29862dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 3)][3];
2987fcf5ef2aSThomas Huth     }
2988fcf5ef2aSThomas Huth }
2989fcf5ef2aSThomas Huth 
2990fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2991fcf5ef2aSThomas Huth {
2992fcf5ef2aSThomas Huth     ppc_avr_t result;
2993fcf5ef2aSThomas Huth     int i;
2994fcf5ef2aSThomas Huth 
2995fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
29962dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]);
2997fcf5ef2aSThomas Huth     }
2998fcf5ef2aSThomas Huth     *r = result;
2999fcf5ef2aSThomas Huth }
3000fcf5ef2aSThomas Huth 
3001fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
3002fcf5ef2aSThomas Huth {
3003fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
3004fcf5ef2aSThomas Huth     int six = st_six & 0xF;
3005fcf5ef2aSThomas Huth     int i;
3006fcf5ef2aSThomas Huth 
3007730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
3008fcf5ef2aSThomas Huth         if (st == 0) {
3009fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
30100ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 7) ^
30110ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 18) ^
3012730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 3);
3013fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
30140ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 17) ^
30150ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 19) ^
3016730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 10);
3017fcf5ef2aSThomas Huth             }
3018fcf5ef2aSThomas Huth         } else { /* st == 1 */
3019fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
30200ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 2) ^
30210ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 13) ^
30220ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 22);
3023fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
30240ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 6) ^
30250ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 11) ^
30260ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 25);
3027fcf5ef2aSThomas Huth             }
3028fcf5ef2aSThomas Huth         }
3029fcf5ef2aSThomas Huth     }
3030fcf5ef2aSThomas Huth }
3031fcf5ef2aSThomas Huth 
3032fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
3033fcf5ef2aSThomas Huth {
3034fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
3035fcf5ef2aSThomas Huth     int six = st_six & 0xF;
3036fcf5ef2aSThomas Huth     int i;
3037fcf5ef2aSThomas Huth 
3038730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
3039fcf5ef2aSThomas Huth         if (st == 0) {
3040fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
30410ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 1) ^
30420ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 8) ^
3043730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 7);
3044fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
30450ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 19) ^
30460ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 61) ^
3047730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 6);
3048fcf5ef2aSThomas Huth             }
3049fcf5ef2aSThomas Huth         } else { /* st == 1 */
3050fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
30510ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 28) ^
30520ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 34) ^
30530ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 39);
3054fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
30550ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 14) ^
30560ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 18) ^
30570ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 41);
3058fcf5ef2aSThomas Huth             }
3059fcf5ef2aSThomas Huth         }
3060fcf5ef2aSThomas Huth     }
3061fcf5ef2aSThomas Huth }
3062fcf5ef2aSThomas Huth 
3063fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
3064fcf5ef2aSThomas Huth {
3065fcf5ef2aSThomas Huth     ppc_avr_t result;
3066fcf5ef2aSThomas Huth     int i;
3067fcf5ef2aSThomas Huth 
306860594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
306960594feaSMark Cave-Ayland         int indexA = c->VsrB(i) >> 4;
307060594feaSMark Cave-Ayland         int indexB = c->VsrB(i) & 0xF;
307160594feaSMark Cave-Ayland 
307260594feaSMark Cave-Ayland         result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB);
3073fcf5ef2aSThomas Huth     }
3074fcf5ef2aSThomas Huth     *r = result;
3075fcf5ef2aSThomas Huth }
3076fcf5ef2aSThomas Huth 
3077fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I
3078fcf5ef2aSThomas Huth 
3079fcf5ef2aSThomas Huth /*****************************************************************************/
3080fcf5ef2aSThomas Huth /* SPE extension helpers */
/*
 * Use a table to make this quicker: hbrev[n] is the 4-bit value n with
 * its bits in reverse order.
 */
static const uint8_t hbrev[16] = {
    0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE,
    0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF,
};

/* Return val with its eight bits in reverse order. */
static inline uint8_t byte_reverse(uint8_t val)
{
    return hbrev[val >> 4] | (hbrev[val & 0xF] << 4);
}

/*
 * Return val with its 32 bits in reverse order.
 *
 * Each reversed byte is widened to uint32_t before being shifted: a
 * uint8_t would otherwise be promoted to int, and shifting a value
 * >= 0x80 left by 24 overflows a 32-bit int (undefined behaviour).
 */
static inline uint32_t word_reverse(uint32_t val)
{
    return (uint32_t)byte_reverse(val >> 24) |
           ((uint32_t)byte_reverse(val >> 16) << 8) |
           ((uint32_t)byte_reverse(val >> 8) << 16) |
           ((uint32_t)byte_reverse(val) << 24);
}
3097fcf5ef2aSThomas Huth 
3098fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */
3099fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2)
3100fcf5ef2aSThomas Huth {
3101fcf5ef2aSThomas Huth     uint32_t a, b, d, mask;
3102fcf5ef2aSThomas Huth 
3103fcf5ef2aSThomas Huth     mask = UINT32_MAX >> (32 - MASKBITS);
3104fcf5ef2aSThomas Huth     a = arg1 & mask;
3105fcf5ef2aSThomas Huth     b = arg2 & mask;
3106fcf5ef2aSThomas Huth     d = word_reverse(1 + word_reverse(a | ~b));
3107fcf5ef2aSThomas Huth     return (arg1 & ~mask) | (d & b);
3108fcf5ef2aSThomas Huth }
3109fcf5ef2aSThomas Huth 
/*
 * Count leading sign bits: returns clz32() of val when bit 31 is clear
 * and clz32() of the complement of val when bit 31 is set.
 */
uint32_t helper_cntlsw32(uint32_t val)
{
    const uint32_t magnitude = (val & 0x80000000) ? ~val : val;

    return clz32(magnitude);
}
3118fcf5ef2aSThomas Huth 
/* Count leading zeros: thin wrapper returning clz32() of val. */
uint32_t helper_cntlzw32(uint32_t val)
{
    const uint32_t leading_zeros = clz32(val);

    return leading_zeros;
}
3123fcf5ef2aSThomas Huth 
3124fcf5ef2aSThomas Huth /* 440 specific */
3125fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high,
3126fcf5ef2aSThomas Huth                           target_ulong low, uint32_t update_Rc)
3127fcf5ef2aSThomas Huth {
3128fcf5ef2aSThomas Huth     target_ulong mask;
3129fcf5ef2aSThomas Huth     int i;
3130fcf5ef2aSThomas Huth 
3131fcf5ef2aSThomas Huth     i = 1;
3132fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
3133fcf5ef2aSThomas Huth         if ((high & mask) == 0) {
3134fcf5ef2aSThomas Huth             if (update_Rc) {
3135fcf5ef2aSThomas Huth                 env->crf[0] = 0x4;
3136fcf5ef2aSThomas Huth             }
3137fcf5ef2aSThomas Huth             goto done;
3138fcf5ef2aSThomas Huth         }
3139fcf5ef2aSThomas Huth         i++;
3140fcf5ef2aSThomas Huth     }
3141fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
3142fcf5ef2aSThomas Huth         if ((low & mask) == 0) {
3143fcf5ef2aSThomas Huth             if (update_Rc) {
3144fcf5ef2aSThomas Huth                 env->crf[0] = 0x8;
3145fcf5ef2aSThomas Huth             }
3146fcf5ef2aSThomas Huth             goto done;
3147fcf5ef2aSThomas Huth         }
3148fcf5ef2aSThomas Huth         i++;
3149fcf5ef2aSThomas Huth     }
3150fcf5ef2aSThomas Huth     i = 8;
3151fcf5ef2aSThomas Huth     if (update_Rc) {
3152fcf5ef2aSThomas Huth         env->crf[0] = 0x2;
3153fcf5ef2aSThomas Huth     }
3154fcf5ef2aSThomas Huth  done:
3155fcf5ef2aSThomas Huth     env->xer = (env->xer & ~0x7F) | i;
3156fcf5ef2aSThomas Huth     if (update_Rc) {
3157fcf5ef2aSThomas Huth         env->crf[0] |= xer_so;
3158fcf5ef2aSThomas Huth     }
3159fcf5ef2aSThomas Huth     return i;
3160fcf5ef2aSThomas Huth }
3161