xref: /openbmc/qemu/target/ppc/int_helper.c (revision 345531533f26df49e74f16dafc88408408173ece)
1fcf5ef2aSThomas Huth /*
2fcf5ef2aSThomas Huth  *  PowerPC integer and vector emulation helpers for QEMU.
3fcf5ef2aSThomas Huth  *
4fcf5ef2aSThomas Huth  *  Copyright (c) 2003-2007 Jocelyn Mayer
5fcf5ef2aSThomas Huth  *
6fcf5ef2aSThomas Huth  * This library is free software; you can redistribute it and/or
7fcf5ef2aSThomas Huth  * modify it under the terms of the GNU Lesser General Public
8fcf5ef2aSThomas Huth  * License as published by the Free Software Foundation; either
96bd039cdSChetan Pant  * version 2.1 of the License, or (at your option) any later version.
10fcf5ef2aSThomas Huth  *
11fcf5ef2aSThomas Huth  * This library is distributed in the hope that it will be useful,
12fcf5ef2aSThomas Huth  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13fcf5ef2aSThomas Huth  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14fcf5ef2aSThomas Huth  * Lesser General Public License for more details.
15fcf5ef2aSThomas Huth  *
16fcf5ef2aSThomas Huth  * You should have received a copy of the GNU Lesser General Public
17fcf5ef2aSThomas Huth  * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18fcf5ef2aSThomas Huth  */
19db725815SMarkus Armbruster 
20fcf5ef2aSThomas Huth #include "qemu/osdep.h"
21fcf5ef2aSThomas Huth #include "cpu.h"
22fcf5ef2aSThomas Huth #include "internal.h"
23fcf5ef2aSThomas Huth #include "qemu/host-utils.h"
24db725815SMarkus Armbruster #include "qemu/main-loop.h"
258a05fd9aSRichard Henderson #include "qemu/log.h"
26fcf5ef2aSThomas Huth #include "exec/helper-proto.h"
27fcf5ef2aSThomas Huth #include "crypto/aes.h"
2824f91e81SAlex Bennée #include "fpu/softfloat.h"
293f74b632SRichard Henderson #include "qapi/error.h"
303f74b632SRichard Henderson #include "qemu/guest-random.h"
311015fcabSMatheus Ferst #include "tcg/tcg-gvec-desc.h"
32fcf5ef2aSThomas Huth 
33fcf5ef2aSThomas Huth #include "helper_regs.h"
34fcf5ef2aSThomas Huth /*****************************************************************************/
35fcf5ef2aSThomas Huth /* Fixed point operations helpers */
36fcf5ef2aSThomas Huth 
37f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov)
38f32899deSNikunj A Dadhania {
39f32899deSNikunj A Dadhania     if (unlikely(ov)) {
40f32899deSNikunj A Dadhania         env->so = env->ov = 1;
41f32899deSNikunj A Dadhania     } else {
42f32899deSNikunj A Dadhania         env->ov = 0;
43f32899deSNikunj A Dadhania     }
44f32899deSNikunj A Dadhania }
45f32899deSNikunj A Dadhania 
46fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb,
47fcf5ef2aSThomas Huth                            uint32_t oe)
48fcf5ef2aSThomas Huth {
49fcf5ef2aSThomas Huth     uint64_t rt = 0;
50fcf5ef2aSThomas Huth     int overflow = 0;
51fcf5ef2aSThomas Huth 
52fcf5ef2aSThomas Huth     uint64_t dividend = (uint64_t)ra << 32;
53fcf5ef2aSThomas Huth     uint64_t divisor = (uint32_t)rb;
54fcf5ef2aSThomas Huth 
55fcf5ef2aSThomas Huth     if (unlikely(divisor == 0)) {
56fcf5ef2aSThomas Huth         overflow = 1;
57fcf5ef2aSThomas Huth     } else {
58fcf5ef2aSThomas Huth         rt = dividend / divisor;
59fcf5ef2aSThomas Huth         overflow = rt > UINT32_MAX;
60fcf5ef2aSThomas Huth     }
61fcf5ef2aSThomas Huth 
62fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
63fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
64fcf5ef2aSThomas Huth     }
65fcf5ef2aSThomas Huth 
66fcf5ef2aSThomas Huth     if (oe) {
67f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
68fcf5ef2aSThomas Huth     }
69fcf5ef2aSThomas Huth 
70fcf5ef2aSThomas Huth     return (target_ulong)rt;
71fcf5ef2aSThomas Huth }
72fcf5ef2aSThomas Huth 
73fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb,
74fcf5ef2aSThomas Huth                           uint32_t oe)
75fcf5ef2aSThomas Huth {
76fcf5ef2aSThomas Huth     int64_t rt = 0;
77fcf5ef2aSThomas Huth     int overflow = 0;
78fcf5ef2aSThomas Huth 
79fcf5ef2aSThomas Huth     int64_t dividend = (int64_t)ra << 32;
80fcf5ef2aSThomas Huth     int64_t divisor = (int64_t)((int32_t)rb);
81fcf5ef2aSThomas Huth 
82fcf5ef2aSThomas Huth     if (unlikely((divisor == 0) ||
83fcf5ef2aSThomas Huth                  ((divisor == -1ull) && (dividend == INT64_MIN)))) {
84fcf5ef2aSThomas Huth         overflow = 1;
85fcf5ef2aSThomas Huth     } else {
86fcf5ef2aSThomas Huth         rt = dividend / divisor;
87fcf5ef2aSThomas Huth         overflow = rt != (int32_t)rt;
88fcf5ef2aSThomas Huth     }
89fcf5ef2aSThomas Huth 
90fcf5ef2aSThomas Huth     if (unlikely(overflow)) {
91fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
92fcf5ef2aSThomas Huth     }
93fcf5ef2aSThomas Huth 
94fcf5ef2aSThomas Huth     if (oe) {
95f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
96fcf5ef2aSThomas Huth     }
97fcf5ef2aSThomas Huth 
98fcf5ef2aSThomas Huth     return (target_ulong)rt;
99fcf5ef2aSThomas Huth }
100fcf5ef2aSThomas Huth 
101fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
102fcf5ef2aSThomas Huth 
103fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe)
104fcf5ef2aSThomas Huth {
105fcf5ef2aSThomas Huth     uint64_t rt = 0;
106fcf5ef2aSThomas Huth     int overflow = 0;
107fcf5ef2aSThomas Huth 
1089276a31cSLuis Pires     if (unlikely(rb == 0 || ra >= rb)) {
1099276a31cSLuis Pires         overflow = 1;
110fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1119276a31cSLuis Pires     } else {
1129276a31cSLuis Pires         divu128(&rt, &ra, rb);
113fcf5ef2aSThomas Huth     }
114fcf5ef2aSThomas Huth 
115fcf5ef2aSThomas Huth     if (oe) {
116f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
117fcf5ef2aSThomas Huth     }
118fcf5ef2aSThomas Huth 
119fcf5ef2aSThomas Huth     return rt;
120fcf5ef2aSThomas Huth }
121fcf5ef2aSThomas Huth 
122fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe)
123fcf5ef2aSThomas Huth {
12440f3e79aSLuis Pires     uint64_t rt = 0;
125fcf5ef2aSThomas Huth     int64_t ra = (int64_t)rau;
126fcf5ef2aSThomas Huth     int64_t rb = (int64_t)rbu;
1279276a31cSLuis Pires     int overflow = 0;
128fcf5ef2aSThomas Huth 
1299276a31cSLuis Pires     if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) {
1309276a31cSLuis Pires         overflow = 1;
131fcf5ef2aSThomas Huth         rt = 0; /* Undefined */
1329276a31cSLuis Pires     } else {
1339276a31cSLuis Pires         divs128(&rt, &ra, rb);
134fcf5ef2aSThomas Huth     }
135fcf5ef2aSThomas Huth 
136fcf5ef2aSThomas Huth     if (oe) {
137f32899deSNikunj A Dadhania         helper_update_ov_legacy(env, overflow);
138fcf5ef2aSThomas Huth     }
139fcf5ef2aSThomas Huth 
140fcf5ef2aSThomas Huth     return rt;
141fcf5ef2aSThomas Huth }
142fcf5ef2aSThomas Huth 
143fcf5ef2aSThomas Huth #endif
144fcf5ef2aSThomas Huth 
145fcf5ef2aSThomas Huth 
146fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
147fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */
148fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff))
149fcf5ef2aSThomas Huth 
150b6cb41b2SDavid Gibson /*
151b6cb41b2SDavid Gibson  * subtract 1 from each byte, and with inverse, check if MSB is set at each
152fcf5ef2aSThomas Huth  * byte.
153fcf5ef2aSThomas Huth  * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80
154fcf5ef2aSThomas Huth  *      (0xFF & 0xFF) & 0x80 = 0x80 (zero found)
155fcf5ef2aSThomas Huth  */
156fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80))
157fcf5ef2aSThomas Huth 
158fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */
159fcf5ef2aSThomas Huth #define hasvalue(x, n)  (haszero((x) ^ pattern(n)))
160fcf5ef2aSThomas Huth 
161fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb)
162fcf5ef2aSThomas Huth {
163efa73196SNikunj A Dadhania     return hasvalue(rb, ra) ? CRF_GT : 0;
164fcf5ef2aSThomas Huth }
165fcf5ef2aSThomas Huth 
166fcf5ef2aSThomas Huth #undef pattern
167fcf5ef2aSThomas Huth #undef haszero
168fcf5ef2aSThomas Huth #undef hasvalue
169fcf5ef2aSThomas Huth 
170b6cb41b2SDavid Gibson /*
1713f74b632SRichard Henderson  * Return a random number.
172fcf5ef2aSThomas Huth  */
1733f74b632SRichard Henderson uint64_t helper_darn32(void)
174fcf5ef2aSThomas Huth {
1753f74b632SRichard Henderson     Error *err = NULL;
1763f74b632SRichard Henderson     uint32_t ret;
1773f74b632SRichard Henderson 
1783f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1793f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1803f74b632SRichard Henderson                       error_get_pretty(err));
1813f74b632SRichard Henderson         error_free(err);
182fcf5ef2aSThomas Huth         return -1;
183fcf5ef2aSThomas Huth     }
184fcf5ef2aSThomas Huth 
1853f74b632SRichard Henderson     return ret;
1863f74b632SRichard Henderson }
1873f74b632SRichard Henderson 
1883f74b632SRichard Henderson uint64_t helper_darn64(void)
189fcf5ef2aSThomas Huth {
1903f74b632SRichard Henderson     Error *err = NULL;
1913f74b632SRichard Henderson     uint64_t ret;
1923f74b632SRichard Henderson 
1933f74b632SRichard Henderson     if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) {
1943f74b632SRichard Henderson         qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s",
1953f74b632SRichard Henderson                       error_get_pretty(err));
1963f74b632SRichard Henderson         error_free(err);
197fcf5ef2aSThomas Huth         return -1;
198fcf5ef2aSThomas Huth     }
199fcf5ef2aSThomas Huth 
2003f74b632SRichard Henderson     return ret;
2013f74b632SRichard Henderson }
202fcf5ef2aSThomas Huth 
/*
 * bpermd: bit permute doubleword.
 *
 * Each of the eight bytes of rs is a bit selector.  For byte n (counted from
 * the least significant byte), a selector below 64 picks the bit of rb
 * given by PPC_BIT(selector); if that bit is set, bit n of the result is
 * set.  Selectors of 64 or more contribute a zero bit.
 */
uint64_t helper_bpermd(uint64_t rs, uint64_t rb)
{
    uint64_t perm = 0;
    int n;

    for (n = 0; n < 8; n++) {
        int sel = (rs >> (n * 8)) & 0xFF;

        if (sel >= 64) {
            continue;
        }
        if (rb & PPC_BIT(sel)) {
            perm |= 1 << n;
        }
    }
    return perm;
}
218fcf5ef2aSThomas Huth 
219fcf5ef2aSThomas Huth #endif
220fcf5ef2aSThomas Huth 
221fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb)
222fcf5ef2aSThomas Huth {
223fcf5ef2aSThomas Huth     target_ulong mask = 0xff;
224fcf5ef2aSThomas Huth     target_ulong ra = 0;
225fcf5ef2aSThomas Huth     int i;
226fcf5ef2aSThomas Huth 
227fcf5ef2aSThomas Huth     for (i = 0; i < sizeof(target_ulong); i++) {
228fcf5ef2aSThomas Huth         if ((rs & mask) == (rb & mask)) {
229fcf5ef2aSThomas Huth             ra |= mask;
230fcf5ef2aSThomas Huth         }
231fcf5ef2aSThomas Huth         mask <<= 8;
232fcf5ef2aSThomas Huth     }
233fcf5ef2aSThomas Huth     return ra;
234fcf5ef2aSThomas Huth }
235fcf5ef2aSThomas Huth 
236fcf5ef2aSThomas Huth /* shift right arithmetic helper */
237fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value,
238fcf5ef2aSThomas Huth                          target_ulong shift)
239fcf5ef2aSThomas Huth {
240fcf5ef2aSThomas Huth     int32_t ret;
241fcf5ef2aSThomas Huth 
242fcf5ef2aSThomas Huth     if (likely(!(shift & 0x20))) {
243fcf5ef2aSThomas Huth         if (likely((uint32_t)shift != 0)) {
244fcf5ef2aSThomas Huth             shift &= 0x1f;
245fcf5ef2aSThomas Huth             ret = (int32_t)value >> shift;
246fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) {
247af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
248fcf5ef2aSThomas Huth             } else {
249af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
250fcf5ef2aSThomas Huth             }
251fcf5ef2aSThomas Huth         } else {
252fcf5ef2aSThomas Huth             ret = (int32_t)value;
253af1c259fSSandipan Das             env->ca32 = env->ca = 0;
254fcf5ef2aSThomas Huth         }
255fcf5ef2aSThomas Huth     } else {
256fcf5ef2aSThomas Huth         ret = (int32_t)value >> 31;
257af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
258fcf5ef2aSThomas Huth     }
259fcf5ef2aSThomas Huth     return (target_long)ret;
260fcf5ef2aSThomas Huth }
261fcf5ef2aSThomas Huth 
262fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
263fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value,
264fcf5ef2aSThomas Huth                          target_ulong shift)
265fcf5ef2aSThomas Huth {
266fcf5ef2aSThomas Huth     int64_t ret;
267fcf5ef2aSThomas Huth 
268fcf5ef2aSThomas Huth     if (likely(!(shift & 0x40))) {
269fcf5ef2aSThomas Huth         if (likely((uint64_t)shift != 0)) {
270fcf5ef2aSThomas Huth             shift &= 0x3f;
271fcf5ef2aSThomas Huth             ret = (int64_t)value >> shift;
272fcf5ef2aSThomas Huth             if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) {
273af1c259fSSandipan Das                 env->ca32 = env->ca = 0;
274fcf5ef2aSThomas Huth             } else {
275af1c259fSSandipan Das                 env->ca32 = env->ca = 1;
276fcf5ef2aSThomas Huth             }
277fcf5ef2aSThomas Huth         } else {
278fcf5ef2aSThomas Huth             ret = (int64_t)value;
279af1c259fSSandipan Das             env->ca32 = env->ca = 0;
280fcf5ef2aSThomas Huth         }
281fcf5ef2aSThomas Huth     } else {
282fcf5ef2aSThomas Huth         ret = (int64_t)value >> 63;
283af1c259fSSandipan Das         env->ca32 = env->ca = (ret != 0);
284fcf5ef2aSThomas Huth     }
285fcf5ef2aSThomas Huth     return ret;
286fcf5ef2aSThomas Huth }
287fcf5ef2aSThomas Huth #endif
288fcf5ef2aSThomas Huth 
289fcf5ef2aSThomas Huth #if defined(TARGET_PPC64)
290fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
291fcf5ef2aSThomas Huth {
29279770002SRichard Henderson     /* Note that we don't fold past bytes */
293fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
294fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
295fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
296fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
297fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
298fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
299fcf5ef2aSThomas Huth     return val;
300fcf5ef2aSThomas Huth }
301fcf5ef2aSThomas Huth 
302fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val)
303fcf5ef2aSThomas Huth {
30479770002SRichard Henderson     /* Note that we don't fold past words.  */
305fcf5ef2aSThomas Huth     val = (val & 0x5555555555555555ULL) + ((val >>  1) &
306fcf5ef2aSThomas Huth                                            0x5555555555555555ULL);
307fcf5ef2aSThomas Huth     val = (val & 0x3333333333333333ULL) + ((val >>  2) &
308fcf5ef2aSThomas Huth                                            0x3333333333333333ULL);
309fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >>  4) &
310fcf5ef2aSThomas Huth                                            0x0f0f0f0f0f0f0f0fULL);
311fcf5ef2aSThomas Huth     val = (val & 0x00ff00ff00ff00ffULL) + ((val >>  8) &
312fcf5ef2aSThomas Huth                                            0x00ff00ff00ff00ffULL);
313fcf5ef2aSThomas Huth     val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) &
314fcf5ef2aSThomas Huth                                            0x0000ffff0000ffffULL);
315fcf5ef2aSThomas Huth     return val;
316fcf5ef2aSThomas Huth }
317fcf5ef2aSThomas Huth #else
318fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val)
319fcf5ef2aSThomas Huth {
32079770002SRichard Henderson     /* Note that we don't fold past bytes */
321fcf5ef2aSThomas Huth     val = (val & 0x55555555) + ((val >>  1) & 0x55555555);
322fcf5ef2aSThomas Huth     val = (val & 0x33333333) + ((val >>  2) & 0x33333333);
323fcf5ef2aSThomas Huth     val = (val & 0x0f0f0f0f) + ((val >>  4) & 0x0f0f0f0f);
324fcf5ef2aSThomas Huth     return val;
325fcf5ef2aSThomas Huth }
326fcf5ef2aSThomas Huth #endif
327fcf5ef2aSThomas Huth 
3286e0bbc40SMatheus Ferst uint64_t helper_CFUGED(uint64_t src, uint64_t mask)
32989ccd7dcSMatheus Ferst {
33089ccd7dcSMatheus Ferst     /*
33189ccd7dcSMatheus Ferst      * Instead of processing the mask bit-by-bit from the most significant to
33289ccd7dcSMatheus Ferst      * the least significant bit, as described in PowerISA, we'll handle it in
33389ccd7dcSMatheus Ferst      * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use
33489ccd7dcSMatheus Ferst      * ctz or cto, we negate the mask at the end of the loop.
33589ccd7dcSMatheus Ferst      */
33689ccd7dcSMatheus Ferst     target_ulong m, left = 0, right = 0;
33789ccd7dcSMatheus Ferst     unsigned int n, i = 64;
33889ccd7dcSMatheus Ferst     bool bit = false; /* tracks if we are processing zeros or ones */
33989ccd7dcSMatheus Ferst 
34089ccd7dcSMatheus Ferst     if (mask == 0 || mask == -1) {
34189ccd7dcSMatheus Ferst         return src;
34289ccd7dcSMatheus Ferst     }
34389ccd7dcSMatheus Ferst 
34489ccd7dcSMatheus Ferst     /* Processes the mask in blocks, from LSB to MSB */
34589ccd7dcSMatheus Ferst     while (i) {
34689ccd7dcSMatheus Ferst         /* Find how many bits we should take */
34789ccd7dcSMatheus Ferst         n = ctz64(mask);
34889ccd7dcSMatheus Ferst         if (n > i) {
34989ccd7dcSMatheus Ferst             n = i;
35089ccd7dcSMatheus Ferst         }
35189ccd7dcSMatheus Ferst 
35289ccd7dcSMatheus Ferst         /*
35389ccd7dcSMatheus Ferst          * Extracts 'n' trailing bits of src and put them on the leading 'n'
35489ccd7dcSMatheus Ferst          * bits of 'right' or 'left', pushing down the previously extracted
35589ccd7dcSMatheus Ferst          * values.
35689ccd7dcSMatheus Ferst          */
35789ccd7dcSMatheus Ferst         m = (1ll << n) - 1;
35889ccd7dcSMatheus Ferst         if (bit) {
35989ccd7dcSMatheus Ferst             right = ror64(right | (src & m), n);
36089ccd7dcSMatheus Ferst         } else {
36189ccd7dcSMatheus Ferst             left = ror64(left | (src & m), n);
36289ccd7dcSMatheus Ferst         }
36389ccd7dcSMatheus Ferst 
36489ccd7dcSMatheus Ferst         /*
36589ccd7dcSMatheus Ferst          * Discards the processed bits from 'src' and 'mask'. Note that we are
36689ccd7dcSMatheus Ferst          * removing 'n' trailing zeros from 'mask', but the logical shift will
36789ccd7dcSMatheus Ferst          * add 'n' leading zeros back, so the population count of 'mask' is kept
36889ccd7dcSMatheus Ferst          * the same.
36989ccd7dcSMatheus Ferst          */
37089ccd7dcSMatheus Ferst         src >>= n;
37189ccd7dcSMatheus Ferst         mask >>= n;
37289ccd7dcSMatheus Ferst         i -= n;
37389ccd7dcSMatheus Ferst         bit = !bit;
37489ccd7dcSMatheus Ferst         mask = ~mask;
37589ccd7dcSMatheus Ferst     }
37689ccd7dcSMatheus Ferst 
37789ccd7dcSMatheus Ferst     /*
37889ccd7dcSMatheus Ferst      * At the end, right was ror'ed ctpop(mask) times. To put it back in place,
37989ccd7dcSMatheus Ferst      * we'll shift it more 64-ctpop(mask) times.
38089ccd7dcSMatheus Ferst      */
38189ccd7dcSMatheus Ferst     if (bit) {
38289ccd7dcSMatheus Ferst         n = ctpop64(mask);
38389ccd7dcSMatheus Ferst     } else {
38489ccd7dcSMatheus Ferst         n = 64 - ctpop64(mask);
38589ccd7dcSMatheus Ferst     }
38689ccd7dcSMatheus Ferst 
38789ccd7dcSMatheus Ferst     return left | (right >> n);
38889ccd7dcSMatheus Ferst }
38989ccd7dcSMatheus Ferst 
39021ba6e58SMatheus Ferst uint64_t helper_PDEPD(uint64_t src, uint64_t mask)
39121ba6e58SMatheus Ferst {
39221ba6e58SMatheus Ferst     int i, o;
39321ba6e58SMatheus Ferst     uint64_t result = 0;
39421ba6e58SMatheus Ferst 
39521ba6e58SMatheus Ferst     if (mask == -1) {
39621ba6e58SMatheus Ferst         return src;
39721ba6e58SMatheus Ferst     }
39821ba6e58SMatheus Ferst 
39921ba6e58SMatheus Ferst     for (i = 0; mask != 0; i++) {
40021ba6e58SMatheus Ferst         o = ctz64(mask);
40121ba6e58SMatheus Ferst         mask &= mask - 1;
40221ba6e58SMatheus Ferst         result |= ((src >> i) & 1) << o;
40321ba6e58SMatheus Ferst     }
40421ba6e58SMatheus Ferst 
40521ba6e58SMatheus Ferst     return result;
40621ba6e58SMatheus Ferst }
4078bdb7606SMatheus Ferst 
4088bdb7606SMatheus Ferst uint64_t helper_PEXTD(uint64_t src, uint64_t mask)
4098bdb7606SMatheus Ferst {
4108bdb7606SMatheus Ferst     int i, o;
4118bdb7606SMatheus Ferst     uint64_t result = 0;
4128bdb7606SMatheus Ferst 
4138bdb7606SMatheus Ferst     if (mask == -1) {
4148bdb7606SMatheus Ferst         return src;
4158bdb7606SMatheus Ferst     }
4168bdb7606SMatheus Ferst 
4178bdb7606SMatheus Ferst     for (o = 0; mask != 0; o++) {
4188bdb7606SMatheus Ferst         i = ctz64(mask);
4198bdb7606SMatheus Ferst         mask &= mask - 1;
4208bdb7606SMatheus Ferst         result |= ((src >> i) & 1) << o;
4218bdb7606SMatheus Ferst     }
4228bdb7606SMatheus Ferst 
4238bdb7606SMatheus Ferst     return result;
4248bdb7606SMatheus Ferst }
42521ba6e58SMatheus Ferst 
426fcf5ef2aSThomas Huth /*****************************************************************************/
427fcf5ef2aSThomas Huth /* Altivec extension helpers */
428e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
429fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element)                    \
430fcf5ef2aSThomas Huth     for (index = 0; index < ARRAY_SIZE(r->element); index++)
431fcf5ef2aSThomas Huth #else
432fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element)                    \
433fcf5ef2aSThomas Huth     for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--)
434fcf5ef2aSThomas Huth #endif
435fcf5ef2aSThomas Huth 
/*
 * Saturating conversion helpers.
 *
 * Each instantiation defines cvt<from><to>(x, sat), which narrows x to
 * to_type.  A value outside the target range is clamped to the nearest
 * bound and *sat is set to 1; *sat is never cleared here, so callers can
 * accumulate saturation over several conversions.
 */

/* Source type is signed: clamp against both bounds. */
#define SATCVT(from, to, from_type, to_type, min, max)          \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x < (from_type)min) {                               \
            *sat = 1;                                           \
            return min;                                         \
        }                                                       \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }

/* Source type is unsigned: only the upper bound can be exceeded. */
#define SATCVTU(from, to, from_type, to_type, min, max)         \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }

/* signed -> signed */
SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX)
SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX)
SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX)

/* unsigned -> unsigned */
SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX)
SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX)
SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX)

/* signed -> unsigned */
SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX)
SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX)
SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX)
#undef SATCVT
#undef SATCVTU
478fcf5ef2aSThomas Huth 
479dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr)
480fcf5ef2aSThomas Huth {
481c19940dbSBruno Larsen (billionai)     ppc_store_vscr(env, vscr);
482fcf5ef2aSThomas Huth }
483fcf5ef2aSThomas Huth 
484cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env)
485cc2b90d7SRichard Henderson {
486c19940dbSBruno Larsen (billionai)     return ppc_get_vscr(env);
487cc2b90d7SRichard Henderson }
488cc2b90d7SRichard Henderson 
4896175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env)
4906175f5a0SRichard Henderson {
4919b5b74daSRichard Henderson     /* The choice of non-zero value is arbitrary.  */
4929b5b74daSRichard Henderson     env->vscr_sat.u32[0] = 1;
4936175f5a0SRichard Henderson }
4946175f5a0SRichard Henderson 
495fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
496fcf5ef2aSThomas Huth {
497fcf5ef2aSThomas Huth     int i;
498fcf5ef2aSThomas Huth 
499fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
500fcf5ef2aSThomas Huth         r->u32[i] = ~a->u32[i] < b->u32[i];
501fcf5ef2aSThomas Huth     }
502fcf5ef2aSThomas Huth }
503fcf5ef2aSThomas Huth 
504fcf5ef2aSThomas Huth /* vprtybw */
505fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b)
506fcf5ef2aSThomas Huth {
507fcf5ef2aSThomas Huth     int i;
508fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
509fcf5ef2aSThomas Huth         uint64_t res = b->u32[i] ^ (b->u32[i] >> 16);
510fcf5ef2aSThomas Huth         res ^= res >> 8;
511fcf5ef2aSThomas Huth         r->u32[i] = res & 1;
512fcf5ef2aSThomas Huth     }
513fcf5ef2aSThomas Huth }
514fcf5ef2aSThomas Huth 
515fcf5ef2aSThomas Huth /* vprtybd */
516fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b)
517fcf5ef2aSThomas Huth {
518fcf5ef2aSThomas Huth     int i;
519fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
520fcf5ef2aSThomas Huth         uint64_t res = b->u64[i] ^ (b->u64[i] >> 32);
521fcf5ef2aSThomas Huth         res ^= res >> 16;
522fcf5ef2aSThomas Huth         res ^= res >> 8;
523fcf5ef2aSThomas Huth         r->u64[i] = res & 1;
524fcf5ef2aSThomas Huth     }
525fcf5ef2aSThomas Huth }
526fcf5ef2aSThomas Huth 
527fcf5ef2aSThomas Huth /* vprtybq */
528fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b)
529fcf5ef2aSThomas Huth {
530fcf5ef2aSThomas Huth     uint64_t res = b->u64[0] ^ b->u64[1];
531fcf5ef2aSThomas Huth     res ^= res >> 32;
532fcf5ef2aSThomas Huth     res ^= res >> 16;
533fcf5ef2aSThomas Huth     res ^= res >> 8;
5343c385a93SMark Cave-Ayland     r->VsrD(1) = res & 1;
5353c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
536fcf5ef2aSThomas Huth }
537fcf5ef2aSThomas Huth 
538fcf5ef2aSThomas Huth #define VARITHFP(suffix, func)                                          \
539fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
540fcf5ef2aSThomas Huth                           ppc_avr_t *b)                                 \
541fcf5ef2aSThomas Huth     {                                                                   \
542fcf5ef2aSThomas Huth         int i;                                                          \
543fcf5ef2aSThomas Huth                                                                         \
54405ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
54505ee3e8aSMark Cave-Ayland             r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status);   \
546fcf5ef2aSThomas Huth         }                                                               \
547fcf5ef2aSThomas Huth     }
548fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add)
549fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub)
550fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min)
551fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max)
552fcf5ef2aSThomas Huth #undef VARITHFP
553fcf5ef2aSThomas Huth 
554fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type)                                       \
555fcf5ef2aSThomas Huth     void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \
556fcf5ef2aSThomas Huth                            ppc_avr_t *b, ppc_avr_t *c)                  \
557fcf5ef2aSThomas Huth     {                                                                   \
558fcf5ef2aSThomas Huth         int i;                                                          \
55905ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
56005ee3e8aSMark Cave-Ayland             r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \
561fcf5ef2aSThomas Huth                                        type, &env->vec_status);         \
562fcf5ef2aSThomas Huth         }                                                               \
563fcf5ef2aSThomas Huth     }
564fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0);
565fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c);
566fcf5ef2aSThomas Huth #undef VARITHFPFMA
567fcf5ef2aSThomas Huth 
568fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element)                          \
569fcf5ef2aSThomas Huth     {                                                                   \
570fcf5ef2aSThomas Huth         type result = (type)a->element[i] op (type)b->element[i];       \
571fcf5ef2aSThomas Huth         r->element[i] = cvt(result, &sat);                              \
572fcf5ef2aSThomas Huth     }
573fcf5ef2aSThomas Huth 
574fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element)                    \
575fb11ae7dSRichard Henderson     void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat,              \
576fb11ae7dSRichard Henderson                         ppc_avr_t *a, ppc_avr_t *b, uint32_t desc)      \
577fcf5ef2aSThomas Huth     {                                                                   \
578fcf5ef2aSThomas Huth         int sat = 0;                                                    \
579fcf5ef2aSThomas Huth         int i;                                                          \
580fcf5ef2aSThomas Huth                                                                         \
581fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
582fcf5ef2aSThomas Huth             VARITHSAT_CASE(optype, op, cvt, element);                   \
583fcf5ef2aSThomas Huth         }                                                               \
584fcf5ef2aSThomas Huth         if (sat) {                                                      \
585fb11ae7dSRichard Henderson             vscr_sat->u32[0] = 1;                                       \
586fcf5ef2aSThomas Huth         }                                                               \
587fcf5ef2aSThomas Huth     }
588fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt)          \
589fcf5ef2aSThomas Huth     VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element)      \
590fcf5ef2aSThomas Huth     VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element)
591fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt)        \
592fcf5ef2aSThomas Huth     VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element)      \
593fcf5ef2aSThomas Huth     VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element)
594fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb)
595fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh)
596fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw)
597fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub)
598fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh)
599fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw)
600fcf5ef2aSThomas Huth #undef VARITHSAT_CASE
601fcf5ef2aSThomas Huth #undef VARITHSAT_DO
602fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED
603fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED
604fcf5ef2aSThomas Huth 
605fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype)                                   \
606fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
607fcf5ef2aSThomas Huth     {                                                                   \
608fcf5ef2aSThomas Huth         int i;                                                          \
609fcf5ef2aSThomas Huth                                                                         \
610fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
611fcf5ef2aSThomas Huth             etype x = (etype)a->element[i] + (etype)b->element[i] + 1;  \
612fcf5ef2aSThomas Huth             r->element[i] = x >> 1;                                     \
613fcf5ef2aSThomas Huth         }                                                               \
614fcf5ef2aSThomas Huth     }
615fcf5ef2aSThomas Huth 
616fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element,       \
617fcf5ef2aSThomas Huth              unsigned_type)                                             \
618fcf5ef2aSThomas Huth     VAVG_DO(avgs##type, signed_element, signed_type)                    \
619fcf5ef2aSThomas Huth     VAVG_DO(avgu##type, unsigned_element, unsigned_type)
620fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t)
621fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t)
622fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t)
623fcf5ef2aSThomas Huth #undef VAVG_DO
624fcf5ef2aSThomas Huth #undef VAVG
625fcf5ef2aSThomas Huth 
626fcf5ef2aSThomas Huth #define VABSDU_DO(name, element)                                        \
627fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)           \
628fcf5ef2aSThomas Huth {                                                                       \
629fcf5ef2aSThomas Huth     int i;                                                              \
630fcf5ef2aSThomas Huth                                                                         \
631fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                      \
632fcf5ef2aSThomas Huth         r->element[i] = (a->element[i] > b->element[i]) ?               \
633fcf5ef2aSThomas Huth             (a->element[i] - b->element[i]) :                           \
634fcf5ef2aSThomas Huth             (b->element[i] - a->element[i]);                            \
635fcf5ef2aSThomas Huth     }                                                                   \
636fcf5ef2aSThomas Huth }
637fcf5ef2aSThomas Huth 
638b6cb41b2SDavid Gibson /*
639b6cb41b2SDavid Gibson  * VABSDU - Vector absolute difference unsigned
640fcf5ef2aSThomas Huth  *   name    - instruction mnemonic suffix (b: byte, h: halfword, w: word)
641fcf5ef2aSThomas Huth  *   element - element type to access from vector
642fcf5ef2aSThomas Huth  */
643fcf5ef2aSThomas Huth #define VABSDU(type, element)                   \
644fcf5ef2aSThomas Huth     VABSDU_DO(absdu##type, element)
645fcf5ef2aSThomas Huth VABSDU(b, u8)
646fcf5ef2aSThomas Huth VABSDU(h, u16)
647fcf5ef2aSThomas Huth VABSDU(w, u32)
648fcf5ef2aSThomas Huth #undef VABSDU_DO
649fcf5ef2aSThomas Huth #undef VABSDU
650fcf5ef2aSThomas Huth 
651fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element)                                       \
652fcf5ef2aSThomas Huth     void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r,             \
653fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
654fcf5ef2aSThomas Huth     {                                                                   \
655fcf5ef2aSThomas Huth         int i;                                                          \
656fcf5ef2aSThomas Huth                                                                         \
65705ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
658fcf5ef2aSThomas Huth             float32 t = cvt(b->element[i], &env->vec_status);           \
65905ee3e8aSMark Cave-Ayland             r->f32[i] = float32_scalbn(t, -uim, &env->vec_status);      \
660fcf5ef2aSThomas Huth         }                                                               \
661fcf5ef2aSThomas Huth     }
662fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32)
663fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32)
664fcf5ef2aSThomas Huth #undef VCF
665fcf5ef2aSThomas Huth 
666eb936dc0SMatheus Ferst #define VCMPNEZ(NAME, ELEM) \
667eb936dc0SMatheus Ferst void helper_##NAME(ppc_vsr_t *t, ppc_vsr_t *a, ppc_vsr_t *b, uint32_t desc) \
668fcf5ef2aSThomas Huth {                                                                           \
669eb936dc0SMatheus Ferst     for (int i = 0; i < ARRAY_SIZE(t->ELEM); i++) {                         \
670eb936dc0SMatheus Ferst         t->ELEM[i] = ((a->ELEM[i] == 0) || (b->ELEM[i] == 0) ||             \
671eb936dc0SMatheus Ferst                       (a->ELEM[i] != b->ELEM[i])) ? -1 : 0;                 \
672fcf5ef2aSThomas Huth     }                                                                       \
673fcf5ef2aSThomas Huth }
674eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZB, u8)
675eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZH, u16)
676eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZW, u32)
677eb936dc0SMatheus Ferst #undef VCMPNEZ
678fcf5ef2aSThomas Huth 
679fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record)                       \
680fcf5ef2aSThomas Huth     void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r,            \
681fcf5ef2aSThomas Huth                              ppc_avr_t *a, ppc_avr_t *b)                \
682fcf5ef2aSThomas Huth     {                                                                   \
683fcf5ef2aSThomas Huth         uint32_t ones = (uint32_t)-1;                                   \
684fcf5ef2aSThomas Huth         uint32_t all = ones;                                            \
685fcf5ef2aSThomas Huth         uint32_t none = 0;                                              \
686fcf5ef2aSThomas Huth         int i;                                                          \
687fcf5ef2aSThomas Huth                                                                         \
68805ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
689fcf5ef2aSThomas Huth             uint32_t result;                                            \
69071bfd65cSRichard Henderson             FloatRelation rel =                                         \
69171bfd65cSRichard Henderson                 float32_compare_quiet(a->f32[i], b->f32[i],             \
692fcf5ef2aSThomas Huth                                       &env->vec_status);                \
693fcf5ef2aSThomas Huth             if (rel == float_relation_unordered) {                      \
694fcf5ef2aSThomas Huth                 result = 0;                                             \
695fcf5ef2aSThomas Huth             } else if (rel compare order) {                             \
696fcf5ef2aSThomas Huth                 result = ones;                                          \
697fcf5ef2aSThomas Huth             } else {                                                    \
698fcf5ef2aSThomas Huth                 result = 0;                                             \
699fcf5ef2aSThomas Huth             }                                                           \
700fcf5ef2aSThomas Huth             r->u32[i] = result;                                         \
701fcf5ef2aSThomas Huth             all &= result;                                              \
702fcf5ef2aSThomas Huth             none |= result;                                             \
703fcf5ef2aSThomas Huth         }                                                               \
704fcf5ef2aSThomas Huth         if (record) {                                                   \
705fcf5ef2aSThomas Huth             env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1);       \
706fcf5ef2aSThomas Huth         }                                                               \
707fcf5ef2aSThomas Huth     }
708fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order)          \
709fcf5ef2aSThomas Huth     VCMPFP_DO(suffix, compare, order, 0)        \
710fcf5ef2aSThomas Huth     VCMPFP_DO(suffix##_dot, compare, order, 1)
711fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal)
712fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less)
713fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater)
714fcf5ef2aSThomas Huth #undef VCMPFP_DO
715fcf5ef2aSThomas Huth #undef VCMPFP
716fcf5ef2aSThomas Huth 
717fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r,
718fcf5ef2aSThomas Huth                                     ppc_avr_t *a, ppc_avr_t *b, int record)
719fcf5ef2aSThomas Huth {
720fcf5ef2aSThomas Huth     int i;
721fcf5ef2aSThomas Huth     int all_in = 0;
722fcf5ef2aSThomas Huth 
72305ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
72471bfd65cSRichard Henderson         FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i],
72505ee3e8aSMark Cave-Ayland                                                      &env->vec_status);
726fcf5ef2aSThomas Huth         if (le_rel == float_relation_unordered) {
727fcf5ef2aSThomas Huth             r->u32[i] = 0xc0000000;
728fcf5ef2aSThomas Huth             all_in = 1;
729fcf5ef2aSThomas Huth         } else {
73005ee3e8aSMark Cave-Ayland             float32 bneg = float32_chs(b->f32[i]);
73171bfd65cSRichard Henderson             FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg,
73205ee3e8aSMark Cave-Ayland                                                          &env->vec_status);
733fcf5ef2aSThomas Huth             int le = le_rel != float_relation_greater;
734fcf5ef2aSThomas Huth             int ge = ge_rel != float_relation_less;
735fcf5ef2aSThomas Huth 
736fcf5ef2aSThomas Huth             r->u32[i] = ((!le) << 31) | ((!ge) << 30);
737fcf5ef2aSThomas Huth             all_in |= (!le | !ge);
738fcf5ef2aSThomas Huth         }
739fcf5ef2aSThomas Huth     }
740fcf5ef2aSThomas Huth     if (record) {
741fcf5ef2aSThomas Huth         env->crf[6] = (all_in == 0) << 1;
742fcf5ef2aSThomas Huth     }
743fcf5ef2aSThomas Huth }
744fcf5ef2aSThomas Huth 
745fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
746fcf5ef2aSThomas Huth {
747fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 0);
748fcf5ef2aSThomas Huth }
749fcf5ef2aSThomas Huth 
750fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
751fcf5ef2aSThomas Huth                         ppc_avr_t *b)
752fcf5ef2aSThomas Huth {
753fcf5ef2aSThomas Huth     vcmpbfp_internal(env, r, a, b, 1);
754fcf5ef2aSThomas Huth }
755fcf5ef2aSThomas Huth 
756fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element)                                    \
757fcf5ef2aSThomas Huth     void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r,             \
758fcf5ef2aSThomas Huth                             ppc_avr_t *b, uint32_t uim)                 \
759fcf5ef2aSThomas Huth     {                                                                   \
760fcf5ef2aSThomas Huth         int i;                                                          \
761fcf5ef2aSThomas Huth         int sat = 0;                                                    \
762fcf5ef2aSThomas Huth         float_status s = env->vec_status;                               \
763fcf5ef2aSThomas Huth                                                                         \
764fcf5ef2aSThomas Huth         set_float_rounding_mode(float_round_to_zero, &s);               \
76505ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {                      \
76605ee3e8aSMark Cave-Ayland             if (float32_is_any_nan(b->f32[i])) {                        \
767fcf5ef2aSThomas Huth                 r->element[i] = 0;                                      \
768fcf5ef2aSThomas Huth             } else {                                                    \
76905ee3e8aSMark Cave-Ayland                 float64 t = float32_to_float64(b->f32[i], &s);          \
770fcf5ef2aSThomas Huth                 int64_t j;                                              \
771fcf5ef2aSThomas Huth                                                                         \
772fcf5ef2aSThomas Huth                 t = float64_scalbn(t, uim, &s);                         \
773fcf5ef2aSThomas Huth                 j = float64_to_int64(t, &s);                            \
774fcf5ef2aSThomas Huth                 r->element[i] = satcvt(j, &sat);                        \
775fcf5ef2aSThomas Huth             }                                                           \
776fcf5ef2aSThomas Huth         }                                                               \
777fcf5ef2aSThomas Huth         if (sat) {                                                      \
7786175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
779fcf5ef2aSThomas Huth         }                                                               \
780fcf5ef2aSThomas Huth     }
781fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32)
782fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32)
783fcf5ef2aSThomas Huth #undef VCT
784fcf5ef2aSThomas Huth 
/* Signature of the ger_rank* partial-sum routines handed to xviger(). */
typedef int64_t do_ger(uint32_t a, uint32_t b, uint32_t mask);
786*34553153SLucas Mateus Castro (alqotel) 
/*
 * Sum of products of the eight signed 4-bit fields of a and b.
 * Field n (bits 4n..4n+3) contributes only when bit n of mask is set.
 */
static int64_t ger_rank8(uint32_t a, uint32_t b, uint32_t mask)
{
    int64_t total = 0;

    for (int field = 0; field < 8; field++) {
        if (!((mask >> field) & 1)) {
            continue;
        }
        total += sextract32(a, 4 * field, 4) * sextract32(b, 4 * field, 4);
    }
    return total;
}
797*34553153SLucas Mateus Castro (alqotel) 
/*
 * Sum of products of the four 8-bit fields of a and b, where the fields of
 * a are sign-extended and the fields of b are zero-extended.
 * Field n (bits 8n..8n+7) contributes only when bit n of mask is set.
 */
static int64_t ger_rank4(uint32_t a, uint32_t b, uint32_t mask)
{
    int64_t total = 0;

    for (int field = 0; field < 4; field++) {
        if (!((mask >> field) & 1)) {
            continue;
        }
        total += sextract32(a, 8 * field, 8) *
                 (int64_t)extract32(b, 8 * field, 8);
    }
    return total;
}
808*34553153SLucas Mateus Castro (alqotel) 
/*
 * Sum of products of the two signed 16-bit fields of a and b.
 * Field n (bits 16n..16n+15) contributes only when bit n of mask is set.
 */
static int64_t ger_rank2(uint32_t a, uint32_t b, uint32_t mask)
{
    int64_t total = 0;

    for (int field = 0; field < 2; field++) {
        if (!((mask >> field) & 1)) {
            continue;
        }
        total += sextract32(a, 16 * field, 16) * sextract32(b, 16 * field, 16);
    }
    return total;
}
819*34553153SLucas Mateus Castro (alqotel) 
820*34553153SLucas Mateus Castro (alqotel) static void xviger(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, ppc_acc_t  *at,
821*34553153SLucas Mateus Castro (alqotel)                    uint32_t mask, bool sat, bool acc, do_ger ger)
822*34553153SLucas Mateus Castro (alqotel) {
823*34553153SLucas Mateus Castro (alqotel)     uint8_t pmsk = FIELD_EX32(mask, GER_MSK, PMSK),
824*34553153SLucas Mateus Castro (alqotel)             xmsk = FIELD_EX32(mask, GER_MSK, XMSK),
825*34553153SLucas Mateus Castro (alqotel)             ymsk = FIELD_EX32(mask, GER_MSK, YMSK);
826*34553153SLucas Mateus Castro (alqotel)     uint8_t xmsk_bit, ymsk_bit;
827*34553153SLucas Mateus Castro (alqotel)     int64_t psum;
828*34553153SLucas Mateus Castro (alqotel)     int i, j;
829*34553153SLucas Mateus Castro (alqotel)     for (i = 0, xmsk_bit = 1 << 3; i < 4; i++, xmsk_bit >>= 1) {
830*34553153SLucas Mateus Castro (alqotel)         for (j = 0, ymsk_bit = 1 << 3; j < 4; j++, ymsk_bit >>= 1) {
831*34553153SLucas Mateus Castro (alqotel)             if ((xmsk_bit & xmsk) && (ymsk_bit & ymsk)) {
832*34553153SLucas Mateus Castro (alqotel)                 psum = ger(a->VsrW(i), b->VsrW(j), pmsk);
833*34553153SLucas Mateus Castro (alqotel)                 if (acc) {
834*34553153SLucas Mateus Castro (alqotel)                     psum += at[i].VsrSW(j);
835*34553153SLucas Mateus Castro (alqotel)                 }
836*34553153SLucas Mateus Castro (alqotel)                 if (sat && psum > INT32_MAX) {
837*34553153SLucas Mateus Castro (alqotel)                     set_vscr_sat(env);
838*34553153SLucas Mateus Castro (alqotel)                     at[i].VsrSW(j) = INT32_MAX;
839*34553153SLucas Mateus Castro (alqotel)                 } else if (sat && psum < INT32_MIN) {
840*34553153SLucas Mateus Castro (alqotel)                     set_vscr_sat(env);
841*34553153SLucas Mateus Castro (alqotel)                     at[i].VsrSW(j) = INT32_MIN;
842*34553153SLucas Mateus Castro (alqotel)                 } else {
843*34553153SLucas Mateus Castro (alqotel)                     at[i].VsrSW(j) = (int32_t) psum;
844*34553153SLucas Mateus Castro (alqotel)                 }
845*34553153SLucas Mateus Castro (alqotel)             } else {
846*34553153SLucas Mateus Castro (alqotel)                 at[i].VsrSW(j) = 0;
847*34553153SLucas Mateus Castro (alqotel)             }
848*34553153SLucas Mateus Castro (alqotel)         }
849*34553153SLucas Mateus Castro (alqotel)     }
850*34553153SLucas Mateus Castro (alqotel) }
851*34553153SLucas Mateus Castro (alqotel) 
852*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
853*34553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
854*34553153SLucas Mateus Castro (alqotel)                      ppc_acc_t *at, uint32_t mask)
855*34553153SLucas Mateus Castro (alqotel) {
856*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, false, ger_rank8);
857*34553153SLucas Mateus Castro (alqotel) }
858*34553153SLucas Mateus Castro (alqotel) 
859*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
860*34553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
861*34553153SLucas Mateus Castro (alqotel)                        ppc_acc_t *at, uint32_t mask)
862*34553153SLucas Mateus Castro (alqotel) {
863*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, true, ger_rank8);
864*34553153SLucas Mateus Castro (alqotel) }
865*34553153SLucas Mateus Castro (alqotel) 
866*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
867*34553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
868*34553153SLucas Mateus Castro (alqotel)                      ppc_acc_t *at, uint32_t mask)
869*34553153SLucas Mateus Castro (alqotel) {
870*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, false, ger_rank4);
871*34553153SLucas Mateus Castro (alqotel) }
872*34553153SLucas Mateus Castro (alqotel) 
873*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
874*34553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
875*34553153SLucas Mateus Castro (alqotel)                        ppc_acc_t *at, uint32_t mask)
876*34553153SLucas Mateus Castro (alqotel) {
877*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, true, ger_rank4);
878*34553153SLucas Mateus Castro (alqotel) }
879*34553153SLucas Mateus Castro (alqotel) 
880*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
881*34553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4SPP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
882*34553153SLucas Mateus Castro (alqotel)                         ppc_acc_t *at, uint32_t mask)
883*34553153SLucas Mateus Castro (alqotel) {
884*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, true, true, ger_rank4);
885*34553153SLucas Mateus Castro (alqotel) }
886*34553153SLucas Mateus Castro (alqotel) 
887*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
888*34553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
889*34553153SLucas Mateus Castro (alqotel)                       ppc_acc_t *at, uint32_t mask)
890*34553153SLucas Mateus Castro (alqotel) {
891*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, false, ger_rank2);
892*34553153SLucas Mateus Castro (alqotel) }
893*34553153SLucas Mateus Castro (alqotel) 
894*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
895*34553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2S(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
896*34553153SLucas Mateus Castro (alqotel)                        ppc_acc_t *at, uint32_t mask)
897*34553153SLucas Mateus Castro (alqotel) {
898*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, true, false, ger_rank2);
899*34553153SLucas Mateus Castro (alqotel) }
900*34553153SLucas Mateus Castro (alqotel) 
901*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
902*34553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
903*34553153SLucas Mateus Castro (alqotel)                         ppc_acc_t *at, uint32_t mask)
904*34553153SLucas Mateus Castro (alqotel) {
905*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, false, true, ger_rank2);
906*34553153SLucas Mateus Castro (alqotel) }
907*34553153SLucas Mateus Castro (alqotel) 
908*34553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN
909*34553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2SPP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b,
910*34553153SLucas Mateus Castro (alqotel)                          ppc_acc_t *at, uint32_t mask)
911*34553153SLucas Mateus Castro (alqotel) {
912*34553153SLucas Mateus Castro (alqotel)     xviger(env, a, b, at, mask, true, true, ger_rank2);
913*34553153SLucas Mateus Castro (alqotel) }
914*34553153SLucas Mateus Castro (alqotel) 
915fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r)
916fcf5ef2aSThomas Huth {
917fcf5ef2aSThomas Huth     target_ulong count = 0;
918fcf5ef2aSThomas Huth     int i;
91960594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
92060594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
921fcf5ef2aSThomas Huth             break;
922fcf5ef2aSThomas Huth         }
923fcf5ef2aSThomas Huth         count++;
924fcf5ef2aSThomas Huth     }
925fcf5ef2aSThomas Huth     return count;
926fcf5ef2aSThomas Huth }
927fcf5ef2aSThomas Huth 
928fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r)
929fcf5ef2aSThomas Huth {
930fcf5ef2aSThomas Huth     target_ulong count = 0;
931fcf5ef2aSThomas Huth     int i;
932fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
93360594feaSMark Cave-Ayland         if (r->VsrB(i) & 0x01) {
934fcf5ef2aSThomas Huth             break;
935fcf5ef2aSThomas Huth         }
936fcf5ef2aSThomas Huth         count++;
937fcf5ef2aSThomas Huth     }
938fcf5ef2aSThomas Huth     return count;
939fcf5ef2aSThomas Huth }
940fcf5ef2aSThomas Huth 
941fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
942fcf5ef2aSThomas Huth                       ppc_avr_t *b, ppc_avr_t *c)
943fcf5ef2aSThomas Huth {
944fcf5ef2aSThomas Huth     int sat = 0;
945fcf5ef2aSThomas Huth     int i;
946fcf5ef2aSThomas Huth 
947fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
948fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
949fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
950fcf5ef2aSThomas Huth 
951fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
952fcf5ef2aSThomas Huth     }
953fcf5ef2aSThomas Huth 
954fcf5ef2aSThomas Huth     if (sat) {
9556175f5a0SRichard Henderson         set_vscr_sat(env);
956fcf5ef2aSThomas Huth     }
957fcf5ef2aSThomas Huth }
958fcf5ef2aSThomas Huth 
959fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
960fcf5ef2aSThomas Huth                        ppc_avr_t *b, ppc_avr_t *c)
961fcf5ef2aSThomas Huth {
962fcf5ef2aSThomas Huth     int sat = 0;
963fcf5ef2aSThomas Huth     int i;
964fcf5ef2aSThomas Huth 
965fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
966fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i] + 0x00004000;
967fcf5ef2aSThomas Huth         int32_t t = (int32_t)c->s16[i] + (prod >> 15);
968fcf5ef2aSThomas Huth         r->s16[i] = cvtswsh(t, &sat);
969fcf5ef2aSThomas Huth     }
970fcf5ef2aSThomas Huth 
971fcf5ef2aSThomas Huth     if (sat) {
9726175f5a0SRichard Henderson         set_vscr_sat(env);
973fcf5ef2aSThomas Huth     }
974fcf5ef2aSThomas Huth }
975fcf5ef2aSThomas Huth 
976fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
977fcf5ef2aSThomas Huth {
978fcf5ef2aSThomas Huth     int i;
979fcf5ef2aSThomas Huth 
980fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
981fcf5ef2aSThomas Huth         int32_t prod = a->s16[i] * b->s16[i];
982fcf5ef2aSThomas Huth         r->s16[i] = (int16_t) (prod + c->s16[i]);
983fcf5ef2aSThomas Huth     }
984fcf5ef2aSThomas Huth }
985fcf5ef2aSThomas Huth 
986d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs)                                  \
987fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)            \
988fcf5ef2aSThomas Huth     {                                                                        \
989fcf5ef2aSThomas Huth         ppc_avr_t result;                                                    \
990d81c2040SMark Cave-Ayland         int i, half = ARRAY_SIZE(r->element) / 2;                            \
991fcf5ef2aSThomas Huth                                                                              \
992d81c2040SMark Cave-Ayland         for (i = 0; i < half; i++) {                                         \
993d81c2040SMark Cave-Ayland             result.access(i * 2 + 0) = a->access(i + ofs);                   \
994d81c2040SMark Cave-Ayland             result.access(i * 2 + 1) = b->access(i + ofs);                   \
995fcf5ef2aSThomas Huth         }                                                                    \
996fcf5ef2aSThomas Huth         *r = result;                                                         \
997fcf5ef2aSThomas Huth     }
998d81c2040SMark Cave-Ayland 
999d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access)          \
1000d81c2040SMark Cave-Ayland     VMRG_DO(mrgl##suffix, element, access, half)   \
1001d81c2040SMark Cave-Ayland     VMRG_DO(mrgh##suffix, element, access, 0)
1002d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB)
1003d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH)
1004d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW)
1005fcf5ef2aSThomas Huth #undef VMRG_DO
1006fcf5ef2aSThomas Huth #undef VMRG
1007fcf5ef2aSThomas Huth 
1008b2dc03a5SMatheus Ferst void helper_VMSUMMBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1009fcf5ef2aSThomas Huth {
1010fcf5ef2aSThomas Huth     int32_t prod[16];
1011fcf5ef2aSThomas Huth     int i;
1012fcf5ef2aSThomas Huth 
1013fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s8); i++) {
1014fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s8[i] * b->u8[i];
1015fcf5ef2aSThomas Huth     }
1016fcf5ef2aSThomas Huth 
1017fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1018fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] +
1019fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
1020fcf5ef2aSThomas Huth     }
1021fcf5ef2aSThomas Huth }
1022fcf5ef2aSThomas Huth 
10236f52f731SMatheus Ferst void helper_VMSUMSHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1024fcf5ef2aSThomas Huth {
1025fcf5ef2aSThomas Huth     int32_t prod[8];
1026fcf5ef2aSThomas Huth     int i;
1027fcf5ef2aSThomas Huth 
1028fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
1029fcf5ef2aSThomas Huth         prod[i] = a->s16[i] * b->s16[i];
1030fcf5ef2aSThomas Huth     }
1031fcf5ef2aSThomas Huth 
1032fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1033fcf5ef2aSThomas Huth         r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1];
1034fcf5ef2aSThomas Huth     }
1035fcf5ef2aSThomas Huth }
1036fcf5ef2aSThomas Huth 
10376f52f731SMatheus Ferst void helper_VMSUMSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1038fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1039fcf5ef2aSThomas Huth {
1040fcf5ef2aSThomas Huth     int32_t prod[8];
1041fcf5ef2aSThomas Huth     int i;
1042fcf5ef2aSThomas Huth     int sat = 0;
1043fcf5ef2aSThomas Huth 
1044fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s16); i++) {
1045fcf5ef2aSThomas Huth         prod[i] = (int32_t)a->s16[i] * b->s16[i];
1046fcf5ef2aSThomas Huth     }
1047fcf5ef2aSThomas Huth 
1048fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1049fcf5ef2aSThomas Huth         int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1];
1050fcf5ef2aSThomas Huth 
1051fcf5ef2aSThomas Huth         r->u32[i] = cvtsdsw(t, &sat);
1052fcf5ef2aSThomas Huth     }
1053fcf5ef2aSThomas Huth 
1054fcf5ef2aSThomas Huth     if (sat) {
10556175f5a0SRichard Henderson         set_vscr_sat(env);
1056fcf5ef2aSThomas Huth     }
1057fcf5ef2aSThomas Huth }
1058fcf5ef2aSThomas Huth 
1059b2dc03a5SMatheus Ferst void helper_VMSUMUBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1060fcf5ef2aSThomas Huth {
1061fcf5ef2aSThomas Huth     uint16_t prod[16];
1062fcf5ef2aSThomas Huth     int i;
1063fcf5ef2aSThomas Huth 
1064fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
1065fcf5ef2aSThomas Huth         prod[i] = a->u8[i] * b->u8[i];
1066fcf5ef2aSThomas Huth     }
1067fcf5ef2aSThomas Huth 
1068fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
1069fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] +
1070fcf5ef2aSThomas Huth             prod[4 * i + 2] + prod[4 * i + 3];
1071fcf5ef2aSThomas Huth     }
1072fcf5ef2aSThomas Huth }
1073fcf5ef2aSThomas Huth 
107489a5a1aeSMatheus Ferst void helper_VMSUMUHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1075fcf5ef2aSThomas Huth {
1076fcf5ef2aSThomas Huth     uint32_t prod[8];
1077fcf5ef2aSThomas Huth     int i;
1078fcf5ef2aSThomas Huth 
1079fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
1080fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
1081fcf5ef2aSThomas Huth     }
1082fcf5ef2aSThomas Huth 
1083fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
1084fcf5ef2aSThomas Huth         r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1];
1085fcf5ef2aSThomas Huth     }
1086fcf5ef2aSThomas Huth }
1087fcf5ef2aSThomas Huth 
108889a5a1aeSMatheus Ferst void helper_VMSUMUHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a,
1089fcf5ef2aSThomas Huth                      ppc_avr_t *b, ppc_avr_t *c)
1090fcf5ef2aSThomas Huth {
1091fcf5ef2aSThomas Huth     uint32_t prod[8];
1092fcf5ef2aSThomas Huth     int i;
1093fcf5ef2aSThomas Huth     int sat = 0;
1094fcf5ef2aSThomas Huth 
1095fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u16); i++) {
1096fcf5ef2aSThomas Huth         prod[i] = a->u16[i] * b->u16[i];
1097fcf5ef2aSThomas Huth     }
1098fcf5ef2aSThomas Huth 
1099fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, s32) {
1100fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1];
1101fcf5ef2aSThomas Huth 
1102fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
1103fcf5ef2aSThomas Huth     }
1104fcf5ef2aSThomas Huth 
1105fcf5ef2aSThomas Huth     if (sat) {
11066175f5a0SRichard Henderson         set_vscr_sat(env);
1107fcf5ef2aSThomas Huth     }
1108fcf5ef2aSThomas Huth }
1109fcf5ef2aSThomas Huth 
11104fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast)   \
111180eca687SLucas Mateus Castro (alqotel)     void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
1112fcf5ef2aSThomas Huth     {                                                                   \
1113fcf5ef2aSThomas Huth         int i;                                                          \
1114fcf5ef2aSThomas Huth                                                                         \
11154fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
11164fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i) *           \
11174fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i);            \
1118fcf5ef2aSThomas Huth         }                                                               \
1119fcf5ef2aSThomas Huth     }
11204fbc89edSMark Cave-Ayland 
11214fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast)   \
112280eca687SLucas Mateus Castro (alqotel)     void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)       \
11234fbc89edSMark Cave-Ayland     {                                                                   \
11244fbc89edSMark Cave-Ayland         int i;                                                          \
11254fbc89edSMark Cave-Ayland                                                                         \
11264fbc89edSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) {           \
11274fbc89edSMark Cave-Ayland             r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) *       \
11284fbc89edSMark Cave-Ayland                                      (cast)b->mul_access(i + 1);        \
11294fbc89edSMark Cave-Ayland         }                                                               \
11304fbc89edSMark Cave-Ayland     }
11314fbc89edSMark Cave-Ayland 
11324fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast)       \
113380eca687SLucas Mateus Castro (alqotel)     VMUL_DO_EVN(MULE##suffix, mul_element, mul_access, prod_access, cast)  \
113480eca687SLucas Mateus Castro (alqotel)     VMUL_DO_ODD(MULO##suffix, mul_element, mul_access, prod_access, cast)
113580eca687SLucas Mateus Castro (alqotel) VMUL(SB, s8, VsrSB, VsrSH, int16_t)
113680eca687SLucas Mateus Castro (alqotel) VMUL(SH, s16, VsrSH, VsrSW, int32_t)
113780eca687SLucas Mateus Castro (alqotel) VMUL(SW, s32, VsrSW, VsrSD, int64_t)
113880eca687SLucas Mateus Castro (alqotel) VMUL(UB, u8, VsrB, VsrH, uint16_t)
113980eca687SLucas Mateus Castro (alqotel) VMUL(UH, u16, VsrH, VsrW, uint32_t)
114080eca687SLucas Mateus Castro (alqotel) VMUL(UW, u32, VsrW, VsrD, uint64_t)
11414fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN
11424fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD
1143fcf5ef2aSThomas Huth #undef VMUL
1144fcf5ef2aSThomas Huth 
114541c2877fSMatheus Ferst void helper_XXPERMX(ppc_vsr_t *t, ppc_vsr_t *s0, ppc_vsr_t *s1, ppc_vsr_t *pcv,
114641c2877fSMatheus Ferst                     target_ulong uim)
114741c2877fSMatheus Ferst {
114841c2877fSMatheus Ferst     int i, idx;
114941c2877fSMatheus Ferst     ppc_vsr_t tmp = { .u64 = {0, 0} };
115041c2877fSMatheus Ferst 
115141c2877fSMatheus Ferst     for (i = 0; i < ARRAY_SIZE(t->u8); i++) {
115241c2877fSMatheus Ferst         if ((pcv->VsrB(i) >> 5) == uim) {
115341c2877fSMatheus Ferst             idx = pcv->VsrB(i) & 0x1f;
115441c2877fSMatheus Ferst             if (idx < ARRAY_SIZE(t->u8)) {
115541c2877fSMatheus Ferst                 tmp.VsrB(i) = s0->VsrB(idx);
115641c2877fSMatheus Ferst             } else {
115741c2877fSMatheus Ferst                 tmp.VsrB(i) = s1->VsrB(idx - ARRAY_SIZE(t->u8));
115841c2877fSMatheus Ferst             }
115941c2877fSMatheus Ferst         }
116041c2877fSMatheus Ferst     }
116141c2877fSMatheus Ferst 
116241c2877fSMatheus Ferst     *t = tmp;
116341c2877fSMatheus Ferst }
116441c2877fSMatheus Ferst 
116528347fe2SMatheus Ferst void helper_VPERM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1166fcf5ef2aSThomas Huth {
1167fcf5ef2aSThomas Huth     ppc_avr_t result;
1168fcf5ef2aSThomas Huth     int i;
1169fcf5ef2aSThomas Huth 
117060594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
117160594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1172fcf5ef2aSThomas Huth         int index = s & 0xf;
1173fcf5ef2aSThomas Huth 
1174fcf5ef2aSThomas Huth         if (s & 0x10) {
117560594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1176fcf5ef2aSThomas Huth         } else {
117760594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1178fcf5ef2aSThomas Huth         }
1179fcf5ef2aSThomas Huth     }
1180fcf5ef2aSThomas Huth     *r = result;
1181fcf5ef2aSThomas Huth }
1182fcf5ef2aSThomas Huth 
118328347fe2SMatheus Ferst void helper_VPERMR(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
1184fcf5ef2aSThomas Huth {
1185fcf5ef2aSThomas Huth     ppc_avr_t result;
1186fcf5ef2aSThomas Huth     int i;
1187fcf5ef2aSThomas Huth 
118860594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
118960594feaSMark Cave-Ayland         int s = c->VsrB(i) & 0x1f;
1190fcf5ef2aSThomas Huth         int index = 15 - (s & 0xf);
1191fcf5ef2aSThomas Huth 
1192fcf5ef2aSThomas Huth         if (s & 0x10) {
119360594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1194fcf5ef2aSThomas Huth         } else {
119560594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index);
1196fcf5ef2aSThomas Huth         }
1197fcf5ef2aSThomas Huth     }
1198fcf5ef2aSThomas Huth     *r = result;
1199fcf5ef2aSThomas Huth }
1200fcf5ef2aSThomas Huth 
/*
 * Big-endian "expanded" control vector.  Elements are SZ bytes wide; an
 * element is selected when bit 0x80 of its first byte in b is set.  Selected
 * elements receive consecutive byte values counting up from 0; all other
 * bytes keep the default pattern 0x10..0x1F.
 */
#define XXGENPCV_BE_EXP(NAME, SZ) \
void glue(helper_, glue(NAME, _be_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \
{                                                                   \
    ppc_vsr_t out;                                                  \
    int next = 0;                                                   \
                                                                    \
    /* Value produced when no element is selected */                \
    out.VsrD(0) = 0x1011121314151617;                               \
    out.VsrD(1) = 0x18191A1B1C1D1E1F;                               \
                                                                    \
    for (int elem = 0; elem < ARRAY_SIZE(b->u8); elem += SZ) {      \
        if (!(b->VsrB(elem) & 0x80)) {                              \
            continue;                                               \
        }                                                           \
        /* Number the bytes of this element consecutively */        \
        for (int k = 0; k < SZ; k++) {                              \
            out.VsrB(elem + k) = next++;                            \
        }                                                           \
    }                                                               \
                                                                    \
    *t = out;                                                       \
}
1223618574ddSMatheus Ferst 
/*
 * Big-endian "compressed" control vector.  Elements are SZ bytes wide; an
 * element is selected when bit 0x80 of its first byte in b is set.  The byte
 * positions of the selected elements are written contiguously from byte 0 of
 * the result; the remaining bytes stay zero.
 */
#define XXGENPCV_BE_COMP(NAME, SZ) \
void glue(helper_, glue(NAME, _be_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\
{                                                                   \
    ppc_vsr_t out = { .u64 = { 0, 0 } };                            \
    int next = 0;                                                   \
                                                                    \
    for (int elem = 0; elem < ARRAY_SIZE(b->u8); elem += SZ) {      \
        if (!(b->VsrB(elem) & 0x80)) {                              \
            continue;                                               \
        }                                                           \
        /* Append the byte positions of this element */             \
        for (int k = 0; k < SZ; k++) {                              \
            out.VsrB(next++) = elem + k;                            \
        }                                                           \
    }                                                               \
                                                                    \
    *t = out;                                                       \
}
1242618574ddSMatheus Ferst 
/*
 * Little-endian "expanded" control vector.  Elements are SZ bytes wide and
 * are visited from the last one towards the first; an element is selected
 * when bit 0x80 of its first byte in b is set.  Within a selected element
 * the bytes are numbered from its last byte backwards, continuing the count
 * from the previously selected element.  Unselected bytes keep the default
 * pattern 0x1F..0x10.
 */
#define XXGENPCV_LE_EXP(NAME, SZ) \
void glue(helper_, glue(NAME, _le_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \
{                                                                   \
    ppc_vsr_t out;                                                  \
    int next = 0;                                                   \
                                                                    \
    /* Value produced when no element is selected */                \
    out.VsrD(0) = 0x1F1E1D1C1B1A1918;                               \
    out.VsrD(1) = 0x1716151413121110;                               \
                                                                    \
    for (int elem = 0; elem < ARRAY_SIZE(b->u8); elem += SZ) {      \
        /* First byte of the element, counted from the far end */   \
        const int base = ARRAY_SIZE(b->u8) - elem - SZ;             \
                                                                    \
        if (!(b->VsrB(base) & 0x80)) {                              \
            continue;                                               \
        }                                                           \
        for (int off = SZ - 1; off >= 0; off--) {                   \
            out.VsrB(base + off) = next++;                          \
        }                                                           \
    }                                                               \
                                                                    \
    *t = out;                                                       \
}
1267618574ddSMatheus Ferst 
/*
 * Little-endian "compressed" control vector.  Elements are SZ bytes wide and
 * are visited from the last one towards the first; an element is selected
 * when bit 0x80 of its first byte in b is set.  For each selected element,
 * its reversed byte positions are stored into the next free SZ-byte slot,
 * with slots allocated from the end of the result backwards.  Unused bytes
 * stay zero.
 */
#define XXGENPCV_LE_COMP(NAME, SZ) \
void glue(helper_, glue(NAME, _le_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\
{                                                                   \
    ppc_vsr_t out = { .u64 = { 0, 0 } };                            \
    int used = 0;                                                   \
                                                                    \
    for (int elem = 0; elem < ARRAY_SIZE(b->u8); elem += SZ) {      \
        if (!(b->VsrB(ARRAY_SIZE(b->u8) - elem - SZ) & 0x80)) {     \
            continue;                                               \
        }                                                           \
        /* Destination slot, counted from the far end */            \
        const int dst = ARRAY_SIZE(b->u8) - used - SZ;              \
                                                                    \
        for (int k = 0; k < SZ; k++) {                              \
            out.VsrB(dst + (SZ - 1 - k)) = elem + k;                \
        }                                                           \
        used += SZ;                                                 \
    }                                                               \
                                                                    \
    *t = out;                                                       \
}
1288b090f4f1SMatheus Ferst 
1289618574ddSMatheus Ferst #define XXGENPCV(NAME, SZ) \
1290618574ddSMatheus Ferst     XXGENPCV_BE_EXP(NAME, SZ)  \
1291618574ddSMatheus Ferst     XXGENPCV_BE_COMP(NAME, SZ) \
1292618574ddSMatheus Ferst     XXGENPCV_LE_EXP(NAME, SZ)  \
1293618574ddSMatheus Ferst     XXGENPCV_LE_COMP(NAME, SZ) \
1294618574ddSMatheus Ferst 
1295b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVBM, 1)
1296b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVHM, 2)
1297b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVWM, 4)
1298b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVDM, 8)
1299618574ddSMatheus Ferst 
1300618574ddSMatheus Ferst #undef XXGENPCV_BE_EXP
1301618574ddSMatheus Ferst #undef XXGENPCV_BE_COMP
1302618574ddSMatheus Ferst #undef XXGENPCV_LE_EXP
1303618574ddSMatheus Ferst #undef XXGENPCV_LE_COMP
1304b090f4f1SMatheus Ferst #undef XXGENPCV
1305b090f4f1SMatheus Ferst 
/*
 * Host-endian accessors for the bit-permute helpers.
 *
 * VBPERMQ_INDEX(avr, i)       byte i of avr
 * VBPERMD_INDEX(i)            u64[] slot holding doubleword i
 * VBPERMQ_DW(index)           u64[] slot holding bit "index" (0..127)
 * EXTRACT_BIT(avr, i, index)  bit "index" of doubleword i, where bit 0 is the
 *                             most significant bit
 *
 * u64[] elements are host-native integers, so the position of a bit inside
 * one is the same on every host: counting from the most significant bit,
 * bit "index" is at position 63 - index.  Only the choice of u64[] slot
 * depends on host endianness.  This matches the mask used by vbpermq,
 * 1ull << (63 - (index & 0x3F)).
 */
#if HOST_BIG_ENDIAN
#define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)])
#define VBPERMD_INDEX(i) (i)
#define VBPERMQ_DW(index) (((index) & 0x40) != 0)
#define EXTRACT_BIT(avr, i, index) \
        (extract64((avr)->u64[(i)], 63 - (index), 1))
#else
#define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)])
#define VBPERMD_INDEX(i) (1 - (i))
#define VBPERMQ_DW(index) (((index) & 0x40) == 0)
#define EXTRACT_BIT(avr, i, index) \
        (extract64((avr)->u64[1 - (i)], 63 - (index), 1))
#endif
1318fcf5ef2aSThomas Huth 
1319fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1320fcf5ef2aSThomas Huth {
1321fcf5ef2aSThomas Huth     int i, j;
1322fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
1323fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1324fcf5ef2aSThomas Huth         for (j = 0; j < 8; j++) {
1325fcf5ef2aSThomas Huth             int index = VBPERMQ_INDEX(b, (i * 8) + j);
1326fcf5ef2aSThomas Huth             if (index < 64 && EXTRACT_BIT(a, i, index)) {
1327fcf5ef2aSThomas Huth                 result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j);
1328fcf5ef2aSThomas Huth             }
1329fcf5ef2aSThomas Huth         }
1330fcf5ef2aSThomas Huth     }
1331fcf5ef2aSThomas Huth     *r = result;
1332fcf5ef2aSThomas Huth }
1333fcf5ef2aSThomas Huth 
1334fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1335fcf5ef2aSThomas Huth {
1336fcf5ef2aSThomas Huth     int i;
1337fcf5ef2aSThomas Huth     uint64_t perm = 0;
1338fcf5ef2aSThomas Huth 
1339fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
1340fcf5ef2aSThomas Huth         int index = VBPERMQ_INDEX(b, i);
1341fcf5ef2aSThomas Huth 
1342fcf5ef2aSThomas Huth         if (index < 128) {
1343fcf5ef2aSThomas Huth             uint64_t mask = (1ull << (63 - (index & 0x3F)));
1344fcf5ef2aSThomas Huth             if (a->u64[VBPERMQ_DW(index)] & mask) {
1345fcf5ef2aSThomas Huth                 perm |= (0x8000 >> i);
1346fcf5ef2aSThomas Huth             }
1347fcf5ef2aSThomas Huth         }
1348fcf5ef2aSThomas Huth     }
1349fcf5ef2aSThomas Huth 
13503c385a93SMark Cave-Ayland     r->VsrD(0) = perm;
13513c385a93SMark Cave-Ayland     r->VsrD(1) = 0;
1352fcf5ef2aSThomas Huth }
1353fcf5ef2aSThomas Huth 
1354fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX
1355fcf5ef2aSThomas Huth #undef VBPERMQ_DW
1356fcf5ef2aSThomas Huth 
1357fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp)                   \
1358fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)  \
1359fcf5ef2aSThomas Huth {                                                             \
1360fcf5ef2aSThomas Huth     int i, j;                                                 \
1361fcf5ef2aSThomas Huth     trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])];    \
1362fcf5ef2aSThomas Huth                                                               \
1363fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, srcfld) {                         \
1364fcf5ef2aSThomas Huth         prod[i] = 0;                                          \
1365fcf5ef2aSThomas Huth         for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) {      \
1366fcf5ef2aSThomas Huth             if (a->srcfld[i] & (1ull << j)) {                 \
1367fcf5ef2aSThomas Huth                 prod[i] ^= ((trgtyp)b->srcfld[i] << j);       \
1368fcf5ef2aSThomas Huth             }                                                 \
1369fcf5ef2aSThomas Huth         }                                                     \
1370fcf5ef2aSThomas Huth     }                                                         \
1371fcf5ef2aSThomas Huth                                                               \
1372fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, trgfld) {                         \
1373fcf5ef2aSThomas Huth         r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1];         \
1374fcf5ef2aSThomas Huth     }                                                         \
1375fcf5ef2aSThomas Huth }
1376fcf5ef2aSThomas Huth 
1377fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t)
1378fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t)
1379fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t)
1380fcf5ef2aSThomas Huth 
1381fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1382fcf5ef2aSThomas Huth {
1383fcf5ef2aSThomas Huth 
1384fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
1385fcf5ef2aSThomas Huth     int i, j;
1386fcf5ef2aSThomas Huth     __uint128_t prod[2];
1387fcf5ef2aSThomas Huth 
1388fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1389fcf5ef2aSThomas Huth         prod[i] = 0;
1390fcf5ef2aSThomas Huth         for (j = 0; j < 64; j++) {
1391fcf5ef2aSThomas Huth             if (a->u64[i] & (1ull << j)) {
1392fcf5ef2aSThomas Huth                 prod[i] ^= (((__uint128_t)b->u64[i]) << j);
1393fcf5ef2aSThomas Huth             }
1394fcf5ef2aSThomas Huth         }
1395fcf5ef2aSThomas Huth     }
1396fcf5ef2aSThomas Huth 
1397fcf5ef2aSThomas Huth     r->u128 = prod[0] ^ prod[1];
1398fcf5ef2aSThomas Huth 
1399fcf5ef2aSThomas Huth #else
1400fcf5ef2aSThomas Huth     int i, j;
1401fcf5ef2aSThomas Huth     ppc_avr_t prod[2];
1402fcf5ef2aSThomas Huth 
1403fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
14043c385a93SMark Cave-Ayland         prod[i].VsrD(1) = prod[i].VsrD(0) = 0;
1405fcf5ef2aSThomas Huth         for (j = 0; j < 64; j++) {
1406fcf5ef2aSThomas Huth             if (a->u64[i] & (1ull << j)) {
1407fcf5ef2aSThomas Huth                 ppc_avr_t bshift;
1408fcf5ef2aSThomas Huth                 if (j == 0) {
14093c385a93SMark Cave-Ayland                     bshift.VsrD(0) = 0;
14103c385a93SMark Cave-Ayland                     bshift.VsrD(1) = b->u64[i];
1411fcf5ef2aSThomas Huth                 } else {
14123c385a93SMark Cave-Ayland                     bshift.VsrD(0) = b->u64[i] >> (64 - j);
14133c385a93SMark Cave-Ayland                     bshift.VsrD(1) = b->u64[i] << j;
1414fcf5ef2aSThomas Huth                 }
14153c385a93SMark Cave-Ayland                 prod[i].VsrD(1) ^= bshift.VsrD(1);
14163c385a93SMark Cave-Ayland                 prod[i].VsrD(0) ^= bshift.VsrD(0);
1417fcf5ef2aSThomas Huth             }
1418fcf5ef2aSThomas Huth         }
1419fcf5ef2aSThomas Huth     }
1420fcf5ef2aSThomas Huth 
14213c385a93SMark Cave-Ayland     r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1);
14223c385a93SMark Cave-Ayland     r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0);
1423fcf5ef2aSThomas Huth #endif
1424fcf5ef2aSThomas Huth }
1425fcf5ef2aSThomas Huth 
1426fcf5ef2aSThomas Huth 
1427e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1428fcf5ef2aSThomas Huth #define PKBIG 1
1429fcf5ef2aSThomas Huth #else
1430fcf5ef2aSThomas Huth #define PKBIG 0
1431fcf5ef2aSThomas Huth #endif
1432fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1433fcf5ef2aSThomas Huth {
1434fcf5ef2aSThomas Huth     int i, j;
1435fcf5ef2aSThomas Huth     ppc_avr_t result;
1436e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1437fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { a, b };
1438fcf5ef2aSThomas Huth #else
1439fcf5ef2aSThomas Huth     const ppc_avr_t *x[2] = { b, a };
1440fcf5ef2aSThomas Huth #endif
1441fcf5ef2aSThomas Huth 
1442fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u64) {
1443fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(j, u32) {
1444fcf5ef2aSThomas Huth             uint32_t e = x[i]->u32[j];
1445fcf5ef2aSThomas Huth 
1446fcf5ef2aSThomas Huth             result.u16[4 * i + j] = (((e >> 9) & 0xfc00) |
1447fcf5ef2aSThomas Huth                                      ((e >> 6) & 0x3e0) |
1448fcf5ef2aSThomas Huth                                      ((e >> 3) & 0x1f));
1449fcf5ef2aSThomas Huth         }
1450fcf5ef2aSThomas Huth     }
1451fcf5ef2aSThomas Huth     *r = result;
1452fcf5ef2aSThomas Huth }
1453fcf5ef2aSThomas Huth 
1454fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat)                               \
1455fcf5ef2aSThomas Huth     void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r,             \
1456fcf5ef2aSThomas Huth                             ppc_avr_t *a, ppc_avr_t *b)                 \
1457fcf5ef2aSThomas Huth     {                                                                   \
1458fcf5ef2aSThomas Huth         int i;                                                          \
1459fcf5ef2aSThomas Huth         int sat = 0;                                                    \
1460fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
1461fcf5ef2aSThomas Huth         ppc_avr_t *a0 = PKBIG ? a : b;                                  \
1462fcf5ef2aSThomas Huth         ppc_avr_t *a1 = PKBIG ? b : a;                                  \
1463fcf5ef2aSThomas Huth                                                                         \
1464fcf5ef2aSThomas Huth         VECTOR_FOR_INORDER_I(i, from) {                                 \
1465fcf5ef2aSThomas Huth             result.to[i] = cvt(a0->from[i], &sat);                      \
1466fcf5ef2aSThomas Huth             result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\
1467fcf5ef2aSThomas Huth         }                                                               \
1468fcf5ef2aSThomas Huth         *r = result;                                                    \
1469fcf5ef2aSThomas Huth         if (dosat && sat) {                                             \
14706175f5a0SRichard Henderson             set_vscr_sat(env);                                          \
1471fcf5ef2aSThomas Huth         }                                                               \
1472fcf5ef2aSThomas Huth     }
1473fcf5ef2aSThomas Huth #define I(x, y) (x)
1474fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1)
1475fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1)
1476fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1)
1477fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1)
1478fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1)
1479fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1)
1480fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1)
1481fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1)
1482fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1)
1483fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0)
1484fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0)
1485fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0)
1486fcf5ef2aSThomas Huth #undef I
1487fcf5ef2aSThomas Huth #undef VPK
1488fcf5ef2aSThomas Huth #undef PKBIG
1489fcf5ef2aSThomas Huth 
1490fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1491fcf5ef2aSThomas Huth {
1492fcf5ef2aSThomas Huth     int i;
1493fcf5ef2aSThomas Huth 
149405ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
149505ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status);
1496fcf5ef2aSThomas Huth     }
1497fcf5ef2aSThomas Huth }
1498fcf5ef2aSThomas Huth 
1499fcf5ef2aSThomas Huth #define VRFI(suffix, rounding)                                  \
1500fcf5ef2aSThomas Huth     void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r,    \
1501fcf5ef2aSThomas Huth                              ppc_avr_t *b)                      \
1502fcf5ef2aSThomas Huth     {                                                           \
1503fcf5ef2aSThomas Huth         int i;                                                  \
1504fcf5ef2aSThomas Huth         float_status s = env->vec_status;                       \
1505fcf5ef2aSThomas Huth                                                                 \
1506fcf5ef2aSThomas Huth         set_float_rounding_mode(rounding, &s);                  \
150705ee3e8aSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->f32); i++) {              \
150805ee3e8aSMark Cave-Ayland             r->f32[i] = float32_round_to_int (b->f32[i], &s);   \
1509fcf5ef2aSThomas Huth         }                                                       \
1510fcf5ef2aSThomas Huth     }
1511fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even)
1512fcf5ef2aSThomas Huth VRFI(m, float_round_down)
1513fcf5ef2aSThomas Huth VRFI(p, float_round_up)
1514fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero)
1515fcf5ef2aSThomas Huth #undef VRFI
1516fcf5ef2aSThomas Huth 
1517fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1518fcf5ef2aSThomas Huth {
1519fcf5ef2aSThomas Huth     int i;
1520fcf5ef2aSThomas Huth 
152105ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
152205ee3e8aSMark Cave-Ayland         float32 t = float32_sqrt(b->f32[i], &env->vec_status);
1523fcf5ef2aSThomas Huth 
152405ee3e8aSMark Cave-Ayland         r->f32[i] = float32_div(float32_one, t, &env->vec_status);
1525fcf5ef2aSThomas Huth     }
1526fcf5ef2aSThomas Huth }
1527fcf5ef2aSThomas Huth 
1528fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert)                                  \
152902c74f0eSMatheus Ferst void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \
1530fcf5ef2aSThomas Huth {                                                                           \
1531fcf5ef2aSThomas Huth     int i;                                                                  \
1532fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                          \
1533fcf5ef2aSThomas Huth         uint##size##_t src1 = a->element[i];                                \
1534fcf5ef2aSThomas Huth         uint##size##_t src2 = b->element[i];                                \
1535fcf5ef2aSThomas Huth         uint##size##_t src3 = r->element[i];                                \
1536fcf5ef2aSThomas Huth         uint##size##_t begin, end, shift, mask, rot_val;                    \
1537fcf5ef2aSThomas Huth                                                                             \
1538fcf5ef2aSThomas Huth         shift = extract##size(src2, 0, 6);                                  \
1539fcf5ef2aSThomas Huth         end   = extract##size(src2, 8, 6);                                  \
1540fcf5ef2aSThomas Huth         begin = extract##size(src2, 16, 6);                                 \
1541fcf5ef2aSThomas Huth         rot_val = rol##size(src1, shift);                                   \
1542fcf5ef2aSThomas Huth         mask = mask_u##size(begin, end);                                    \
1543fcf5ef2aSThomas Huth         if (insert) {                                                       \
1544fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask) | (src3 & ~mask);              \
1545fcf5ef2aSThomas Huth         } else {                                                            \
1546fcf5ef2aSThomas Huth             r->element[i] = (rot_val & mask);                               \
1547fcf5ef2aSThomas Huth         }                                                                   \
1548fcf5ef2aSThomas Huth     }                                                                       \
1549fcf5ef2aSThomas Huth }
1550fcf5ef2aSThomas Huth 
155102c74f0eSMatheus Ferst VRLMI(VRLDMI, 64, u64, 1);
155202c74f0eSMatheus Ferst VRLMI(VRLWMI, 32, u32, 1);
155302c74f0eSMatheus Ferst VRLMI(VRLDNM, 64, u64, 0);
155402c74f0eSMatheus Ferst VRLMI(VRLWNM, 32, u32, 0);
1555fcf5ef2aSThomas Huth 
1556fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1557fcf5ef2aSThomas Huth {
1558fcf5ef2aSThomas Huth     int i;
1559fcf5ef2aSThomas Huth 
156005ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
156105ee3e8aSMark Cave-Ayland         r->f32[i] = float32_exp2(b->f32[i], &env->vec_status);
1562fcf5ef2aSThomas Huth     }
1563fcf5ef2aSThomas Huth }
1564fcf5ef2aSThomas Huth 
1565fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
1566fcf5ef2aSThomas Huth {
1567fcf5ef2aSThomas Huth     int i;
1568fcf5ef2aSThomas Huth 
156905ee3e8aSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->f32); i++) {
157005ee3e8aSMark Cave-Ayland         r->f32[i] = float32_log2(b->f32[i], &env->vec_status);
1571fcf5ef2aSThomas Huth     }
1572fcf5ef2aSThomas Huth }
1573fcf5ef2aSThomas Huth 
157460caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left)                            \
157560caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b)  \
157660caf221SAvinesh Kumar {                                                               \
1577f297c4c6SMatheus Ferst     int index = (a & 0xf) * 8;                                  \
157860caf221SAvinesh Kumar     if (left) {                                                 \
1579f297c4c6SMatheus Ferst         index = 128 - index - size;                             \
158060caf221SAvinesh Kumar     }                                                           \
158160caf221SAvinesh Kumar     return int128_getlo(int128_rshift(b->s128, index)) &        \
158260caf221SAvinesh Kumar         MAKE_64BIT_MASK(0, size);                               \
158360caf221SAvinesh Kumar }
158460caf221SAvinesh Kumar VEXTU_X_DO(vextublx,  8, 1)
158560caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1)
158660caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1)
158760caf221SAvinesh Kumar VEXTU_X_DO(vextubrx,  8, 0)
158860caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0)
158960caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0)
159060caf221SAvinesh Kumar #undef VEXTU_X_DO
159160caf221SAvinesh Kumar 
1592fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1593fcf5ef2aSThomas Huth {
1594fcf5ef2aSThomas Huth     int i;
1595fcf5ef2aSThomas Huth     unsigned int shift, bytes, size;
1596fcf5ef2aSThomas Huth 
1597fcf5ef2aSThomas Huth     size = ARRAY_SIZE(r->u8);
1598fcf5ef2aSThomas Huth     for (i = 0; i < size; i++) {
159963be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;             /* extract shift value */
160063be02fcSAnton Blanchard         bytes = (a->VsrB(i) << 8) +           /* extract adjacent bytes */
160163be02fcSAnton Blanchard             (((i + 1) < size) ? a->VsrB(i + 1) : 0);
160263be02fcSAnton Blanchard         r->VsrB(i) = (bytes << shift) >> 8;   /* shift and store result */
1603fcf5ef2aSThomas Huth     }
1604fcf5ef2aSThomas Huth }
1605fcf5ef2aSThomas Huth 
1606fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1607fcf5ef2aSThomas Huth {
1608fcf5ef2aSThomas Huth     int i;
1609fcf5ef2aSThomas Huth     unsigned int shift, bytes;
1610fcf5ef2aSThomas Huth 
1611b6cb41b2SDavid Gibson     /*
1612b6cb41b2SDavid Gibson      * Use reverse order, as destination and source register can be
1613b6cb41b2SDavid Gibson      * same. Its being modified in place saving temporary, reverse
1614b6cb41b2SDavid Gibson      * order will guarantee that computed result is not fed back.
1615fcf5ef2aSThomas Huth      */
1616fcf5ef2aSThomas Huth     for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) {
161763be02fcSAnton Blanchard         shift = b->VsrB(i) & 0x7;               /* extract shift value */
161863be02fcSAnton Blanchard         bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i);
1619fcf5ef2aSThomas Huth                                                 /* extract adjacent bytes */
162063be02fcSAnton Blanchard         r->VsrB(i) = (bytes >> shift) & 0xFF;   /* shift and store result */
1621fcf5ef2aSThomas Huth     }
1622fcf5ef2aSThomas Huth }
1623fcf5ef2aSThomas Huth 
1624fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift)
1625fcf5ef2aSThomas Huth {
1626fcf5ef2aSThomas Huth     int sh = shift & 0xf;
1627fcf5ef2aSThomas Huth     int i;
1628fcf5ef2aSThomas Huth     ppc_avr_t result;
1629fcf5ef2aSThomas Huth 
1630fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
1631fcf5ef2aSThomas Huth         int index = sh + i;
1632fcf5ef2aSThomas Huth         if (index > 0xf) {
163360594feaSMark Cave-Ayland             result.VsrB(i) = b->VsrB(index - 0x10);
1634fcf5ef2aSThomas Huth         } else {
163560594feaSMark Cave-Ayland             result.VsrB(i) = a->VsrB(index);
1636fcf5ef2aSThomas Huth         }
1637fcf5ef2aSThomas Huth     }
1638fcf5ef2aSThomas Huth     *r = result;
1639fcf5ef2aSThomas Huth }
1640fcf5ef2aSThomas Huth 
1641fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1642fcf5ef2aSThomas Huth {
16433c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1644fcf5ef2aSThomas Huth 
1645e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1646fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1647fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1648fcf5ef2aSThomas Huth #else
1649fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1650fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1651fcf5ef2aSThomas Huth #endif
1652fcf5ef2aSThomas Huth }
1653fcf5ef2aSThomas Huth 
1654e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
16552cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[IDX])
16562cc12af3SMatheus Ferst #else
16572cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[15 - (IDX)] - (SIZE) + 1)
16582cc12af3SMatheus Ferst #endif
16592cc12af3SMatheus Ferst 
16602cc12af3SMatheus Ferst #define VINSX(SUFFIX, TYPE) \
16612cc12af3SMatheus Ferst void glue(glue(helper_VINS, SUFFIX), LX)(CPUPPCState *env, ppc_avr_t *t,       \
16622cc12af3SMatheus Ferst                                          uint64_t val, target_ulong index)     \
16632cc12af3SMatheus Ferst {                                                                              \
16642cc12af3SMatheus Ferst     const int maxidx = ARRAY_SIZE(t->u8) - sizeof(TYPE);                       \
16652cc12af3SMatheus Ferst     target_long idx = index;                                                   \
16662cc12af3SMatheus Ferst                                                                                \
16672cc12af3SMatheus Ferst     if (idx < 0 || idx > maxidx) {                                             \
16682cc12af3SMatheus Ferst         idx =  idx < 0 ? sizeof(TYPE) - idx : idx;                             \
16692cc12af3SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR,                                         \
16702cc12af3SMatheus Ferst             "Invalid index for Vector Insert Element after 0x" TARGET_FMT_lx   \
16712cc12af3SMatheus Ferst             ", RA = " TARGET_FMT_ld " > %d\n", env->nip, idx, maxidx);         \
16722cc12af3SMatheus Ferst     } else {                                                                   \
16732cc12af3SMatheus Ferst         TYPE src = val;                                                        \
16742cc12af3SMatheus Ferst         memcpy(ELEM_ADDR(t, idx, sizeof(TYPE)), &src, sizeof(TYPE));           \
16752cc12af3SMatheus Ferst     }                                                                          \
16762cc12af3SMatheus Ferst }
16772cc12af3SMatheus Ferst VINSX(B, uint8_t)
16782cc12af3SMatheus Ferst VINSX(H, uint16_t)
16792cc12af3SMatheus Ferst VINSX(W, uint32_t)
16802cc12af3SMatheus Ferst VINSX(D, uint64_t)
16812cc12af3SMatheus Ferst #undef ELEM_ADDR
16822cc12af3SMatheus Ferst #undef VINSX
1683e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
168428110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
168528110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
168628110b72SMatheus Ferst                    target_ulong index)                                         \
168728110b72SMatheus Ferst {                                                                              \
168828110b72SMatheus Ferst     const target_long idx = index;                                             \
168928110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *a, *b };                                             \
169028110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
169128110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
169228110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2 - SIZE], (void *)tmp + idx, SIZE); \
169328110b72SMatheus Ferst     } else {                                                                   \
169428110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
169528110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
169628110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
169728110b72SMatheus Ferst     }                                                                          \
169828110b72SMatheus Ferst }
169928110b72SMatheus Ferst #else
170028110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \
170128110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \
170228110b72SMatheus Ferst                    target_ulong index)                                         \
170328110b72SMatheus Ferst {                                                                              \
170428110b72SMatheus Ferst     const target_long idx = index;                                             \
170528110b72SMatheus Ferst     ppc_avr_t tmp[2] = { *b, *a };                                             \
170628110b72SMatheus Ferst     memset(t, 0, sizeof(*t));                                                  \
170728110b72SMatheus Ferst     if (idx >= 0 && idx + SIZE <= sizeof(tmp)) {                               \
170828110b72SMatheus Ferst         memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2],                                  \
170928110b72SMatheus Ferst                (void *)tmp + sizeof(tmp) - SIZE - idx, SIZE);                  \
171028110b72SMatheus Ferst     } else {                                                                   \
171128110b72SMatheus Ferst         qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x"  \
171228110b72SMatheus Ferst                       TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n",         \
171328110b72SMatheus Ferst                       env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE);        \
171428110b72SMatheus Ferst     }                                                                          \
171528110b72SMatheus Ferst }
171628110b72SMatheus Ferst #endif
171728110b72SMatheus Ferst VEXTDVLX(VEXTDUBVLX, 1)
171828110b72SMatheus Ferst VEXTDVLX(VEXTDUHVLX, 2)
171928110b72SMatheus Ferst VEXTDVLX(VEXTDUWVLX, 4)
172028110b72SMatheus Ferst VEXTDVLX(VEXTDDVLX, 8)
172128110b72SMatheus Ferst #undef VEXTDVLX
1722e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1723fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1724fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1725fcf5ef2aSThomas Huth     {                                                                        \
1726fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1727fcf5ef2aSThomas Huth         memmove(&r->u8[8 - es], &b->u8[index], es);                          \
1728fcf5ef2aSThomas Huth         memset(&r->u8[8], 0, 8);                                             \
1729fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8 - es);                                        \
1730fcf5ef2aSThomas Huth     }
1731fcf5ef2aSThomas Huth #else
1732fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element)                                            \
1733fcf5ef2aSThomas Huth     void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \
1734fcf5ef2aSThomas Huth     {                                                                        \
1735fcf5ef2aSThomas Huth         uint32_t es = sizeof(r->element[0]);                                 \
1736fcf5ef2aSThomas Huth         uint32_t s = (16 - index) - es;                                      \
1737fcf5ef2aSThomas Huth         memmove(&r->u8[8], &b->u8[s], es);                                   \
1738fcf5ef2aSThomas Huth         memset(&r->u8[0], 0, 8);                                             \
1739fcf5ef2aSThomas Huth         memset(&r->u8[8 + es], 0, 8 - es);                                   \
1740fcf5ef2aSThomas Huth     }
1741fcf5ef2aSThomas Huth #endif
1742fcf5ef2aSThomas Huth VEXTRACT(ub, u8)
1743fcf5ef2aSThomas Huth VEXTRACT(uh, u16)
1744fcf5ef2aSThomas Huth VEXTRACT(uw, u32)
1745fcf5ef2aSThomas Huth VEXTRACT(d, u64)
1746fcf5ef2aSThomas Huth #undef VEXTRACT
1747fcf5ef2aSThomas Huth 
1748fb5303ccSMatheus Ferst #define VSTRI(NAME, ELEM, NUM_ELEMS, LEFT) \
1749fb5303ccSMatheus Ferst uint32_t helper_##NAME(ppc_avr_t *t, ppc_avr_t *b) \
1750fb5303ccSMatheus Ferst {                                                   \
1751fb5303ccSMatheus Ferst     int i, idx, crf = 0;                            \
1752fb5303ccSMatheus Ferst                                                     \
1753fb5303ccSMatheus Ferst     for (i = 0; i < NUM_ELEMS; i++) {               \
1754fb5303ccSMatheus Ferst         idx = LEFT ? i : NUM_ELEMS - i - 1;         \
1755fb5303ccSMatheus Ferst         if (b->Vsr##ELEM(idx)) {                    \
1756fb5303ccSMatheus Ferst             t->Vsr##ELEM(idx) = b->Vsr##ELEM(idx);  \
1757fb5303ccSMatheus Ferst         } else {                                    \
1758fb5303ccSMatheus Ferst             crf = 0b0010;                           \
1759fb5303ccSMatheus Ferst             break;                                  \
1760fb5303ccSMatheus Ferst         }                                           \
1761fb5303ccSMatheus Ferst     }                                               \
1762fb5303ccSMatheus Ferst                                                     \
1763fb5303ccSMatheus Ferst     for (; i < NUM_ELEMS; i++) {                    \
1764fb5303ccSMatheus Ferst         idx = LEFT ? i : NUM_ELEMS - i - 1;         \
1765fb5303ccSMatheus Ferst         t->Vsr##ELEM(idx) = 0;                      \
1766fb5303ccSMatheus Ferst     }                                               \
1767fb5303ccSMatheus Ferst                                                     \
1768fb5303ccSMatheus Ferst     return crf;                                     \
1769fb5303ccSMatheus Ferst }
1770fb5303ccSMatheus Ferst VSTRI(VSTRIBL, B, 16, true)
1771fb5303ccSMatheus Ferst VSTRI(VSTRIBR, B, 16, false)
1772fb5303ccSMatheus Ferst VSTRI(VSTRIHL, H, 8, true)
1773fb5303ccSMatheus Ferst VSTRI(VSTRIHR, H, 8, false)
1774fb5303ccSMatheus Ferst #undef VSTRI
1775fb5303ccSMatheus Ferst 
17768f5eeee3SMatheus Ferst void helper_XXEXTRACTUW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index)
17778ad901e5SNikunj A Dadhania {
177803b32c09SMark Cave-Ayland     ppc_vsr_t t = { };
17798ad901e5SNikunj A Dadhania     size_t es = sizeof(uint32_t);
17808ad901e5SNikunj A Dadhania     uint32_t ext_index;
17818ad901e5SNikunj A Dadhania     int i;
17828ad901e5SNikunj A Dadhania 
17838ad901e5SNikunj A Dadhania     ext_index = index;
17848ad901e5SNikunj A Dadhania     for (i = 0; i < es; i++, ext_index++) {
178503b32c09SMark Cave-Ayland         t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16);
17868ad901e5SNikunj A Dadhania     }
17878ad901e5SNikunj A Dadhania 
178803b32c09SMark Cave-Ayland     *xt = t;
17898ad901e5SNikunj A Dadhania }
17908ad901e5SNikunj A Dadhania 
17918f5eeee3SMatheus Ferst void helper_XXINSERTW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index)
17923398b742SNikunj A Dadhania {
179303b32c09SMark Cave-Ayland     ppc_vsr_t t = *xt;
17943398b742SNikunj A Dadhania     size_t es = sizeof(uint32_t);
17953398b742SNikunj A Dadhania     int ins_index, i = 0;
17963398b742SNikunj A Dadhania 
17973398b742SNikunj A Dadhania     ins_index = index;
17983398b742SNikunj A Dadhania     for (i = 0; i < es && ins_index < 16; i++, ins_index++) {
179903b32c09SMark Cave-Ayland         t.VsrB(ins_index) = xb->VsrB(8 - es + i);
18003398b742SNikunj A Dadhania     }
18013398b742SNikunj A Dadhania 
180203b32c09SMark Cave-Ayland     *xt = t;
18033398b742SNikunj A Dadhania }
18043398b742SNikunj A Dadhania 
18051015fcabSMatheus Ferst void helper_XXEVAL(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c,
18061015fcabSMatheus Ferst                    uint32_t desc)
18071015fcabSMatheus Ferst {
18081015fcabSMatheus Ferst     /*
18091015fcabSMatheus Ferst      * Instead of processing imm bit-by-bit, we'll skip the computation of
18101015fcabSMatheus Ferst      * conjunctions whose corresponding bit is unset.
18111015fcabSMatheus Ferst      */
18121015fcabSMatheus Ferst     int bit, imm = simd_data(desc);
18131015fcabSMatheus Ferst     Int128 conj, disj = int128_zero();
18141015fcabSMatheus Ferst 
18151015fcabSMatheus Ferst     /* Iterate over set bits from the least to the most significant bit */
18161015fcabSMatheus Ferst     while (imm) {
18171015fcabSMatheus Ferst         /*
18181015fcabSMatheus Ferst          * Get the next bit to be processed with ctz64. Invert the result of
18191015fcabSMatheus Ferst          * ctz64 to match the indexing used by PowerISA.
18201015fcabSMatheus Ferst          */
18211015fcabSMatheus Ferst         bit = 7 - ctzl(imm);
18221015fcabSMatheus Ferst         if (bit & 0x4) {
18231015fcabSMatheus Ferst             conj = a->s128;
18241015fcabSMatheus Ferst         } else {
18251015fcabSMatheus Ferst             conj = int128_not(a->s128);
18261015fcabSMatheus Ferst         }
18271015fcabSMatheus Ferst         if (bit & 0x2) {
18281015fcabSMatheus Ferst             conj = int128_and(conj, b->s128);
18291015fcabSMatheus Ferst         } else {
18301015fcabSMatheus Ferst             conj = int128_and(conj, int128_not(b->s128));
18311015fcabSMatheus Ferst         }
18321015fcabSMatheus Ferst         if (bit & 0x1) {
18331015fcabSMatheus Ferst             conj = int128_and(conj, c->s128);
18341015fcabSMatheus Ferst         } else {
18351015fcabSMatheus Ferst             conj = int128_and(conj, int128_not(c->s128));
18361015fcabSMatheus Ferst         }
18371015fcabSMatheus Ferst         disj = int128_or(disj, conj);
18381015fcabSMatheus Ferst 
18391015fcabSMatheus Ferst         /* Unset the least significant bit that is set */
18401015fcabSMatheus Ferst         imm &= imm - 1;
18411015fcabSMatheus Ferst     }
18421015fcabSMatheus Ferst 
18431015fcabSMatheus Ferst     t->s128 = disj;
18441015fcabSMatheus Ferst }
18451015fcabSMatheus Ferst 
1846788c6399SMatheus Ferst #define XXBLEND(name, sz) \
1847788c6399SMatheus Ferst void glue(helper_XXBLENDV, name)(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b,  \
1848788c6399SMatheus Ferst                                  ppc_avr_t *c, uint32_t desc)               \
1849788c6399SMatheus Ferst {                                                                           \
1850788c6399SMatheus Ferst     for (int i = 0; i < ARRAY_SIZE(t->glue(u, sz)); i++) {                  \
1851788c6399SMatheus Ferst         t->glue(u, sz)[i] = (c->glue(s, sz)[i] >> (sz - 1)) ?               \
1852788c6399SMatheus Ferst             b->glue(u, sz)[i] : a->glue(u, sz)[i];                          \
1853788c6399SMatheus Ferst     }                                                                       \
1854788c6399SMatheus Ferst }
1855788c6399SMatheus Ferst XXBLEND(B, 8)
1856788c6399SMatheus Ferst XXBLEND(H, 16)
1857788c6399SMatheus Ferst XXBLEND(W, 32)
1858788c6399SMatheus Ferst XXBLEND(D, 64)
1859788c6399SMatheus Ferst #undef XXBLEND
1860788c6399SMatheus Ferst 
1861fcf5ef2aSThomas Huth #define VNEG(name, element)                                         \
1862fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b)                      \
1863fcf5ef2aSThomas Huth {                                                                   \
1864fcf5ef2aSThomas Huth     int i;                                                          \
186560594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
1866fcf5ef2aSThomas Huth         r->element[i] = -b->element[i];                             \
1867fcf5ef2aSThomas Huth     }                                                               \
1868fcf5ef2aSThomas Huth }
1869fcf5ef2aSThomas Huth VNEG(vnegw, s32)
1870fcf5ef2aSThomas Huth VNEG(vnegd, s64)
1871fcf5ef2aSThomas Huth #undef VNEG
1872fcf5ef2aSThomas Huth 
1873fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1874fcf5ef2aSThomas Huth {
18753c385a93SMark Cave-Ayland     int sh = (b->VsrB(0xf) >> 3) & 0xf;
1876fcf5ef2aSThomas Huth 
1877e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1878fcf5ef2aSThomas Huth     memmove(&r->u8[sh], &a->u8[0], 16 - sh);
1879fcf5ef2aSThomas Huth     memset(&r->u8[0], 0, sh);
1880fcf5ef2aSThomas Huth #else
1881fcf5ef2aSThomas Huth     memmove(&r->u8[0], &a->u8[sh], 16 - sh);
1882fcf5ef2aSThomas Huth     memset(&r->u8[16 - sh], 0, sh);
1883fcf5ef2aSThomas Huth #endif
1884fcf5ef2aSThomas Huth }
1885fcf5ef2aSThomas Huth 
1886fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1887fcf5ef2aSThomas Huth {
1888fcf5ef2aSThomas Huth     int i;
1889fcf5ef2aSThomas Huth 
1890fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
1891fcf5ef2aSThomas Huth         r->u32[i] = a->u32[i] >= b->u32[i];
1892fcf5ef2aSThomas Huth     }
1893fcf5ef2aSThomas Huth }
1894fcf5ef2aSThomas Huth 
1895fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1896fcf5ef2aSThomas Huth {
1897fcf5ef2aSThomas Huth     int64_t t;
1898fcf5ef2aSThomas Huth     int i, upper;
1899fcf5ef2aSThomas Huth     ppc_avr_t result;
1900fcf5ef2aSThomas Huth     int sat = 0;
1901fcf5ef2aSThomas Huth 
1902fcf5ef2aSThomas Huth     upper = ARRAY_SIZE(r->s32) - 1;
190360594feaSMark Cave-Ayland     t = (int64_t)b->VsrSW(upper);
1904fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
190560594feaSMark Cave-Ayland         t += a->VsrSW(i);
190660594feaSMark Cave-Ayland         result.VsrSW(i) = 0;
1907fcf5ef2aSThomas Huth     }
190860594feaSMark Cave-Ayland     result.VsrSW(upper) = cvtsdsw(t, &sat);
1909fcf5ef2aSThomas Huth     *r = result;
1910fcf5ef2aSThomas Huth 
1911fcf5ef2aSThomas Huth     if (sat) {
19126175f5a0SRichard Henderson         set_vscr_sat(env);
1913fcf5ef2aSThomas Huth     }
1914fcf5ef2aSThomas Huth }
1915fcf5ef2aSThomas Huth 
1916fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1917fcf5ef2aSThomas Huth {
1918fcf5ef2aSThomas Huth     int i, j, upper;
1919fcf5ef2aSThomas Huth     ppc_avr_t result;
1920fcf5ef2aSThomas Huth     int sat = 0;
1921fcf5ef2aSThomas Huth 
1922fcf5ef2aSThomas Huth     upper = 1;
1923fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
192460594feaSMark Cave-Ayland         int64_t t = (int64_t)b->VsrSW(upper + i * 2);
1925fcf5ef2aSThomas Huth 
19267fa0ddc1SAnton Blanchard         result.VsrD(i) = 0;
1927fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u64); j++) {
192860594feaSMark Cave-Ayland             t += a->VsrSW(2 * i + j);
1929fcf5ef2aSThomas Huth         }
193060594feaSMark Cave-Ayland         result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat);
1931fcf5ef2aSThomas Huth     }
1932fcf5ef2aSThomas Huth 
1933fcf5ef2aSThomas Huth     *r = result;
1934fcf5ef2aSThomas Huth     if (sat) {
19356175f5a0SRichard Henderson         set_vscr_sat(env);
1936fcf5ef2aSThomas Huth     }
1937fcf5ef2aSThomas Huth }
1938fcf5ef2aSThomas Huth 
1939fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1940fcf5ef2aSThomas Huth {
1941fcf5ef2aSThomas Huth     int i, j;
1942fcf5ef2aSThomas Huth     int sat = 0;
1943fcf5ef2aSThomas Huth 
1944fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1945fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1946fcf5ef2aSThomas Huth 
1947fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->s32); j++) {
1948fcf5ef2aSThomas Huth             t += a->s8[4 * i + j];
1949fcf5ef2aSThomas Huth         }
1950fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1951fcf5ef2aSThomas Huth     }
1952fcf5ef2aSThomas Huth 
1953fcf5ef2aSThomas Huth     if (sat) {
19546175f5a0SRichard Henderson         set_vscr_sat(env);
1955fcf5ef2aSThomas Huth     }
1956fcf5ef2aSThomas Huth }
1957fcf5ef2aSThomas Huth 
1958fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1959fcf5ef2aSThomas Huth {
1960fcf5ef2aSThomas Huth     int sat = 0;
1961fcf5ef2aSThomas Huth     int i;
1962fcf5ef2aSThomas Huth 
1963fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->s32); i++) {
1964fcf5ef2aSThomas Huth         int64_t t = (int64_t)b->s32[i];
1965fcf5ef2aSThomas Huth 
1966fcf5ef2aSThomas Huth         t += a->s16[2 * i] + a->s16[2 * i + 1];
1967fcf5ef2aSThomas Huth         r->s32[i] = cvtsdsw(t, &sat);
1968fcf5ef2aSThomas Huth     }
1969fcf5ef2aSThomas Huth 
1970fcf5ef2aSThomas Huth     if (sat) {
19716175f5a0SRichard Henderson         set_vscr_sat(env);
1972fcf5ef2aSThomas Huth     }
1973fcf5ef2aSThomas Huth }
1974fcf5ef2aSThomas Huth 
1975fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
1976fcf5ef2aSThomas Huth {
1977fcf5ef2aSThomas Huth     int i, j;
1978fcf5ef2aSThomas Huth     int sat = 0;
1979fcf5ef2aSThomas Huth 
1980fcf5ef2aSThomas Huth     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
1981fcf5ef2aSThomas Huth         uint64_t t = (uint64_t)b->u32[i];
1982fcf5ef2aSThomas Huth 
1983fcf5ef2aSThomas Huth         for (j = 0; j < ARRAY_SIZE(r->u32); j++) {
1984fcf5ef2aSThomas Huth             t += a->u8[4 * i + j];
1985fcf5ef2aSThomas Huth         }
1986fcf5ef2aSThomas Huth         r->u32[i] = cvtuduw(t, &sat);
1987fcf5ef2aSThomas Huth     }
1988fcf5ef2aSThomas Huth 
1989fcf5ef2aSThomas Huth     if (sat) {
19906175f5a0SRichard Henderson         set_vscr_sat(env);
1991fcf5ef2aSThomas Huth     }
1992fcf5ef2aSThomas Huth }
1993fcf5ef2aSThomas Huth 
1994e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN
1995fcf5ef2aSThomas Huth #define UPKHI 1
1996fcf5ef2aSThomas Huth #define UPKLO 0
1997fcf5ef2aSThomas Huth #else
1998fcf5ef2aSThomas Huth #define UPKHI 0
1999fcf5ef2aSThomas Huth #define UPKLO 1
2000fcf5ef2aSThomas Huth #endif
2001fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi)                                              \
2002fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
2003fcf5ef2aSThomas Huth     {                                                                   \
2004fcf5ef2aSThomas Huth         int i;                                                          \
2005fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
2006fcf5ef2aSThomas Huth                                                                         \
2007fcf5ef2aSThomas Huth         for (i = 0; i < ARRAY_SIZE(r->u32); i++) {                      \
2008fcf5ef2aSThomas Huth             uint16_t e = b->u16[hi ? i : i + 4];                        \
2009fcf5ef2aSThomas Huth             uint8_t a = (e >> 15) ? 0xff : 0;                           \
2010fcf5ef2aSThomas Huth             uint8_t r = (e >> 10) & 0x1f;                               \
2011fcf5ef2aSThomas Huth             uint8_t g = (e >> 5) & 0x1f;                                \
2012fcf5ef2aSThomas Huth             uint8_t b = e & 0x1f;                                       \
2013fcf5ef2aSThomas Huth                                                                         \
2014fcf5ef2aSThomas Huth             result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b;       \
2015fcf5ef2aSThomas Huth         }                                                               \
2016fcf5ef2aSThomas Huth         *r = result;                                                    \
2017fcf5ef2aSThomas Huth     }
2018fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO)
2019fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI)
2020fcf5ef2aSThomas Huth #undef VUPKPX
2021fcf5ef2aSThomas Huth 
2022fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi)                              \
2023fcf5ef2aSThomas Huth     void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
2024fcf5ef2aSThomas Huth     {                                                                   \
2025fcf5ef2aSThomas Huth         int i;                                                          \
2026fcf5ef2aSThomas Huth         ppc_avr_t result;                                               \
2027fcf5ef2aSThomas Huth                                                                         \
2028fcf5ef2aSThomas Huth         if (hi) {                                                       \
2029fcf5ef2aSThomas Huth             for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) {             \
2030fcf5ef2aSThomas Huth                 result.unpacked[i] = b->packee[i];                      \
2031fcf5ef2aSThomas Huth             }                                                           \
2032fcf5ef2aSThomas Huth         } else {                                                        \
2033fcf5ef2aSThomas Huth             for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \
2034fcf5ef2aSThomas Huth                  i++) {                                                 \
2035fcf5ef2aSThomas Huth                 result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \
2036fcf5ef2aSThomas Huth             }                                                           \
2037fcf5ef2aSThomas Huth         }                                                               \
2038fcf5ef2aSThomas Huth         *r = result;                                                    \
2039fcf5ef2aSThomas Huth     }
2040fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI)
2041fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI)
2042fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI)
2043fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO)
2044fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO)
2045fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO)
2046fcf5ef2aSThomas Huth #undef VUPK
2047fcf5ef2aSThomas Huth #undef UPKHI
2048fcf5ef2aSThomas Huth #undef UPKLO
2049fcf5ef2aSThomas Huth 
2050fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element)                                      \
2051fcf5ef2aSThomas Huth     void helper_v##name(ppc_avr_t *r, ppc_avr_t *b)                     \
2052fcf5ef2aSThomas Huth     {                                                                   \
2053fcf5ef2aSThomas Huth         int i;                                                          \
2054fcf5ef2aSThomas Huth                                                                         \
205560594feaSMark Cave-Ayland         for (i = 0; i < ARRAY_SIZE(r->element); i++) {                  \
2056fcf5ef2aSThomas Huth             r->element[i] = name(b->element[i]);                        \
2057fcf5ef2aSThomas Huth         }                                                               \
2058fcf5ef2aSThomas Huth     }
2059fcf5ef2aSThomas Huth 
2060fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8)
2061fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16)
2062fcf5ef2aSThomas Huth 
2063fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8)
2064fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16)
2065fcf5ef2aSThomas Huth 
2066fcf5ef2aSThomas Huth #undef clzb
2067fcf5ef2aSThomas Huth #undef clzh
2068fcf5ef2aSThomas Huth 
2069fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8)
2070fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16)
2071fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v))
2072fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v))
2073fcf5ef2aSThomas Huth 
2074fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8)
2075fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16)
2076fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32)
2077fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64)
2078fcf5ef2aSThomas Huth 
2079fcf5ef2aSThomas Huth #undef ctzb
2080fcf5ef2aSThomas Huth #undef ctzh
2081fcf5ef2aSThomas Huth #undef ctzw
2082fcf5ef2aSThomas Huth #undef ctzd
2083fcf5ef2aSThomas Huth 
2084fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v)
2085fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v)
2086fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v)
2087fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v)
2088fcf5ef2aSThomas Huth 
2089fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8)
2090fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16)
2091fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32)
2092fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64)
2093fcf5ef2aSThomas Huth 
2094fcf5ef2aSThomas Huth #undef popcntb
2095fcf5ef2aSThomas Huth #undef popcnth
2096fcf5ef2aSThomas Huth #undef popcntw
2097fcf5ef2aSThomas Huth #undef popcntd
2098fcf5ef2aSThomas Huth 
2099fcf5ef2aSThomas Huth #undef VGENERIC_DO
2100fcf5ef2aSThomas Huth 
/*
 * Initializer for a ppc_avr_t used as the constant "one" by the
 * non-INT128 quadword add/subtract helpers.  Which u64 slot receives the
 * 1 depends on the host byte order.
 */
#if !HOST_BIG_ENDIAN
#define QW_ONE { .u64 = { 1, 0 } }
#else
#define QW_ONE { .u64 = { 0, 1 } }
#endif
2106fcf5ef2aSThomas Huth 
2107fcf5ef2aSThomas Huth #ifndef CONFIG_INT128
2108fcf5ef2aSThomas Huth 
2109fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a)
2110fcf5ef2aSThomas Huth {
2111fcf5ef2aSThomas Huth     t->u64[0] = ~a.u64[0];
2112fcf5ef2aSThomas Huth     t->u64[1] = ~a.u64[1];
2113fcf5ef2aSThomas Huth }
2114fcf5ef2aSThomas Huth 
2115fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b)
2116fcf5ef2aSThomas Huth {
21173c385a93SMark Cave-Ayland     if (a.VsrD(0) < b.VsrD(0)) {
2118fcf5ef2aSThomas Huth         return -1;
21193c385a93SMark Cave-Ayland     } else if (a.VsrD(0) > b.VsrD(0)) {
2120fcf5ef2aSThomas Huth         return 1;
21213c385a93SMark Cave-Ayland     } else if (a.VsrD(1) < b.VsrD(1)) {
2122fcf5ef2aSThomas Huth         return -1;
21233c385a93SMark Cave-Ayland     } else if (a.VsrD(1) > b.VsrD(1)) {
2124fcf5ef2aSThomas Huth         return 1;
2125fcf5ef2aSThomas Huth     } else {
2126fcf5ef2aSThomas Huth         return 0;
2127fcf5ef2aSThomas Huth     }
2128fcf5ef2aSThomas Huth }
2129fcf5ef2aSThomas Huth 
2130fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b)
2131fcf5ef2aSThomas Huth {
21323c385a93SMark Cave-Ayland     t->VsrD(1) = a.VsrD(1) + b.VsrD(1);
21333c385a93SMark Cave-Ayland     t->VsrD(0) = a.VsrD(0) + b.VsrD(0) +
21343c385a93SMark Cave-Ayland                      (~a.VsrD(1) < b.VsrD(1));
2135fcf5ef2aSThomas Huth }
2136fcf5ef2aSThomas Huth 
2137fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b)
2138fcf5ef2aSThomas Huth {
2139fcf5ef2aSThomas Huth     ppc_avr_t not_a;
21403c385a93SMark Cave-Ayland     t->VsrD(1) = a.VsrD(1) + b.VsrD(1);
21413c385a93SMark Cave-Ayland     t->VsrD(0) = a.VsrD(0) + b.VsrD(0) +
21423c385a93SMark Cave-Ayland                      (~a.VsrD(1) < b.VsrD(1));
2143fcf5ef2aSThomas Huth     avr_qw_not(&not_a, a);
2144fcf5ef2aSThomas Huth     return avr_qw_cmpu(not_a, b) < 0;
2145fcf5ef2aSThomas Huth }
2146fcf5ef2aSThomas Huth 
2147fcf5ef2aSThomas Huth #endif
2148fcf5ef2aSThomas Huth 
2149fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2150fcf5ef2aSThomas Huth {
2151fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2152fcf5ef2aSThomas Huth     r->u128 = a->u128 + b->u128;
2153fcf5ef2aSThomas Huth #else
2154fcf5ef2aSThomas Huth     avr_qw_add(r, *a, *b);
2155fcf5ef2aSThomas Huth #endif
2156fcf5ef2aSThomas Huth }
2157fcf5ef2aSThomas Huth 
2158fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2159fcf5ef2aSThomas Huth {
2160fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2161fcf5ef2aSThomas Huth     r->u128 = a->u128 + b->u128 + (c->u128 & 1);
2162fcf5ef2aSThomas Huth #else
2163fcf5ef2aSThomas Huth 
21643c385a93SMark Cave-Ayland     if (c->VsrD(1) & 1) {
2165fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2166fcf5ef2aSThomas Huth 
21673c385a93SMark Cave-Ayland         tmp.VsrD(0) = 0;
21683c385a93SMark Cave-Ayland         tmp.VsrD(1) = c->VsrD(1) & 1;
2169fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
2170fcf5ef2aSThomas Huth         avr_qw_add(r, tmp, *b);
2171fcf5ef2aSThomas Huth     } else {
2172fcf5ef2aSThomas Huth         avr_qw_add(r, *a, *b);
2173fcf5ef2aSThomas Huth     }
2174fcf5ef2aSThomas Huth #endif
2175fcf5ef2aSThomas Huth }
2176fcf5ef2aSThomas Huth 
2177fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2178fcf5ef2aSThomas Huth {
2179fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2180fcf5ef2aSThomas Huth     r->u128 = (~a->u128 < b->u128);
2181fcf5ef2aSThomas Huth #else
2182fcf5ef2aSThomas Huth     ppc_avr_t not_a;
2183fcf5ef2aSThomas Huth 
2184fcf5ef2aSThomas Huth     avr_qw_not(&not_a, *a);
2185fcf5ef2aSThomas Huth 
21863c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
21873c385a93SMark Cave-Ayland     r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0);
2188fcf5ef2aSThomas Huth #endif
2189fcf5ef2aSThomas Huth }
2190fcf5ef2aSThomas Huth 
2191fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2192fcf5ef2aSThomas Huth {
2193fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2194fcf5ef2aSThomas Huth     int carry_out = (~a->u128 < b->u128);
2195fcf5ef2aSThomas Huth     if (!carry_out && (c->u128 & 1)) {
2196fcf5ef2aSThomas Huth         carry_out = ((a->u128 + b->u128 + 1) == 0) &&
2197fcf5ef2aSThomas Huth                     ((a->u128 != 0) || (b->u128 != 0));
2198fcf5ef2aSThomas Huth     }
2199fcf5ef2aSThomas Huth     r->u128 = carry_out;
2200fcf5ef2aSThomas Huth #else
2201fcf5ef2aSThomas Huth 
22023c385a93SMark Cave-Ayland     int carry_in = c->VsrD(1) & 1;
2203fcf5ef2aSThomas Huth     int carry_out = 0;
2204fcf5ef2aSThomas Huth     ppc_avr_t tmp;
2205fcf5ef2aSThomas Huth 
2206fcf5ef2aSThomas Huth     carry_out = avr_qw_addc(&tmp, *a, *b);
2207fcf5ef2aSThomas Huth 
2208fcf5ef2aSThomas Huth     if (!carry_out && carry_in) {
2209fcf5ef2aSThomas Huth         ppc_avr_t one = QW_ONE;
2210fcf5ef2aSThomas Huth         carry_out = avr_qw_addc(&tmp, tmp, one);
2211fcf5ef2aSThomas Huth     }
22123c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
22133c385a93SMark Cave-Ayland     r->VsrD(1) = carry_out;
2214fcf5ef2aSThomas Huth #endif
2215fcf5ef2aSThomas Huth }
2216fcf5ef2aSThomas Huth 
2217fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2218fcf5ef2aSThomas Huth {
2219fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2220fcf5ef2aSThomas Huth     r->u128 = a->u128 - b->u128;
2221fcf5ef2aSThomas Huth #else
2222fcf5ef2aSThomas Huth     ppc_avr_t tmp;
2223fcf5ef2aSThomas Huth     ppc_avr_t one = QW_ONE;
2224fcf5ef2aSThomas Huth 
2225fcf5ef2aSThomas Huth     avr_qw_not(&tmp, *b);
2226fcf5ef2aSThomas Huth     avr_qw_add(&tmp, *a, tmp);
2227fcf5ef2aSThomas Huth     avr_qw_add(r, tmp, one);
2228fcf5ef2aSThomas Huth #endif
2229fcf5ef2aSThomas Huth }
2230fcf5ef2aSThomas Huth 
2231fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2232fcf5ef2aSThomas Huth {
2233fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2234fcf5ef2aSThomas Huth     r->u128 = a->u128 + ~b->u128 + (c->u128 & 1);
2235fcf5ef2aSThomas Huth #else
2236fcf5ef2aSThomas Huth     ppc_avr_t tmp, sum;
2237fcf5ef2aSThomas Huth 
2238fcf5ef2aSThomas Huth     avr_qw_not(&tmp, *b);
2239fcf5ef2aSThomas Huth     avr_qw_add(&sum, *a, tmp);
2240fcf5ef2aSThomas Huth 
22413c385a93SMark Cave-Ayland     tmp.VsrD(0) = 0;
22423c385a93SMark Cave-Ayland     tmp.VsrD(1) = c->VsrD(1) & 1;
2243fcf5ef2aSThomas Huth     avr_qw_add(r, sum, tmp);
2244fcf5ef2aSThomas Huth #endif
2245fcf5ef2aSThomas Huth }
2246fcf5ef2aSThomas Huth 
2247fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
2248fcf5ef2aSThomas Huth {
2249fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2250fcf5ef2aSThomas Huth     r->u128 = (~a->u128 < ~b->u128) ||
2251fcf5ef2aSThomas Huth                  (a->u128 + ~b->u128 == (__uint128_t)-1);
2252fcf5ef2aSThomas Huth #else
2253fcf5ef2aSThomas Huth     int carry = (avr_qw_cmpu(*a, *b) > 0);
2254fcf5ef2aSThomas Huth     if (!carry) {
2255fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2256fcf5ef2aSThomas Huth         avr_qw_not(&tmp, *b);
2257fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
22583c385a93SMark Cave-Ayland         carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull));
2259fcf5ef2aSThomas Huth     }
22603c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
22613c385a93SMark Cave-Ayland     r->VsrD(1) = carry;
2262fcf5ef2aSThomas Huth #endif
2263fcf5ef2aSThomas Huth }
2264fcf5ef2aSThomas Huth 
2265fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
2266fcf5ef2aSThomas Huth {
2267fcf5ef2aSThomas Huth #ifdef CONFIG_INT128
2268fcf5ef2aSThomas Huth     r->u128 =
2269fcf5ef2aSThomas Huth         (~a->u128 < ~b->u128) ||
2270fcf5ef2aSThomas Huth         ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1));
2271fcf5ef2aSThomas Huth #else
22723c385a93SMark Cave-Ayland     int carry_in = c->VsrD(1) & 1;
2273fcf5ef2aSThomas Huth     int carry_out = (avr_qw_cmpu(*a, *b) > 0);
2274fcf5ef2aSThomas Huth     if (!carry_out && carry_in) {
2275fcf5ef2aSThomas Huth         ppc_avr_t tmp;
2276fcf5ef2aSThomas Huth         avr_qw_not(&tmp, *b);
2277fcf5ef2aSThomas Huth         avr_qw_add(&tmp, *a, tmp);
22783c385a93SMark Cave-Ayland         carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull));
2279fcf5ef2aSThomas Huth     }
2280fcf5ef2aSThomas Huth 
22813c385a93SMark Cave-Ayland     r->VsrD(0) = 0;
22823c385a93SMark Cave-Ayland     r->VsrD(1) = carry_out;
2283fcf5ef2aSThomas Huth #endif
2284fcf5ef2aSThomas Huth }
2285fcf5ef2aSThomas Huth 
/*
 * Sign codes found in nibble 0 of a packed-BCD value.  bcd_get_sgn()
 * accepts all of them; the helpers only ever write the PREF codes.
 */
#define BCD_PLUS_ALT_1  0xA
#define BCD_NEG_ALT     0xB
#define BCD_PLUS_PREF_1 0xC
#define BCD_NEG_PREF    0xD
#define BCD_PLUS_ALT_2  0xE
#define BCD_PLUS_PREF_2 0xF

/* Sign characters of the national format (bcdcfn/bcdctn). */
#define NATIONAL_PLUS   0x2B
#define NATIONAL_NEG    0x2D

/* VsrB() index of the byte holding BCD nibble n; two nibbles per byte. */
#define BCD_DIG_BYTE(n) (15 - ((n) / 2))
2296fcf5ef2aSThomas Huth 
2297fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd)
2298fcf5ef2aSThomas Huth {
2299428115c3SMark Cave-Ayland     switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) {
2300fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_1:
2301fcf5ef2aSThomas Huth     case BCD_PLUS_PREF_2:
2302fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_1:
2303fcf5ef2aSThomas Huth     case BCD_PLUS_ALT_2:
2304fcf5ef2aSThomas Huth     {
2305fcf5ef2aSThomas Huth         return 1;
2306fcf5ef2aSThomas Huth     }
2307fcf5ef2aSThomas Huth 
2308fcf5ef2aSThomas Huth     case BCD_NEG_PREF:
2309fcf5ef2aSThomas Huth     case BCD_NEG_ALT:
2310fcf5ef2aSThomas Huth     {
2311fcf5ef2aSThomas Huth         return -1;
2312fcf5ef2aSThomas Huth     }
2313fcf5ef2aSThomas Huth 
2314fcf5ef2aSThomas Huth     default:
2315fcf5ef2aSThomas Huth     {
2316fcf5ef2aSThomas Huth         return 0;
2317fcf5ef2aSThomas Huth     }
2318fcf5ef2aSThomas Huth     }
2319fcf5ef2aSThomas Huth }
2320fcf5ef2aSThomas Huth 
2321fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps)
2322fcf5ef2aSThomas Huth {
2323fcf5ef2aSThomas Huth     if (sgn >= 0) {
2324fcf5ef2aSThomas Huth         return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2;
2325fcf5ef2aSThomas Huth     } else {
2326fcf5ef2aSThomas Huth         return BCD_NEG_PREF;
2327fcf5ef2aSThomas Huth     }
2328fcf5ef2aSThomas Huth }
2329fcf5ef2aSThomas Huth 
2330fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid)
2331fcf5ef2aSThomas Huth {
2332fcf5ef2aSThomas Huth     uint8_t result;
2333fcf5ef2aSThomas Huth     if (n & 1) {
2334428115c3SMark Cave-Ayland         result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4;
2335fcf5ef2aSThomas Huth     } else {
2336428115c3SMark Cave-Ayland        result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF;
2337fcf5ef2aSThomas Huth     }
2338fcf5ef2aSThomas Huth 
2339fcf5ef2aSThomas Huth     if (unlikely(result > 9)) {
2340fcf5ef2aSThomas Huth         *invalid = true;
2341fcf5ef2aSThomas Huth     }
2342fcf5ef2aSThomas Huth     return result;
2343fcf5ef2aSThomas Huth }
2344fcf5ef2aSThomas Huth 
2345fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n)
2346fcf5ef2aSThomas Huth {
2347fcf5ef2aSThomas Huth     if (n & 1) {
2348428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F;
2349428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4);
2350fcf5ef2aSThomas Huth     } else {
2351428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0;
2352428115c3SMark Cave-Ayland         bcd->VsrB(BCD_DIG_BYTE(n)) |= digit;
2353fcf5ef2aSThomas Huth     }
2354fcf5ef2aSThomas Huth }
2355fcf5ef2aSThomas Huth 
2356071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd)
2357071663dfSJose Ricardo Ziviani {
2358071663dfSJose Ricardo Ziviani     int i;
2359071663dfSJose Ricardo Ziviani     int invalid = 0;
2360071663dfSJose Ricardo Ziviani 
2361071663dfSJose Ricardo Ziviani     if (bcd_get_sgn(bcd) == 0) {
2362071663dfSJose Ricardo Ziviani         return false;
2363071663dfSJose Ricardo Ziviani     }
2364071663dfSJose Ricardo Ziviani 
2365071663dfSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2366071663dfSJose Ricardo Ziviani         bcd_get_digit(bcd, i, &invalid);
2367071663dfSJose Ricardo Ziviani         if (unlikely(invalid)) {
2368071663dfSJose Ricardo Ziviani             return false;
2369071663dfSJose Ricardo Ziviani         }
2370071663dfSJose Ricardo Ziviani     }
2371071663dfSJose Ricardo Ziviani     return true;
2372071663dfSJose Ricardo Ziviani }
2373071663dfSJose Ricardo Ziviani 
2374fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd)
2375fcf5ef2aSThomas Huth {
23763c385a93SMark Cave-Ayland     if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) {
2377efa73196SNikunj A Dadhania         return CRF_EQ;
2378fcf5ef2aSThomas Huth     } else {
2379efa73196SNikunj A Dadhania         return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT;
2380fcf5ef2aSThomas Huth     }
2381fcf5ef2aSThomas Huth }
2382fcf5ef2aSThomas Huth 
2383fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n)
2384fcf5ef2aSThomas Huth {
238560594feaSMark Cave-Ayland     return reg->VsrH(7 - n);
2386fcf5ef2aSThomas Huth }
2387fcf5ef2aSThomas Huth 
2388fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n)
2389fcf5ef2aSThomas Huth {
239060594feaSMark Cave-Ayland     reg->VsrH(7 - n) = val;
2391fcf5ef2aSThomas Huth }
2392fcf5ef2aSThomas Huth 
2393fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b)
2394fcf5ef2aSThomas Huth {
2395fcf5ef2aSThomas Huth     int i;
2396fcf5ef2aSThomas Huth     int invalid = 0;
2397fcf5ef2aSThomas Huth     for (i = 31; i > 0; i--) {
2398fcf5ef2aSThomas Huth         uint8_t dig_a = bcd_get_digit(a, i, &invalid);
2399fcf5ef2aSThomas Huth         uint8_t dig_b = bcd_get_digit(b, i, &invalid);
2400fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2401fcf5ef2aSThomas Huth             return 0; /* doesn't matter */
2402fcf5ef2aSThomas Huth         } else if (dig_a > dig_b) {
2403fcf5ef2aSThomas Huth             return 1;
2404fcf5ef2aSThomas Huth         } else if (dig_a < dig_b) {
2405fcf5ef2aSThomas Huth             return -1;
2406fcf5ef2aSThomas Huth         }
2407fcf5ef2aSThomas Huth     }
2408fcf5ef2aSThomas Huth 
2409fcf5ef2aSThomas Huth     return 0;
2410fcf5ef2aSThomas Huth }
2411fcf5ef2aSThomas Huth 
2412936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2413fcf5ef2aSThomas Huth                        int *overflow)
2414fcf5ef2aSThomas Huth {
2415fcf5ef2aSThomas Huth     int carry = 0;
2416fcf5ef2aSThomas Huth     int i;
2417936fda4dSFabiano Rosas     int is_zero = 1;
2418936fda4dSFabiano Rosas 
2419fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2420fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) +
2421fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2422936fda4dSFabiano Rosas         is_zero &= (digit == 0);
2423fcf5ef2aSThomas Huth         if (digit > 9) {
2424fcf5ef2aSThomas Huth             carry = 1;
2425fcf5ef2aSThomas Huth             digit -= 10;
2426fcf5ef2aSThomas Huth         } else {
2427fcf5ef2aSThomas Huth             carry = 0;
2428fcf5ef2aSThomas Huth         }
2429fcf5ef2aSThomas Huth 
2430fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2431fcf5ef2aSThomas Huth     }
2432fcf5ef2aSThomas Huth 
2433fcf5ef2aSThomas Huth     *overflow = carry;
2434936fda4dSFabiano Rosas     return is_zero;
2435fcf5ef2aSThomas Huth }
2436fcf5ef2aSThomas Huth 
2437d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid,
2438fcf5ef2aSThomas Huth                        int *overflow)
2439fcf5ef2aSThomas Huth {
2440fcf5ef2aSThomas Huth     int carry = 0;
2441fcf5ef2aSThomas Huth     int i;
2442d03b174aSYasmin Beatriz 
2443fcf5ef2aSThomas Huth     for (i = 1; i <= 31; i++) {
2444fcf5ef2aSThomas Huth         uint8_t digit = bcd_get_digit(a, i, invalid) -
2445fcf5ef2aSThomas Huth                         bcd_get_digit(b, i, invalid) + carry;
2446fcf5ef2aSThomas Huth         if (digit & 0x80) {
2447fcf5ef2aSThomas Huth             carry = -1;
2448fcf5ef2aSThomas Huth             digit += 10;
2449fcf5ef2aSThomas Huth         } else {
2450fcf5ef2aSThomas Huth             carry = 0;
2451fcf5ef2aSThomas Huth         }
2452fcf5ef2aSThomas Huth 
2453fcf5ef2aSThomas Huth         bcd_put_digit(t, digit, i);
2454fcf5ef2aSThomas Huth     }
2455fcf5ef2aSThomas Huth 
2456fcf5ef2aSThomas Huth     *overflow = carry;
2457fcf5ef2aSThomas Huth }
2458fcf5ef2aSThomas Huth 
2459fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2460fcf5ef2aSThomas Huth {
2461fcf5ef2aSThomas Huth 
2462fcf5ef2aSThomas Huth     int sgna = bcd_get_sgn(a);
2463fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2464fcf5ef2aSThomas Huth     int invalid = (sgna == 0) || (sgnb == 0);
2465fcf5ef2aSThomas Huth     int overflow = 0;
2466936fda4dSFabiano Rosas     int zero = 0;
2467fcf5ef2aSThomas Huth     uint32_t cr = 0;
2468fcf5ef2aSThomas Huth     ppc_avr_t result = { .u64 = { 0, 0 } };
2469fcf5ef2aSThomas Huth 
2470fcf5ef2aSThomas Huth     if (!invalid) {
2471fcf5ef2aSThomas Huth         if (sgna == sgnb) {
2472428115c3SMark Cave-Ayland             result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2473936fda4dSFabiano Rosas             zero = bcd_add_mag(&result, a, b, &invalid, &overflow);
2474936fda4dSFabiano Rosas             cr = (sgna > 0) ? CRF_GT : CRF_LT;
2475fcf5ef2aSThomas Huth         } else {
2476d03b174aSYasmin Beatriz             int magnitude = bcd_cmp_mag(a, b);
2477d03b174aSYasmin Beatriz             if (magnitude > 0) {
2478428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps);
2479d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, a, b, &invalid, &overflow);
2480d03b174aSYasmin Beatriz                 cr = (sgna > 0) ? CRF_GT : CRF_LT;
2481d03b174aSYasmin Beatriz             } else if (magnitude < 0) {
2482428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps);
2483d03b174aSYasmin Beatriz                 bcd_sub_mag(&result, b, a, &invalid, &overflow);
2484efa73196SNikunj A Dadhania                 cr = (sgnb > 0) ? CRF_GT : CRF_LT;
2485d03b174aSYasmin Beatriz             } else {
2486428115c3SMark Cave-Ayland                 result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps);
2487d03b174aSYasmin Beatriz                 cr = CRF_EQ;
2488d03b174aSYasmin Beatriz             }
2489fcf5ef2aSThomas Huth         }
2490fcf5ef2aSThomas Huth     }
2491fcf5ef2aSThomas Huth 
2492fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
24933c385a93SMark Cave-Ayland         result.VsrD(0) = result.VsrD(1) = -1;
2494efa73196SNikunj A Dadhania         cr = CRF_SO;
2495fcf5ef2aSThomas Huth     } else if (overflow) {
2496efa73196SNikunj A Dadhania         cr |= CRF_SO;
2497936fda4dSFabiano Rosas     } else if (zero) {
2498936fda4dSFabiano Rosas         cr |= CRF_EQ;
2499fcf5ef2aSThomas Huth     }
2500fcf5ef2aSThomas Huth 
2501fcf5ef2aSThomas Huth     *r = result;
2502fcf5ef2aSThomas Huth 
2503fcf5ef2aSThomas Huth     return cr;
2504fcf5ef2aSThomas Huth }
2505fcf5ef2aSThomas Huth 
2506fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2507fcf5ef2aSThomas Huth {
2508fcf5ef2aSThomas Huth     ppc_avr_t bcopy = *b;
2509fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2510fcf5ef2aSThomas Huth     if (sgnb < 0) {
2511fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0);
2512fcf5ef2aSThomas Huth     } else if (sgnb > 0) {
2513fcf5ef2aSThomas Huth         bcd_put_digit(&bcopy, BCD_NEG_PREF, 0);
2514fcf5ef2aSThomas Huth     }
2515fcf5ef2aSThomas Huth     /* else invalid ... defer to bcdadd code for proper handling */
2516fcf5ef2aSThomas Huth 
2517fcf5ef2aSThomas Huth     return helper_bcdadd(r, a, &bcopy, ps);
2518fcf5ef2aSThomas Huth }
2519fcf5ef2aSThomas Huth 
2520fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2521fcf5ef2aSThomas Huth {
2522fcf5ef2aSThomas Huth     int i;
2523fcf5ef2aSThomas Huth     int cr = 0;
2524fcf5ef2aSThomas Huth     uint16_t national = 0;
2525fcf5ef2aSThomas Huth     uint16_t sgnb = get_national_digit(b, 0);
2526fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2527fcf5ef2aSThomas Huth     int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG);
2528fcf5ef2aSThomas Huth 
2529fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2530fcf5ef2aSThomas Huth         national = get_national_digit(b, i);
2531fcf5ef2aSThomas Huth         if (unlikely(national < 0x30 || national > 0x39)) {
2532fcf5ef2aSThomas Huth             invalid = 1;
2533fcf5ef2aSThomas Huth             break;
2534fcf5ef2aSThomas Huth         }
2535fcf5ef2aSThomas Huth 
2536fcf5ef2aSThomas Huth         bcd_put_digit(&ret, national & 0xf, i);
2537fcf5ef2aSThomas Huth     }
2538fcf5ef2aSThomas Huth 
2539fcf5ef2aSThomas Huth     if (sgnb == NATIONAL_PLUS) {
2540fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0);
2541fcf5ef2aSThomas Huth     } else {
2542fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2543fcf5ef2aSThomas Huth     }
2544fcf5ef2aSThomas Huth 
2545fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2546fcf5ef2aSThomas Huth 
2547fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2548efa73196SNikunj A Dadhania         cr = CRF_SO;
2549fcf5ef2aSThomas Huth     }
2550fcf5ef2aSThomas Huth 
2551fcf5ef2aSThomas Huth     *r = ret;
2552fcf5ef2aSThomas Huth 
2553fcf5ef2aSThomas Huth     return cr;
2554fcf5ef2aSThomas Huth }
2555fcf5ef2aSThomas Huth 
2556fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2557fcf5ef2aSThomas Huth {
2558fcf5ef2aSThomas Huth     int i;
2559fcf5ef2aSThomas Huth     int cr = 0;
2560fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2561fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2562fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2563fcf5ef2aSThomas Huth 
25643c385a93SMark Cave-Ayland     int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0);
2565fcf5ef2aSThomas Huth 
2566fcf5ef2aSThomas Huth     for (i = 1; i < 8; i++) {
2567fcf5ef2aSThomas Huth         set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i);
2568fcf5ef2aSThomas Huth 
2569fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2570fcf5ef2aSThomas Huth             break;
2571fcf5ef2aSThomas Huth         }
2572fcf5ef2aSThomas Huth     }
2573fcf5ef2aSThomas Huth     set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0);
2574fcf5ef2aSThomas Huth 
2575fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2576fcf5ef2aSThomas Huth 
2577fcf5ef2aSThomas Huth     if (ox_flag) {
2578efa73196SNikunj A Dadhania         cr |= CRF_SO;
2579fcf5ef2aSThomas Huth     }
2580fcf5ef2aSThomas Huth 
2581fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2582efa73196SNikunj A Dadhania         cr = CRF_SO;
2583fcf5ef2aSThomas Huth     }
2584fcf5ef2aSThomas Huth 
2585fcf5ef2aSThomas Huth     *r = ret;
2586fcf5ef2aSThomas Huth 
2587fcf5ef2aSThomas Huth     return cr;
2588fcf5ef2aSThomas Huth }
2589fcf5ef2aSThomas Huth 
2590fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2591fcf5ef2aSThomas Huth {
2592fcf5ef2aSThomas Huth     int i;
2593fcf5ef2aSThomas Huth     int cr = 0;
2594fcf5ef2aSThomas Huth     int invalid = 0;
2595fcf5ef2aSThomas Huth     int zone_digit = 0;
2596fcf5ef2aSThomas Huth     int zone_lead = ps ? 0xF : 0x3;
2597fcf5ef2aSThomas Huth     int digit = 0;
2598fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2599428115c3SMark Cave-Ayland     int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4;
2600fcf5ef2aSThomas Huth 
2601fcf5ef2aSThomas Huth     if (unlikely((sgnb < 0xA) && ps)) {
2602fcf5ef2aSThomas Huth         invalid = 1;
2603fcf5ef2aSThomas Huth     }
2604fcf5ef2aSThomas Huth 
2605fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2606428115c3SMark Cave-Ayland         zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead;
2607428115c3SMark Cave-Ayland         digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF;
2608fcf5ef2aSThomas Huth         if (unlikely(zone_digit != zone_lead || digit > 0x9)) {
2609fcf5ef2aSThomas Huth             invalid = 1;
2610fcf5ef2aSThomas Huth             break;
2611fcf5ef2aSThomas Huth         }
2612fcf5ef2aSThomas Huth 
2613fcf5ef2aSThomas Huth         bcd_put_digit(&ret, digit, i + 1);
2614fcf5ef2aSThomas Huth     }
2615fcf5ef2aSThomas Huth 
2616fcf5ef2aSThomas Huth     if ((ps && (sgnb == 0xB || sgnb == 0xD)) ||
2617fcf5ef2aSThomas Huth             (!ps && (sgnb & 0x4))) {
2618fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_NEG_PREF, 0);
2619fcf5ef2aSThomas Huth     } else {
2620fcf5ef2aSThomas Huth         bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0);
2621fcf5ef2aSThomas Huth     }
2622fcf5ef2aSThomas Huth 
2623fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(&ret);
2624fcf5ef2aSThomas Huth 
2625fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2626efa73196SNikunj A Dadhania         cr = CRF_SO;
2627fcf5ef2aSThomas Huth     }
2628fcf5ef2aSThomas Huth 
2629fcf5ef2aSThomas Huth     *r = ret;
2630fcf5ef2aSThomas Huth 
2631fcf5ef2aSThomas Huth     return cr;
2632fcf5ef2aSThomas Huth }
2633fcf5ef2aSThomas Huth 
2634fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2635fcf5ef2aSThomas Huth {
2636fcf5ef2aSThomas Huth     int i;
2637fcf5ef2aSThomas Huth     int cr = 0;
2638fcf5ef2aSThomas Huth     uint8_t digit = 0;
2639fcf5ef2aSThomas Huth     int sgnb = bcd_get_sgn(b);
2640fcf5ef2aSThomas Huth     int zone_lead = (ps) ? 0xF0 : 0x30;
2641fcf5ef2aSThomas Huth     int invalid = (sgnb == 0);
2642fcf5ef2aSThomas Huth     ppc_avr_t ret = { .u64 = { 0, 0 } };
2643fcf5ef2aSThomas Huth 
26443c385a93SMark Cave-Ayland     int ox_flag = ((b->VsrD(0) >> 4) != 0);
2645fcf5ef2aSThomas Huth 
2646fcf5ef2aSThomas Huth     for (i = 0; i < 16; i++) {
2647fcf5ef2aSThomas Huth         digit = bcd_get_digit(b, i + 1, &invalid);
2648fcf5ef2aSThomas Huth 
2649fcf5ef2aSThomas Huth         if (unlikely(invalid)) {
2650fcf5ef2aSThomas Huth             break;
2651fcf5ef2aSThomas Huth         }
2652fcf5ef2aSThomas Huth 
2653428115c3SMark Cave-Ayland         ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit;
2654fcf5ef2aSThomas Huth     }
2655fcf5ef2aSThomas Huth 
2656fcf5ef2aSThomas Huth     if (ps) {
2657fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1);
2658fcf5ef2aSThomas Huth     } else {
2659fcf5ef2aSThomas Huth         bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1);
2660fcf5ef2aSThomas Huth     }
2661fcf5ef2aSThomas Huth 
2662fcf5ef2aSThomas Huth     cr = bcd_cmp_zero(b);
2663fcf5ef2aSThomas Huth 
2664fcf5ef2aSThomas Huth     if (ox_flag) {
2665efa73196SNikunj A Dadhania         cr |= CRF_SO;
2666fcf5ef2aSThomas Huth     }
2667fcf5ef2aSThomas Huth 
2668fcf5ef2aSThomas Huth     if (unlikely(invalid)) {
2669efa73196SNikunj A Dadhania         cr = CRF_SO;
2670fcf5ef2aSThomas Huth     }
2671fcf5ef2aSThomas Huth 
2672fcf5ef2aSThomas Huth     *r = ret;
2673fcf5ef2aSThomas Huth 
2674fcf5ef2aSThomas Huth     return cr;
2675fcf5ef2aSThomas Huth }
2676fcf5ef2aSThomas Huth 
/**
 * Three-way comparison of two unsigned 128-bit integers, each supplied as
 * a (low, high) pair of unsigned 64-bit halves.
 *
 * Returns:
 *  1 if ahi|alo >  bhi|blo,
 *  0 if ahi|alo == bhi|blo,
 * -1 if ahi|alo <  bhi|blo
 */
static inline int ucmp128(uint64_t alo, uint64_t ahi,
                          uint64_t blo, uint64_t bhi)
{
    /* The high halves decide unless they are equal. */
    if (ahi != bhi) {
        return (ahi > bhi) ? 1 : -1;
    }
    if (alo != blo) {
        return (alo > blo) ? 1 : -1;
    }
    return 0;
}
2692a3d67f3eSLuis Pires 
2693a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2694a406c058SJose Ricardo Ziviani {
2695a406c058SJose Ricardo Ziviani     int i;
2696a3d67f3eSLuis Pires     int cr;
2697a406c058SJose Ricardo Ziviani     uint64_t lo_value;
2698a406c058SJose Ricardo Ziviani     uint64_t hi_value;
269940f3e79aSLuis Pires     uint64_t rem;
2700a406c058SJose Ricardo Ziviani     ppc_avr_t ret = { .u64 = { 0, 0 } };
2701a406c058SJose Ricardo Ziviani 
27023c385a93SMark Cave-Ayland     if (b->VsrSD(0) < 0) {
27033c385a93SMark Cave-Ayland         lo_value = -b->VsrSD(1);
27043c385a93SMark Cave-Ayland         hi_value = ~b->VsrD(0) + !lo_value;
2705a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, 0xD, 0);
2706a3d67f3eSLuis Pires 
2707a3d67f3eSLuis Pires         cr = CRF_LT;
2708a406c058SJose Ricardo Ziviani     } else {
27093c385a93SMark Cave-Ayland         lo_value = b->VsrD(1);
27103c385a93SMark Cave-Ayland         hi_value = b->VsrD(0);
2711a406c058SJose Ricardo Ziviani         bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0);
2712a3d67f3eSLuis Pires 
2713a3d67f3eSLuis Pires         if (hi_value == 0 && lo_value == 0) {
2714a3d67f3eSLuis Pires             cr = CRF_EQ;
2715a3d67f3eSLuis Pires         } else {
2716a3d67f3eSLuis Pires             cr = CRF_GT;
2717a3d67f3eSLuis Pires         }
2718a406c058SJose Ricardo Ziviani     }
2719a406c058SJose Ricardo Ziviani 
2720a3d67f3eSLuis Pires     /*
2721a3d67f3eSLuis Pires      * Check src limits: abs(src) <= 10^31 - 1
2722a3d67f3eSLuis Pires      *
2723a3d67f3eSLuis Pires      * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff
2724a3d67f3eSLuis Pires      */
2725a3d67f3eSLuis Pires     if (ucmp128(lo_value, hi_value,
2726a3d67f3eSLuis Pires                 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) {
2727a3d67f3eSLuis Pires         cr |= CRF_SO;
2728a3d67f3eSLuis Pires 
2729a3d67f3eSLuis Pires         /*
2730a3d67f3eSLuis Pires          * According to the ISA, if src wouldn't fit in the destination
2731a3d67f3eSLuis Pires          * register, the result is undefined.
2732a3d67f3eSLuis Pires          * In that case, we leave r unchanged.
2733a3d67f3eSLuis Pires          */
2734a3d67f3eSLuis Pires     } else {
273540f3e79aSLuis Pires         rem = divu128(&lo_value, &hi_value, 1000000000000000ULL);
2736a406c058SJose Ricardo Ziviani 
273740f3e79aSLuis Pires         for (i = 1; i < 16; rem /= 10, i++) {
273840f3e79aSLuis Pires             bcd_put_digit(&ret, rem % 10, i);
2739a406c058SJose Ricardo Ziviani         }
2740a406c058SJose Ricardo Ziviani 
2741a406c058SJose Ricardo Ziviani         for (; i < 32; lo_value /= 10, i++) {
2742a406c058SJose Ricardo Ziviani             bcd_put_digit(&ret, lo_value % 10, i);
2743a406c058SJose Ricardo Ziviani         }
2744a406c058SJose Ricardo Ziviani 
2745a406c058SJose Ricardo Ziviani         *r = ret;
2746a3d67f3eSLuis Pires     }
2747a406c058SJose Ricardo Ziviani 
2748a406c058SJose Ricardo Ziviani     return cr;
2749a406c058SJose Ricardo Ziviani }
2750a406c058SJose Ricardo Ziviani 
2751c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2752c85bc7ddSJose Ricardo Ziviani {
2753c85bc7ddSJose Ricardo Ziviani     uint8_t i;
2754c85bc7ddSJose Ricardo Ziviani     int cr;
2755c85bc7ddSJose Ricardo Ziviani     uint64_t carry;
2756c85bc7ddSJose Ricardo Ziviani     uint64_t unused;
2757c85bc7ddSJose Ricardo Ziviani     uint64_t lo_value;
2758c85bc7ddSJose Ricardo Ziviani     uint64_t hi_value = 0;
2759c85bc7ddSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2760c85bc7ddSJose Ricardo Ziviani     int invalid = (sgnb == 0);
2761c85bc7ddSJose Ricardo Ziviani 
2762c85bc7ddSJose Ricardo Ziviani     lo_value = bcd_get_digit(b, 31, &invalid);
2763c85bc7ddSJose Ricardo Ziviani     for (i = 30; i > 0; i--) {
2764c85bc7ddSJose Ricardo Ziviani         mulu64(&lo_value, &carry, lo_value, 10ULL);
2765c85bc7ddSJose Ricardo Ziviani         mulu64(&hi_value, &unused, hi_value, 10ULL);
2766c85bc7ddSJose Ricardo Ziviani         lo_value += bcd_get_digit(b, i, &invalid);
2767c85bc7ddSJose Ricardo Ziviani         hi_value += carry;
2768c85bc7ddSJose Ricardo Ziviani 
2769c85bc7ddSJose Ricardo Ziviani         if (unlikely(invalid)) {
2770c85bc7ddSJose Ricardo Ziviani             break;
2771c85bc7ddSJose Ricardo Ziviani         }
2772c85bc7ddSJose Ricardo Ziviani     }
2773c85bc7ddSJose Ricardo Ziviani 
2774c85bc7ddSJose Ricardo Ziviani     if (sgnb == -1) {
27753c385a93SMark Cave-Ayland         r->VsrSD(1) = -lo_value;
27763c385a93SMark Cave-Ayland         r->VsrSD(0) = ~hi_value + !r->VsrSD(1);
2777c85bc7ddSJose Ricardo Ziviani     } else {
27783c385a93SMark Cave-Ayland         r->VsrSD(1) = lo_value;
27793c385a93SMark Cave-Ayland         r->VsrSD(0) = hi_value;
2780c85bc7ddSJose Ricardo Ziviani     }
2781c85bc7ddSJose Ricardo Ziviani 
2782c85bc7ddSJose Ricardo Ziviani     cr = bcd_cmp_zero(b);
2783c85bc7ddSJose Ricardo Ziviani 
2784c85bc7ddSJose Ricardo Ziviani     if (unlikely(invalid)) {
2785c85bc7ddSJose Ricardo Ziviani         cr = CRF_SO;
2786c85bc7ddSJose Ricardo Ziviani     }
2787c85bc7ddSJose Ricardo Ziviani 
2788c85bc7ddSJose Ricardo Ziviani     return cr;
2789c85bc7ddSJose Ricardo Ziviani }
2790c85bc7ddSJose Ricardo Ziviani 
2791c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2792c3025c3bSJose Ricardo Ziviani {
2793c3025c3bSJose Ricardo Ziviani     int i;
2794c3025c3bSJose Ricardo Ziviani     int invalid = 0;
2795c3025c3bSJose Ricardo Ziviani 
2796c3025c3bSJose Ricardo Ziviani     if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) {
2797c3025c3bSJose Ricardo Ziviani         return CRF_SO;
2798c3025c3bSJose Ricardo Ziviani     }
2799c3025c3bSJose Ricardo Ziviani 
2800c3025c3bSJose Ricardo Ziviani     *r = *a;
2801428115c3SMark Cave-Ayland     bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0);
2802c3025c3bSJose Ricardo Ziviani 
2803c3025c3bSJose Ricardo Ziviani     for (i = 1; i < 32; i++) {
2804c3025c3bSJose Ricardo Ziviani         bcd_get_digit(a, i, &invalid);
2805c3025c3bSJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2806c3025c3bSJose Ricardo Ziviani         if (unlikely(invalid)) {
2807c3025c3bSJose Ricardo Ziviani             return CRF_SO;
2808c3025c3bSJose Ricardo Ziviani         }
2809c3025c3bSJose Ricardo Ziviani     }
2810c3025c3bSJose Ricardo Ziviani 
2811c3025c3bSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2812c3025c3bSJose Ricardo Ziviani }
2813c3025c3bSJose Ricardo Ziviani 
2814466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps)
2815466a3f9cSJose Ricardo Ziviani {
2816466a3f9cSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2817466a3f9cSJose Ricardo Ziviani 
2818466a3f9cSJose Ricardo Ziviani     *r = *b;
2819466a3f9cSJose Ricardo Ziviani     bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0);
2820466a3f9cSJose Ricardo Ziviani 
2821071663dfSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2822466a3f9cSJose Ricardo Ziviani         return CRF_SO;
2823466a3f9cSJose Ricardo Ziviani     }
2824466a3f9cSJose Ricardo Ziviani 
2825466a3f9cSJose Ricardo Ziviani     return bcd_cmp_zero(r);
2826466a3f9cSJose Ricardo Ziviani }
2827466a3f9cSJose Ricardo Ziviani 
2828e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2829e04797f7SJose Ricardo Ziviani {
2830e04797f7SJose Ricardo Ziviani     int cr;
2831428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2832e04797f7SJose Ricardo Ziviani     bool ox_flag = false;
2833e04797f7SJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2834e04797f7SJose Ricardo Ziviani     ppc_avr_t ret = *b;
28353c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2836e04797f7SJose Ricardo Ziviani 
2837e04797f7SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2838e04797f7SJose Ricardo Ziviani         return CRF_SO;
2839e04797f7SJose Ricardo Ziviani     }
2840e04797f7SJose Ricardo Ziviani 
2841e04797f7SJose Ricardo Ziviani     if (unlikely(i > 31)) {
2842e04797f7SJose Ricardo Ziviani         i = 31;
2843e04797f7SJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2844e04797f7SJose Ricardo Ziviani         i = -31;
2845e04797f7SJose Ricardo Ziviani     }
2846e04797f7SJose Ricardo Ziviani 
2847e04797f7SJose Ricardo Ziviani     if (i > 0) {
28483c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2849e04797f7SJose Ricardo Ziviani     } else {
28503c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2851e04797f7SJose Ricardo Ziviani     }
2852e04797f7SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2853e04797f7SJose Ricardo Ziviani 
2854e04797f7SJose Ricardo Ziviani     *r = ret;
2855e04797f7SJose Ricardo Ziviani 
2856e04797f7SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2857e04797f7SJose Ricardo Ziviani     if (ox_flag) {
2858e04797f7SJose Ricardo Ziviani         cr |= CRF_SO;
2859e04797f7SJose Ricardo Ziviani     }
2860e04797f7SJose Ricardo Ziviani 
2861e04797f7SJose Ricardo Ziviani     return cr;
2862e04797f7SJose Ricardo Ziviani }
2863e04797f7SJose Ricardo Ziviani 
2864a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2865a49a95e9SJose Ricardo Ziviani {
2866a49a95e9SJose Ricardo Ziviani     int cr;
2867a49a95e9SJose Ricardo Ziviani     int i;
2868a49a95e9SJose Ricardo Ziviani     int invalid = 0;
2869a49a95e9SJose Ricardo Ziviani     bool ox_flag = false;
2870a49a95e9SJose Ricardo Ziviani     ppc_avr_t ret = *b;
2871a49a95e9SJose Ricardo Ziviani 
2872a49a95e9SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
2873a49a95e9SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
2874a49a95e9SJose Ricardo Ziviani 
2875a49a95e9SJose Ricardo Ziviani         if (unlikely(invalid)) {
2876a49a95e9SJose Ricardo Ziviani             return CRF_SO;
2877a49a95e9SJose Ricardo Ziviani         }
2878a49a95e9SJose Ricardo Ziviani     }
2879a49a95e9SJose Ricardo Ziviani 
2880428115c3SMark Cave-Ayland     i = a->VsrSB(7);
2881a49a95e9SJose Ricardo Ziviani     if (i >= 32) {
2882a49a95e9SJose Ricardo Ziviani         ox_flag = true;
28833c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2884a49a95e9SJose Ricardo Ziviani     } else if (i <= -32) {
28853c385a93SMark Cave-Ayland         ret.VsrD(1) = ret.VsrD(0) = 0;
2886a49a95e9SJose Ricardo Ziviani     } else if (i > 0) {
28873c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2888a49a95e9SJose Ricardo Ziviani     } else {
28893c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2890a49a95e9SJose Ricardo Ziviani     }
2891a49a95e9SJose Ricardo Ziviani     *r = ret;
2892a49a95e9SJose Ricardo Ziviani 
2893a49a95e9SJose Ricardo Ziviani     cr = bcd_cmp_zero(r);
2894a49a95e9SJose Ricardo Ziviani     if (ox_flag) {
2895a49a95e9SJose Ricardo Ziviani         cr |= CRF_SO;
2896a49a95e9SJose Ricardo Ziviani     }
2897a49a95e9SJose Ricardo Ziviani 
2898a49a95e9SJose Ricardo Ziviani     return cr;
2899a49a95e9SJose Ricardo Ziviani }
2900a49a95e9SJose Ricardo Ziviani 
2901a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
2902a54238adSJose Ricardo Ziviani {
2903a54238adSJose Ricardo Ziviani     int cr;
2904a54238adSJose Ricardo Ziviani     int unused = 0;
2905a54238adSJose Ricardo Ziviani     int invalid = 0;
2906a54238adSJose Ricardo Ziviani     bool ox_flag = false;
2907a54238adSJose Ricardo Ziviani     int sgnb = bcd_get_sgn(b);
2908a54238adSJose Ricardo Ziviani     ppc_avr_t ret = *b;
29093c385a93SMark Cave-Ayland     ret.VsrD(1) &= ~0xf;
2910a54238adSJose Ricardo Ziviani 
2911428115c3SMark Cave-Ayland     int i = a->VsrSB(7);
2912428115c3SMark Cave-Ayland     ppc_avr_t bcd_one;
2913428115c3SMark Cave-Ayland 
2914428115c3SMark Cave-Ayland     bcd_one.VsrD(0) = 0;
2915428115c3SMark Cave-Ayland     bcd_one.VsrD(1) = 0x10;
2916a54238adSJose Ricardo Ziviani 
2917a54238adSJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
2918a54238adSJose Ricardo Ziviani         return CRF_SO;
2919a54238adSJose Ricardo Ziviani     }
2920a54238adSJose Ricardo Ziviani 
2921a54238adSJose Ricardo Ziviani     if (unlikely(i > 31)) {
2922a54238adSJose Ricardo Ziviani         i = 31;
2923a54238adSJose Ricardo Ziviani     } else if (unlikely(i < -31)) {
2924a54238adSJose Ricardo Ziviani         i = -31;
2925a54238adSJose Ricardo Ziviani     }
2926a54238adSJose Ricardo Ziviani 
2927a54238adSJose Ricardo Ziviani     if (i > 0) {
29283c385a93SMark Cave-Ayland         ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag);
2929a54238adSJose Ricardo Ziviani     } else {
29303c385a93SMark Cave-Ayland         urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4);
2931a54238adSJose Ricardo Ziviani 
2932a54238adSJose Ricardo Ziviani         if (bcd_get_digit(&ret, 0, &invalid) >= 5) {
2933a54238adSJose Ricardo Ziviani             bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused);
2934a54238adSJose Ricardo Ziviani         }
2935a54238adSJose Ricardo Ziviani     }
2936a54238adSJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0);
2937a54238adSJose Ricardo Ziviani 
2938a54238adSJose Ricardo Ziviani     cr = bcd_cmp_zero(&ret);
2939a54238adSJose Ricardo Ziviani     if (ox_flag) {
2940a54238adSJose Ricardo Ziviani         cr |= CRF_SO;
2941a54238adSJose Ricardo Ziviani     }
2942a54238adSJose Ricardo Ziviani     *r = ret;
2943a54238adSJose Ricardo Ziviani 
2944a54238adSJose Ricardo Ziviani     return cr;
2945a54238adSJose Ricardo Ziviani }
2946a54238adSJose Ricardo Ziviani 
294731bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
294831bc4d11SJose Ricardo Ziviani {
294931bc4d11SJose Ricardo Ziviani     uint64_t mask;
295031bc4d11SJose Ricardo Ziviani     uint32_t ox_flag = 0;
2951428115c3SMark Cave-Ayland     int i = a->VsrSH(3) + 1;
295231bc4d11SJose Ricardo Ziviani     ppc_avr_t ret = *b;
295331bc4d11SJose Ricardo Ziviani 
295431bc4d11SJose Ricardo Ziviani     if (bcd_is_valid(b) == false) {
295531bc4d11SJose Ricardo Ziviani         return CRF_SO;
295631bc4d11SJose Ricardo Ziviani     }
295731bc4d11SJose Ricardo Ziviani 
295831bc4d11SJose Ricardo Ziviani     if (i > 16 && i < 32) {
295931bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
29603c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
296131bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
296231bc4d11SJose Ricardo Ziviani         }
296331bc4d11SJose Ricardo Ziviani 
29643c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
296531bc4d11SJose Ricardo Ziviani     } else if (i >= 0 && i <= 16) {
296631bc4d11SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
29673c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
296831bc4d11SJose Ricardo Ziviani             ox_flag = CRF_SO;
296931bc4d11SJose Ricardo Ziviani         }
297031bc4d11SJose Ricardo Ziviani 
29713c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
29723c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
297331bc4d11SJose Ricardo Ziviani     }
297431bc4d11SJose Ricardo Ziviani     bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0);
297531bc4d11SJose Ricardo Ziviani     *r = ret;
297631bc4d11SJose Ricardo Ziviani 
297731bc4d11SJose Ricardo Ziviani     return bcd_cmp_zero(&ret) | ox_flag;
297831bc4d11SJose Ricardo Ziviani }
297931bc4d11SJose Ricardo Ziviani 
29805c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
29815c32e2e4SJose Ricardo Ziviani {
29825c32e2e4SJose Ricardo Ziviani     int i;
29835c32e2e4SJose Ricardo Ziviani     uint64_t mask;
29845c32e2e4SJose Ricardo Ziviani     uint32_t ox_flag = 0;
29855c32e2e4SJose Ricardo Ziviani     int invalid = 0;
29865c32e2e4SJose Ricardo Ziviani     ppc_avr_t ret = *b;
29875c32e2e4SJose Ricardo Ziviani 
29885c32e2e4SJose Ricardo Ziviani     for (i = 0; i < 32; i++) {
29895c32e2e4SJose Ricardo Ziviani         bcd_get_digit(b, i, &invalid);
29905c32e2e4SJose Ricardo Ziviani 
29915c32e2e4SJose Ricardo Ziviani         if (unlikely(invalid)) {
29925c32e2e4SJose Ricardo Ziviani             return CRF_SO;
29935c32e2e4SJose Ricardo Ziviani         }
29945c32e2e4SJose Ricardo Ziviani     }
29955c32e2e4SJose Ricardo Ziviani 
2996428115c3SMark Cave-Ayland     i = a->VsrSH(3);
29975c32e2e4SJose Ricardo Ziviani     if (i > 16 && i < 33) {
29985c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (128 - i * 4);
29993c385a93SMark Cave-Ayland         if (ret.VsrD(0) & ~mask) {
30005c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
30015c32e2e4SJose Ricardo Ziviani         }
30025c32e2e4SJose Ricardo Ziviani 
30033c385a93SMark Cave-Ayland         ret.VsrD(0) &= mask;
30045c32e2e4SJose Ricardo Ziviani     } else if (i > 0 && i <= 16) {
30055c32e2e4SJose Ricardo Ziviani         mask = (uint64_t)-1 >> (64 - i * 4);
30063c385a93SMark Cave-Ayland         if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) {
30075c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
30085c32e2e4SJose Ricardo Ziviani         }
30095c32e2e4SJose Ricardo Ziviani 
30103c385a93SMark Cave-Ayland         ret.VsrD(1) &= mask;
30113c385a93SMark Cave-Ayland         ret.VsrD(0) = 0;
30125c32e2e4SJose Ricardo Ziviani     } else if (i == 0) {
30133c385a93SMark Cave-Ayland         if (ret.VsrD(0) || ret.VsrD(1)) {
30145c32e2e4SJose Ricardo Ziviani             ox_flag = CRF_SO;
30155c32e2e4SJose Ricardo Ziviani         }
30163c385a93SMark Cave-Ayland         ret.VsrD(0) = ret.VsrD(1) = 0;
30175c32e2e4SJose Ricardo Ziviani     }
30185c32e2e4SJose Ricardo Ziviani 
30195c32e2e4SJose Ricardo Ziviani     *r = ret;
30203c385a93SMark Cave-Ayland     if (r->VsrD(0) == 0 && r->VsrD(1) == 0) {
30215c32e2e4SJose Ricardo Ziviani         return ox_flag | CRF_EQ;
30225c32e2e4SJose Ricardo Ziviani     }
30235c32e2e4SJose Ricardo Ziviani 
30245c32e2e4SJose Ricardo Ziviani     return ox_flag | CRF_GT;
30255c32e2e4SJose Ricardo Ziviani }
30265c32e2e4SJose Ricardo Ziviani 
3027fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a)
3028fcf5ef2aSThomas Huth {
3029fcf5ef2aSThomas Huth     int i;
3030fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
3031fcf5ef2aSThomas Huth         r->u8[i] = AES_sbox[a->u8[i]];
3032fcf5ef2aSThomas Huth     }
3033fcf5ef2aSThomas Huth }
3034fcf5ef2aSThomas Huth 
3035fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
3036fcf5ef2aSThomas Huth {
3037fcf5ef2aSThomas Huth     ppc_avr_t result;
3038fcf5ef2aSThomas Huth     int i;
3039fcf5ef2aSThomas Huth 
3040fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
30412dea57dbSMark Cave-Ayland         result.VsrW(i) = b->VsrW(i) ^
30422dea57dbSMark Cave-Ayland             (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^
30432dea57dbSMark Cave-Ayland              AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^
30442dea57dbSMark Cave-Ayland              AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^
30452dea57dbSMark Cave-Ayland              AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]);
3046fcf5ef2aSThomas Huth     }
3047fcf5ef2aSThomas Huth     *r = result;
3048fcf5ef2aSThomas Huth }
3049fcf5ef2aSThomas Huth 
3050fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
3051fcf5ef2aSThomas Huth {
3052fcf5ef2aSThomas Huth     ppc_avr_t result;
3053fcf5ef2aSThomas Huth     int i;
3054fcf5ef2aSThomas Huth 
3055fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
30562dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]);
3057fcf5ef2aSThomas Huth     }
3058fcf5ef2aSThomas Huth     *r = result;
3059fcf5ef2aSThomas Huth }
3060fcf5ef2aSThomas Huth 
3061fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
3062fcf5ef2aSThomas Huth {
3063fcf5ef2aSThomas Huth     /* This differs from what is written in ISA V2.07.  The RTL is */
3064fcf5ef2aSThomas Huth     /* incorrect and will be fixed in V2.07B.                      */
3065fcf5ef2aSThomas Huth     int i;
3066fcf5ef2aSThomas Huth     ppc_avr_t tmp;
3067fcf5ef2aSThomas Huth 
3068fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
30692dea57dbSMark Cave-Ayland         tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])];
3070fcf5ef2aSThomas Huth     }
3071fcf5ef2aSThomas Huth 
3072fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u32) {
30732dea57dbSMark Cave-Ayland         r->VsrW(i) =
30742dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 0)][0] ^
30752dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 1)][1] ^
30762dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 2)][2] ^
30772dea57dbSMark Cave-Ayland             AES_imc[tmp.VsrB(4 * i + 3)][3];
3078fcf5ef2aSThomas Huth     }
3079fcf5ef2aSThomas Huth }
3080fcf5ef2aSThomas Huth 
3081fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
3082fcf5ef2aSThomas Huth {
3083fcf5ef2aSThomas Huth     ppc_avr_t result;
3084fcf5ef2aSThomas Huth     int i;
3085fcf5ef2aSThomas Huth 
3086fcf5ef2aSThomas Huth     VECTOR_FOR_INORDER_I(i, u8) {
30872dea57dbSMark Cave-Ayland         result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]);
3088fcf5ef2aSThomas Huth     }
3089fcf5ef2aSThomas Huth     *r = result;
3090fcf5ef2aSThomas Huth }
3091fcf5ef2aSThomas Huth 
3092fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
3093fcf5ef2aSThomas Huth {
3094fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
3095fcf5ef2aSThomas Huth     int six = st_six & 0xF;
3096fcf5ef2aSThomas Huth     int i;
3097fcf5ef2aSThomas Huth 
3098730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
3099fcf5ef2aSThomas Huth         if (st == 0) {
3100fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
31010ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 7) ^
31020ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 18) ^
3103730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 3);
3104fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
31050ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 17) ^
31060ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 19) ^
3107730d2ca3SMark Cave-Ayland                              (a->VsrW(i) >> 10);
3108fcf5ef2aSThomas Huth             }
3109fcf5ef2aSThomas Huth         } else { /* st == 1 */
3110fcf5ef2aSThomas Huth             if ((six & (0x8 >> i)) == 0) {
31110ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 2) ^
31120ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 13) ^
31130ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 22);
3114fcf5ef2aSThomas Huth             } else { /* six.bit[i] == 1 */
31150ef83bf2SMark Cave-Ayland                 r->VsrW(i) = ror32(a->VsrW(i), 6) ^
31160ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 11) ^
31170ef83bf2SMark Cave-Ayland                              ror32(a->VsrW(i), 25);
3118fcf5ef2aSThomas Huth             }
3119fcf5ef2aSThomas Huth         }
3120fcf5ef2aSThomas Huth     }
3121fcf5ef2aSThomas Huth }
3122fcf5ef2aSThomas Huth 
3123fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
3124fcf5ef2aSThomas Huth {
3125fcf5ef2aSThomas Huth     int st = (st_six & 0x10) != 0;
3126fcf5ef2aSThomas Huth     int six = st_six & 0xF;
3127fcf5ef2aSThomas Huth     int i;
3128fcf5ef2aSThomas Huth 
3129730d2ca3SMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u64); i++) {
3130fcf5ef2aSThomas Huth         if (st == 0) {
3131fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
31320ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 1) ^
31330ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 8) ^
3134730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 7);
3135fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
31360ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 19) ^
31370ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 61) ^
3138730d2ca3SMark Cave-Ayland                              (a->VsrD(i) >> 6);
3139fcf5ef2aSThomas Huth             }
3140fcf5ef2aSThomas Huth         } else { /* st == 1 */
3141fcf5ef2aSThomas Huth             if ((six & (0x8 >> (2 * i))) == 0) {
31420ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 28) ^
31430ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 34) ^
31440ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 39);
3145fcf5ef2aSThomas Huth             } else { /* six.bit[2*i] == 1 */
31460ef83bf2SMark Cave-Ayland                 r->VsrD(i) = ror64(a->VsrD(i), 14) ^
31470ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 18) ^
31480ef83bf2SMark Cave-Ayland                              ror64(a->VsrD(i), 41);
3149fcf5ef2aSThomas Huth             }
3150fcf5ef2aSThomas Huth         }
3151fcf5ef2aSThomas Huth     }
3152fcf5ef2aSThomas Huth }
3153fcf5ef2aSThomas Huth 
3154fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
3155fcf5ef2aSThomas Huth {
3156fcf5ef2aSThomas Huth     ppc_avr_t result;
3157fcf5ef2aSThomas Huth     int i;
3158fcf5ef2aSThomas Huth 
315960594feaSMark Cave-Ayland     for (i = 0; i < ARRAY_SIZE(r->u8); i++) {
316060594feaSMark Cave-Ayland         int indexA = c->VsrB(i) >> 4;
316160594feaSMark Cave-Ayland         int indexB = c->VsrB(i) & 0xF;
316260594feaSMark Cave-Ayland 
316360594feaSMark Cave-Ayland         result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB);
3164fcf5ef2aSThomas Huth     }
3165fcf5ef2aSThomas Huth     *r = result;
3166fcf5ef2aSThomas Huth }
3167fcf5ef2aSThomas Huth 
3168fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I
3169fcf5ef2aSThomas Huth 
3170fcf5ef2aSThomas Huth /*****************************************************************************/
3171fcf5ef2aSThomas Huth /* SPE extension helpers */
3172fcf5ef2aSThomas Huth /* Use a table to make this quicker */
/* hbrev[n] is the 4-bit value n with its bit order reversed. */
static const uint8_t hbrev[16] = {
    0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE,
    0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF,
};

/* Reverse the bit order of a byte: swap the nibbles and reverse each one. */
static inline uint8_t byte_reverse(uint8_t val)
{
    return hbrev[val >> 4] | (hbrev[val & 0xF] << 4);
}

/*
 * Reverse the bit order of a 32-bit word: reverse the byte order and the
 * bits within each byte.
 *
 * Each reversed byte is widened to uint32_t before shifting; otherwise it
 * is promoted to int and "<< 24" of a value >= 0x80 overflows a signed int.
 */
static inline uint32_t word_reverse(uint32_t val)
{
    return (uint32_t)byte_reverse(val >> 24) |
        ((uint32_t)byte_reverse(val >> 16) << 8) |
        ((uint32_t)byte_reverse(val >> 8) << 16) |
        ((uint32_t)byte_reverse(val) << 24);
}
3188fcf5ef2aSThomas Huth 
3189fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */
3190fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2)
3191fcf5ef2aSThomas Huth {
3192fcf5ef2aSThomas Huth     uint32_t a, b, d, mask;
3193fcf5ef2aSThomas Huth 
3194fcf5ef2aSThomas Huth     mask = UINT32_MAX >> (32 - MASKBITS);
3195fcf5ef2aSThomas Huth     a = arg1 & mask;
3196fcf5ef2aSThomas Huth     b = arg2 & mask;
3197fcf5ef2aSThomas Huth     d = word_reverse(1 + word_reverse(a | ~b));
3198fcf5ef2aSThomas Huth     return (arg1 & ~mask) | (d & b);
3199fcf5ef2aSThomas Huth }
3200fcf5ef2aSThomas Huth 
/*
 * Count leading sign bits: when the top bit of val is set the value is
 * inverted first, then clz32() is applied.
 */
uint32_t helper_cntlsw32(uint32_t val)
{
    const uint32_t probe = (val & 0x80000000) ? ~val : val;

    return clz32(probe);
}
3209fcf5ef2aSThomas Huth 
/* Count leading zero bits of a 32-bit value; thin wrapper around clz32(). */
uint32_t helper_cntlzw32(uint32_t val)
{
    const uint32_t leading_zeros = clz32(val);

    return leading_zeros;
}
3214fcf5ef2aSThomas Huth 
3215fcf5ef2aSThomas Huth /* 440 specific */
3216fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high,
3217fcf5ef2aSThomas Huth                           target_ulong low, uint32_t update_Rc)
3218fcf5ef2aSThomas Huth {
3219fcf5ef2aSThomas Huth     target_ulong mask;
3220fcf5ef2aSThomas Huth     int i;
3221fcf5ef2aSThomas Huth 
3222fcf5ef2aSThomas Huth     i = 1;
3223fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
3224fcf5ef2aSThomas Huth         if ((high & mask) == 0) {
3225fcf5ef2aSThomas Huth             if (update_Rc) {
3226fcf5ef2aSThomas Huth                 env->crf[0] = 0x4;
3227fcf5ef2aSThomas Huth             }
3228fcf5ef2aSThomas Huth             goto done;
3229fcf5ef2aSThomas Huth         }
3230fcf5ef2aSThomas Huth         i++;
3231fcf5ef2aSThomas Huth     }
3232fcf5ef2aSThomas Huth     for (mask = 0xFF000000; mask != 0; mask = mask >> 8) {
3233fcf5ef2aSThomas Huth         if ((low & mask) == 0) {
3234fcf5ef2aSThomas Huth             if (update_Rc) {
3235fcf5ef2aSThomas Huth                 env->crf[0] = 0x8;
3236fcf5ef2aSThomas Huth             }
3237fcf5ef2aSThomas Huth             goto done;
3238fcf5ef2aSThomas Huth         }
3239fcf5ef2aSThomas Huth         i++;
3240fcf5ef2aSThomas Huth     }
3241fcf5ef2aSThomas Huth     i = 8;
3242fcf5ef2aSThomas Huth     if (update_Rc) {
3243fcf5ef2aSThomas Huth         env->crf[0] = 0x2;
3244fcf5ef2aSThomas Huth     }
3245fcf5ef2aSThomas Huth  done:
3246fcf5ef2aSThomas Huth     env->xer = (env->xer & ~0x7F) | i;
3247fcf5ef2aSThomas Huth     if (update_Rc) {
3248fcf5ef2aSThomas Huth         env->crf[0] |= xer_so;
3249fcf5ef2aSThomas Huth     }
3250fcf5ef2aSThomas Huth     return i;
3251fcf5ef2aSThomas Huth }
3252