1fcf5ef2aSThomas Huth /* 2fcf5ef2aSThomas Huth * PowerPC integer and vector emulation helpers for QEMU. 3fcf5ef2aSThomas Huth * 4fcf5ef2aSThomas Huth * Copyright (c) 2003-2007 Jocelyn Mayer 5fcf5ef2aSThomas Huth * 6fcf5ef2aSThomas Huth * This library is free software; you can redistribute it and/or 7fcf5ef2aSThomas Huth * modify it under the terms of the GNU Lesser General Public 8fcf5ef2aSThomas Huth * License as published by the Free Software Foundation; either 96bd039cdSChetan Pant * version 2.1 of the License, or (at your option) any later version. 10fcf5ef2aSThomas Huth * 11fcf5ef2aSThomas Huth * This library is distributed in the hope that it will be useful, 12fcf5ef2aSThomas Huth * but WITHOUT ANY WARRANTY; without even the implied warranty of 13fcf5ef2aSThomas Huth * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14fcf5ef2aSThomas Huth * Lesser General Public License for more details. 15fcf5ef2aSThomas Huth * 16fcf5ef2aSThomas Huth * You should have received a copy of the GNU Lesser General Public 17fcf5ef2aSThomas Huth * License along with this library; if not, see <http://www.gnu.org/licenses/>. 
18fcf5ef2aSThomas Huth */ 19db725815SMarkus Armbruster 20fcf5ef2aSThomas Huth #include "qemu/osdep.h" 21fcf5ef2aSThomas Huth #include "cpu.h" 22fcf5ef2aSThomas Huth #include "internal.h" 23fcf5ef2aSThomas Huth #include "qemu/host-utils.h" 24db725815SMarkus Armbruster #include "qemu/main-loop.h" 258a05fd9aSRichard Henderson #include "qemu/log.h" 26fcf5ef2aSThomas Huth #include "exec/helper-proto.h" 27fcf5ef2aSThomas Huth #include "crypto/aes.h" 2824f91e81SAlex Bennée #include "fpu/softfloat.h" 293f74b632SRichard Henderson #include "qapi/error.h" 303f74b632SRichard Henderson #include "qemu/guest-random.h" 311015fcabSMatheus Ferst #include "tcg/tcg-gvec-desc.h" 32fcf5ef2aSThomas Huth 33fcf5ef2aSThomas Huth #include "helper_regs.h" 34fcf5ef2aSThomas Huth /*****************************************************************************/ 35fcf5ef2aSThomas Huth /* Fixed point operations helpers */ 36fcf5ef2aSThomas Huth 37f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov) 38f32899deSNikunj A Dadhania { 39f32899deSNikunj A Dadhania if (unlikely(ov)) { 40af721a31SVíctor Colombo env->so = env->ov = env->ov32 = 1; 41f32899deSNikunj A Dadhania } else { 42af721a31SVíctor Colombo env->ov = env->ov32 = 0; 43f32899deSNikunj A Dadhania } 44f32899deSNikunj A Dadhania } 45f32899deSNikunj A Dadhania 46fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb, 47fcf5ef2aSThomas Huth uint32_t oe) 48fcf5ef2aSThomas Huth { 49fcf5ef2aSThomas Huth uint64_t rt = 0; 50fcf5ef2aSThomas Huth int overflow = 0; 51fcf5ef2aSThomas Huth 52fcf5ef2aSThomas Huth uint64_t dividend = (uint64_t)ra << 32; 53fcf5ef2aSThomas Huth uint64_t divisor = (uint32_t)rb; 54fcf5ef2aSThomas Huth 55fcf5ef2aSThomas Huth if (unlikely(divisor == 0)) { 56fcf5ef2aSThomas Huth overflow = 1; 57fcf5ef2aSThomas Huth } else { 58fcf5ef2aSThomas Huth rt = dividend / divisor; 59fcf5ef2aSThomas Huth overflow = rt > UINT32_MAX; 60fcf5ef2aSThomas Huth } 
61fcf5ef2aSThomas Huth 62fcf5ef2aSThomas Huth if (unlikely(overflow)) { 63fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 64fcf5ef2aSThomas Huth } 65fcf5ef2aSThomas Huth 66fcf5ef2aSThomas Huth if (oe) { 67f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 68fcf5ef2aSThomas Huth } 69fcf5ef2aSThomas Huth 70fcf5ef2aSThomas Huth return (target_ulong)rt; 71fcf5ef2aSThomas Huth } 72fcf5ef2aSThomas Huth 73fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb, 74fcf5ef2aSThomas Huth uint32_t oe) 75fcf5ef2aSThomas Huth { 76fcf5ef2aSThomas Huth int64_t rt = 0; 77fcf5ef2aSThomas Huth int overflow = 0; 78fcf5ef2aSThomas Huth 79fcf5ef2aSThomas Huth int64_t dividend = (int64_t)ra << 32; 80fcf5ef2aSThomas Huth int64_t divisor = (int64_t)((int32_t)rb); 81fcf5ef2aSThomas Huth 82fcf5ef2aSThomas Huth if (unlikely((divisor == 0) || 83fcf5ef2aSThomas Huth ((divisor == -1ull) && (dividend == INT64_MIN)))) { 84fcf5ef2aSThomas Huth overflow = 1; 85fcf5ef2aSThomas Huth } else { 86fcf5ef2aSThomas Huth rt = dividend / divisor; 87fcf5ef2aSThomas Huth overflow = rt != (int32_t)rt; 88fcf5ef2aSThomas Huth } 89fcf5ef2aSThomas Huth 90fcf5ef2aSThomas Huth if (unlikely(overflow)) { 91fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 92fcf5ef2aSThomas Huth } 93fcf5ef2aSThomas Huth 94fcf5ef2aSThomas Huth if (oe) { 95f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 96fcf5ef2aSThomas Huth } 97fcf5ef2aSThomas Huth 98fcf5ef2aSThomas Huth return (target_ulong)rt; 99fcf5ef2aSThomas Huth } 100fcf5ef2aSThomas Huth 101fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 102fcf5ef2aSThomas Huth 103fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe) 104fcf5ef2aSThomas Huth { 105fcf5ef2aSThomas Huth uint64_t rt = 0; 106fcf5ef2aSThomas Huth int overflow = 0; 107fcf5ef2aSThomas Huth 1089276a31cSLuis Pires if (unlikely(rb == 0 || ra >= rb)) { 1099276a31cSLuis Pires overflow = 1; 110fcf5ef2aSThomas Huth rt 
= 0; /* Undefined */ 1119276a31cSLuis Pires } else { 1129276a31cSLuis Pires divu128(&rt, &ra, rb); 113fcf5ef2aSThomas Huth } 114fcf5ef2aSThomas Huth 115fcf5ef2aSThomas Huth if (oe) { 116f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 117fcf5ef2aSThomas Huth } 118fcf5ef2aSThomas Huth 119fcf5ef2aSThomas Huth return rt; 120fcf5ef2aSThomas Huth } 121fcf5ef2aSThomas Huth 122fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe) 123fcf5ef2aSThomas Huth { 12440f3e79aSLuis Pires uint64_t rt = 0; 125fcf5ef2aSThomas Huth int64_t ra = (int64_t)rau; 126fcf5ef2aSThomas Huth int64_t rb = (int64_t)rbu; 1279276a31cSLuis Pires int overflow = 0; 128fcf5ef2aSThomas Huth 1299276a31cSLuis Pires if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) { 1309276a31cSLuis Pires overflow = 1; 131fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 1329276a31cSLuis Pires } else { 1339276a31cSLuis Pires divs128(&rt, &ra, rb); 134fcf5ef2aSThomas Huth } 135fcf5ef2aSThomas Huth 136fcf5ef2aSThomas Huth if (oe) { 137f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 138fcf5ef2aSThomas Huth } 139fcf5ef2aSThomas Huth 140fcf5ef2aSThomas Huth return rt; 141fcf5ef2aSThomas Huth } 142fcf5ef2aSThomas Huth 143fcf5ef2aSThomas Huth #endif 144fcf5ef2aSThomas Huth 145fcf5ef2aSThomas Huth 146fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 147fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */ 148fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff)) 149fcf5ef2aSThomas Huth 150b6cb41b2SDavid Gibson /* 151b6cb41b2SDavid Gibson * subtract 1 from each byte, and with inverse, check if MSB is set at each 152fcf5ef2aSThomas Huth * byte. 153fcf5ef2aSThomas Huth * i.e. 
((0x00 - 0x01) & ~(0x00)) & 0x80 154fcf5ef2aSThomas Huth * (0xFF & 0xFF) & 0x80 = 0x80 (zero found) 155fcf5ef2aSThomas Huth */ 156fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80)) 157fcf5ef2aSThomas Huth 158fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */ 159fcf5ef2aSThomas Huth #define hasvalue(x, n) (haszero((x) ^ pattern(n))) 160fcf5ef2aSThomas Huth 161fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb) 162fcf5ef2aSThomas Huth { 163efa73196SNikunj A Dadhania return hasvalue(rb, ra) ? CRF_GT : 0; 164fcf5ef2aSThomas Huth } 165fcf5ef2aSThomas Huth 166fcf5ef2aSThomas Huth #undef pattern 167fcf5ef2aSThomas Huth #undef haszero 168fcf5ef2aSThomas Huth #undef hasvalue 169fcf5ef2aSThomas Huth 170b6cb41b2SDavid Gibson /* 1713f74b632SRichard Henderson * Return a random number. 172fcf5ef2aSThomas Huth */ 1733f74b632SRichard Henderson uint64_t helper_darn32(void) 174fcf5ef2aSThomas Huth { 1753f74b632SRichard Henderson Error *err = NULL; 1763f74b632SRichard Henderson uint32_t ret; 1773f74b632SRichard Henderson 1783f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1793f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1803f74b632SRichard Henderson error_get_pretty(err)); 1813f74b632SRichard Henderson error_free(err); 182fcf5ef2aSThomas Huth return -1; 183fcf5ef2aSThomas Huth } 184fcf5ef2aSThomas Huth 1853f74b632SRichard Henderson return ret; 1863f74b632SRichard Henderson } 1873f74b632SRichard Henderson 1883f74b632SRichard Henderson uint64_t helper_darn64(void) 189fcf5ef2aSThomas Huth { 1903f74b632SRichard Henderson Error *err = NULL; 1913f74b632SRichard Henderson uint64_t ret; 1923f74b632SRichard Henderson 1933f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1943f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1953f74b632SRichard Henderson 
error_get_pretty(err)); 1963f74b632SRichard Henderson error_free(err); 197fcf5ef2aSThomas Huth return -1; 198fcf5ef2aSThomas Huth } 199fcf5ef2aSThomas Huth 2003f74b632SRichard Henderson return ret; 2013f74b632SRichard Henderson } 202fcf5ef2aSThomas Huth 203fcf5ef2aSThomas Huth uint64_t helper_bpermd(uint64_t rs, uint64_t rb) 204fcf5ef2aSThomas Huth { 205fcf5ef2aSThomas Huth int i; 206fcf5ef2aSThomas Huth uint64_t ra = 0; 207fcf5ef2aSThomas Huth 208fcf5ef2aSThomas Huth for (i = 0; i < 8; i++) { 209fcf5ef2aSThomas Huth int index = (rs >> (i * 8)) & 0xFF; 210fcf5ef2aSThomas Huth if (index < 64) { 211a6a444a8SCédric Le Goater if (rb & PPC_BIT(index)) { 212fcf5ef2aSThomas Huth ra |= 1 << i; 213fcf5ef2aSThomas Huth } 214fcf5ef2aSThomas Huth } 215fcf5ef2aSThomas Huth } 216fcf5ef2aSThomas Huth return ra; 217fcf5ef2aSThomas Huth } 218fcf5ef2aSThomas Huth 219fcf5ef2aSThomas Huth #endif 220fcf5ef2aSThomas Huth 221fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb) 222fcf5ef2aSThomas Huth { 223fcf5ef2aSThomas Huth target_ulong mask = 0xff; 224fcf5ef2aSThomas Huth target_ulong ra = 0; 225fcf5ef2aSThomas Huth int i; 226fcf5ef2aSThomas Huth 227fcf5ef2aSThomas Huth for (i = 0; i < sizeof(target_ulong); i++) { 228fcf5ef2aSThomas Huth if ((rs & mask) == (rb & mask)) { 229fcf5ef2aSThomas Huth ra |= mask; 230fcf5ef2aSThomas Huth } 231fcf5ef2aSThomas Huth mask <<= 8; 232fcf5ef2aSThomas Huth } 233fcf5ef2aSThomas Huth return ra; 234fcf5ef2aSThomas Huth } 235fcf5ef2aSThomas Huth 236fcf5ef2aSThomas Huth /* shift right arithmetic helper */ 237fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value, 238fcf5ef2aSThomas Huth target_ulong shift) 239fcf5ef2aSThomas Huth { 240fcf5ef2aSThomas Huth int32_t ret; 241fcf5ef2aSThomas Huth 242fcf5ef2aSThomas Huth if (likely(!(shift & 0x20))) { 243fcf5ef2aSThomas Huth if (likely((uint32_t)shift != 0)) { 244fcf5ef2aSThomas Huth shift &= 0x1f; 245fcf5ef2aSThomas Huth ret = (int32_t)value >> shift; 
246fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) { 247af1c259fSSandipan Das env->ca32 = env->ca = 0; 248fcf5ef2aSThomas Huth } else { 249af1c259fSSandipan Das env->ca32 = env->ca = 1; 250fcf5ef2aSThomas Huth } 251fcf5ef2aSThomas Huth } else { 252fcf5ef2aSThomas Huth ret = (int32_t)value; 253af1c259fSSandipan Das env->ca32 = env->ca = 0; 254fcf5ef2aSThomas Huth } 255fcf5ef2aSThomas Huth } else { 256fcf5ef2aSThomas Huth ret = (int32_t)value >> 31; 257af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 258fcf5ef2aSThomas Huth } 259fcf5ef2aSThomas Huth return (target_long)ret; 260fcf5ef2aSThomas Huth } 261fcf5ef2aSThomas Huth 262fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 263fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value, 264fcf5ef2aSThomas Huth target_ulong shift) 265fcf5ef2aSThomas Huth { 266fcf5ef2aSThomas Huth int64_t ret; 267fcf5ef2aSThomas Huth 268fcf5ef2aSThomas Huth if (likely(!(shift & 0x40))) { 269fcf5ef2aSThomas Huth if (likely((uint64_t)shift != 0)) { 270fcf5ef2aSThomas Huth shift &= 0x3f; 271fcf5ef2aSThomas Huth ret = (int64_t)value >> shift; 272fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) { 273af1c259fSSandipan Das env->ca32 = env->ca = 0; 274fcf5ef2aSThomas Huth } else { 275af1c259fSSandipan Das env->ca32 = env->ca = 1; 276fcf5ef2aSThomas Huth } 277fcf5ef2aSThomas Huth } else { 278fcf5ef2aSThomas Huth ret = (int64_t)value; 279af1c259fSSandipan Das env->ca32 = env->ca = 0; 280fcf5ef2aSThomas Huth } 281fcf5ef2aSThomas Huth } else { 282fcf5ef2aSThomas Huth ret = (int64_t)value >> 63; 283af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 284fcf5ef2aSThomas Huth } 285fcf5ef2aSThomas Huth return ret; 286fcf5ef2aSThomas Huth } 287fcf5ef2aSThomas Huth #endif 288fcf5ef2aSThomas Huth 289fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 290fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 291fcf5ef2aSThomas Huth { 29279770002SRichard 
Henderson /* Note that we don't fold past bytes */ 293fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 294fcf5ef2aSThomas Huth 0x5555555555555555ULL); 295fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 296fcf5ef2aSThomas Huth 0x3333333333333333ULL); 297fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 298fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 299fcf5ef2aSThomas Huth return val; 300fcf5ef2aSThomas Huth } 301fcf5ef2aSThomas Huth 302fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val) 303fcf5ef2aSThomas Huth { 30479770002SRichard Henderson /* Note that we don't fold past words. */ 305fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 306fcf5ef2aSThomas Huth 0x5555555555555555ULL); 307fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 308fcf5ef2aSThomas Huth 0x3333333333333333ULL); 309fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 310fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 311fcf5ef2aSThomas Huth val = (val & 0x00ff00ff00ff00ffULL) + ((val >> 8) & 312fcf5ef2aSThomas Huth 0x00ff00ff00ff00ffULL); 313fcf5ef2aSThomas Huth val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) & 314fcf5ef2aSThomas Huth 0x0000ffff0000ffffULL); 315fcf5ef2aSThomas Huth return val; 316fcf5ef2aSThomas Huth } 317fcf5ef2aSThomas Huth #else 318fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 319fcf5ef2aSThomas Huth { 32079770002SRichard Henderson /* Note that we don't fold past bytes */ 321fcf5ef2aSThomas Huth val = (val & 0x55555555) + ((val >> 1) & 0x55555555); 322fcf5ef2aSThomas Huth val = (val & 0x33333333) + ((val >> 2) & 0x33333333); 323fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f) + ((val >> 4) & 0x0f0f0f0f); 324fcf5ef2aSThomas Huth return val; 325fcf5ef2aSThomas Huth } 326fcf5ef2aSThomas Huth #endif 327fcf5ef2aSThomas Huth 3286e0bbc40SMatheus Ferst uint64_t helper_CFUGED(uint64_t src, uint64_t mask) 
32989ccd7dcSMatheus Ferst { 33089ccd7dcSMatheus Ferst /* 33189ccd7dcSMatheus Ferst * Instead of processing the mask bit-by-bit from the most significant to 33289ccd7dcSMatheus Ferst * the least significant bit, as described in PowerISA, we'll handle it in 33389ccd7dcSMatheus Ferst * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use 33489ccd7dcSMatheus Ferst * ctz or cto, we negate the mask at the end of the loop. 33589ccd7dcSMatheus Ferst */ 33689ccd7dcSMatheus Ferst target_ulong m, left = 0, right = 0; 33789ccd7dcSMatheus Ferst unsigned int n, i = 64; 33889ccd7dcSMatheus Ferst bool bit = false; /* tracks if we are processing zeros or ones */ 33989ccd7dcSMatheus Ferst 34089ccd7dcSMatheus Ferst if (mask == 0 || mask == -1) { 34189ccd7dcSMatheus Ferst return src; 34289ccd7dcSMatheus Ferst } 34389ccd7dcSMatheus Ferst 34489ccd7dcSMatheus Ferst /* Processes the mask in blocks, from LSB to MSB */ 34589ccd7dcSMatheus Ferst while (i) { 34689ccd7dcSMatheus Ferst /* Find how many bits we should take */ 34789ccd7dcSMatheus Ferst n = ctz64(mask); 34889ccd7dcSMatheus Ferst if (n > i) { 34989ccd7dcSMatheus Ferst n = i; 35089ccd7dcSMatheus Ferst } 35189ccd7dcSMatheus Ferst 35289ccd7dcSMatheus Ferst /* 35389ccd7dcSMatheus Ferst * Extracts 'n' trailing bits of src and put them on the leading 'n' 35489ccd7dcSMatheus Ferst * bits of 'right' or 'left', pushing down the previously extracted 35589ccd7dcSMatheus Ferst * values. 35689ccd7dcSMatheus Ferst */ 35789ccd7dcSMatheus Ferst m = (1ll << n) - 1; 35889ccd7dcSMatheus Ferst if (bit) { 35989ccd7dcSMatheus Ferst right = ror64(right | (src & m), n); 36089ccd7dcSMatheus Ferst } else { 36189ccd7dcSMatheus Ferst left = ror64(left | (src & m), n); 36289ccd7dcSMatheus Ferst } 36389ccd7dcSMatheus Ferst 36489ccd7dcSMatheus Ferst /* 36589ccd7dcSMatheus Ferst * Discards the processed bits from 'src' and 'mask'. 
Note that we are 36689ccd7dcSMatheus Ferst * removing 'n' trailing zeros from 'mask', but the logical shift will 36789ccd7dcSMatheus Ferst * add 'n' leading zeros back, so the population count of 'mask' is kept 36889ccd7dcSMatheus Ferst * the same. 36989ccd7dcSMatheus Ferst */ 37089ccd7dcSMatheus Ferst src >>= n; 37189ccd7dcSMatheus Ferst mask >>= n; 37289ccd7dcSMatheus Ferst i -= n; 37389ccd7dcSMatheus Ferst bit = !bit; 37489ccd7dcSMatheus Ferst mask = ~mask; 37589ccd7dcSMatheus Ferst } 37689ccd7dcSMatheus Ferst 37789ccd7dcSMatheus Ferst /* 37889ccd7dcSMatheus Ferst * At the end, right was ror'ed ctpop(mask) times. To put it back in place, 37989ccd7dcSMatheus Ferst * we'll shift it more 64-ctpop(mask) times. 38089ccd7dcSMatheus Ferst */ 38189ccd7dcSMatheus Ferst if (bit) { 38289ccd7dcSMatheus Ferst n = ctpop64(mask); 38389ccd7dcSMatheus Ferst } else { 38489ccd7dcSMatheus Ferst n = 64 - ctpop64(mask); 38589ccd7dcSMatheus Ferst } 38689ccd7dcSMatheus Ferst 38789ccd7dcSMatheus Ferst return left | (right >> n); 38889ccd7dcSMatheus Ferst } 38989ccd7dcSMatheus Ferst 39021ba6e58SMatheus Ferst uint64_t helper_PDEPD(uint64_t src, uint64_t mask) 39121ba6e58SMatheus Ferst { 39221ba6e58SMatheus Ferst int i, o; 39321ba6e58SMatheus Ferst uint64_t result = 0; 39421ba6e58SMatheus Ferst 39521ba6e58SMatheus Ferst if (mask == -1) { 39621ba6e58SMatheus Ferst return src; 39721ba6e58SMatheus Ferst } 39821ba6e58SMatheus Ferst 39921ba6e58SMatheus Ferst for (i = 0; mask != 0; i++) { 40021ba6e58SMatheus Ferst o = ctz64(mask); 40121ba6e58SMatheus Ferst mask &= mask - 1; 40221ba6e58SMatheus Ferst result |= ((src >> i) & 1) << o; 40321ba6e58SMatheus Ferst } 40421ba6e58SMatheus Ferst 40521ba6e58SMatheus Ferst return result; 40621ba6e58SMatheus Ferst } 4078bdb7606SMatheus Ferst 4088bdb7606SMatheus Ferst uint64_t helper_PEXTD(uint64_t src, uint64_t mask) 4098bdb7606SMatheus Ferst { 4108bdb7606SMatheus Ferst int i, o; 4118bdb7606SMatheus Ferst uint64_t result = 0; 4128bdb7606SMatheus Ferst 
4138bdb7606SMatheus Ferst if (mask == -1) { 4148bdb7606SMatheus Ferst return src; 4158bdb7606SMatheus Ferst } 4168bdb7606SMatheus Ferst 4178bdb7606SMatheus Ferst for (o = 0; mask != 0; o++) { 4188bdb7606SMatheus Ferst i = ctz64(mask); 4198bdb7606SMatheus Ferst mask &= mask - 1; 4208bdb7606SMatheus Ferst result |= ((src >> i) & 1) << o; 4218bdb7606SMatheus Ferst } 4228bdb7606SMatheus Ferst 4238bdb7606SMatheus Ferst return result; 4248bdb7606SMatheus Ferst } 42521ba6e58SMatheus Ferst 426fcf5ef2aSThomas Huth /*****************************************************************************/ 427fcf5ef2aSThomas Huth /* Altivec extension helpers */ 428e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 429fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 430fcf5ef2aSThomas Huth for (index = 0; index < ARRAY_SIZE(r->element); index++) 431fcf5ef2aSThomas Huth #else 432fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 433fcf5ef2aSThomas Huth for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--) 434fcf5ef2aSThomas Huth #endif 435fcf5ef2aSThomas Huth 436fcf5ef2aSThomas Huth /* Saturating arithmetic helpers. 
*/
/*
 * SATCVT defines cvt<from><to>(x, sat): convert x from from_type to to_type,
 * clamping to [min, max].  *sat is set to 1 whenever clamping happened and
 * is left untouched otherwise, so callers can accumulate it over a loop.
 */
#define SATCVT(from, to, from_type, to_type, min, max)          \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x < (from_type)min) {                               \
            *sat = 1;                                           \
            return min;                                         \
        }                                                       \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }
/*
 * SATCVTU is the variant for unsigned sources: only the upper bound is
 * checked, the 'min' argument is accepted but not used.
 */
#define SATCVTU(from, to, from_type, to_type, min, max)         \
    static inline to_type cvt##from##to(from_type x, int *sat)  \
    {                                                           \
        if (x > (from_type)max) {                               \
            *sat = 1;                                           \
            return max;                                         \
        }                                                       \
        return x;                                               \
    }
SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX)
SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX)
SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX)

SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX)
SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX)
SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX)
SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX)
SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX)
SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX)
#undef SATCVT
#undef SATCVTU
478fcf5ef2aSThomas Huth 479dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr) 480fcf5ef2aSThomas Huth { 481c19940dbSBruno Larsen (billionai) ppc_store_vscr(env, vscr); 482fcf5ef2aSThomas Huth } 483fcf5ef2aSThomas Huth 484cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env) 485cc2b90d7SRichard Henderson { 486c19940dbSBruno Larsen (billionai) return ppc_get_vscr(env); 487cc2b90d7SRichard Henderson } 488cc2b90d7SRichard Henderson 4896175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env) 4906175f5a0SRichard Henderson { 4919b5b74daSRichard Henderson /* The choice of non-zero value is arbitrary. */ 4929b5b74daSRichard Henderson env->vscr_sat.u32[0] = 1; 4936175f5a0SRichard Henderson } 4946175f5a0SRichard Henderson 495fcf5ef2aSThomas Huth /* vprtybq */ 496*d57fbd8fSLucas Mateus Castro (alqotel) void helper_VPRTYBQ(ppc_avr_t *r, ppc_avr_t *b, uint32_t v) 497fcf5ef2aSThomas Huth { 498fcf5ef2aSThomas Huth uint64_t res = b->u64[0] ^ b->u64[1]; 499fcf5ef2aSThomas Huth res ^= res >> 32; 500fcf5ef2aSThomas Huth res ^= res >> 16; 501fcf5ef2aSThomas Huth res ^= res >> 8; 5023c385a93SMark Cave-Ayland r->VsrD(1) = res & 1; 5033c385a93SMark Cave-Ayland r->VsrD(0) = 0; 504fcf5ef2aSThomas Huth } 505fcf5ef2aSThomas Huth 506fcf5ef2aSThomas Huth #define VARITHFP(suffix, func) \ 507fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 508fcf5ef2aSThomas Huth ppc_avr_t *b) \ 509fcf5ef2aSThomas Huth { \ 510fcf5ef2aSThomas Huth int i; \ 511fcf5ef2aSThomas Huth \ 51205ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 51305ee3e8aSMark Cave-Ayland r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status); \ 514fcf5ef2aSThomas Huth } \ 515fcf5ef2aSThomas Huth } 516fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add) 517fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub) 518fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min) 519fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max) 
520fcf5ef2aSThomas Huth #undef VARITHFP 521fcf5ef2aSThomas Huth 522fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type) \ 523fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 524fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) \ 525fcf5ef2aSThomas Huth { \ 526fcf5ef2aSThomas Huth int i; \ 52705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 52805ee3e8aSMark Cave-Ayland r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \ 529fcf5ef2aSThomas Huth type, &env->vec_status); \ 530fcf5ef2aSThomas Huth } \ 531fcf5ef2aSThomas Huth } 532fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0); 533fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c); 534fcf5ef2aSThomas Huth #undef VARITHFPFMA 535fcf5ef2aSThomas Huth 536fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element) \ 537fcf5ef2aSThomas Huth { \ 538fcf5ef2aSThomas Huth type result = (type)a->element[i] op (type)b->element[i]; \ 539fcf5ef2aSThomas Huth r->element[i] = cvt(result, &sat); \ 540fcf5ef2aSThomas Huth } 541fcf5ef2aSThomas Huth 542fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element) \ 543fb11ae7dSRichard Henderson void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat, \ 544fb11ae7dSRichard Henderson ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \ 545fcf5ef2aSThomas Huth { \ 546fcf5ef2aSThomas Huth int sat = 0; \ 547fcf5ef2aSThomas Huth int i; \ 548fcf5ef2aSThomas Huth \ 549fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 550fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 551fcf5ef2aSThomas Huth } \ 552fcf5ef2aSThomas Huth if (sat) { \ 553fb11ae7dSRichard Henderson vscr_sat->u32[0] = 1; \ 554fcf5ef2aSThomas Huth } \ 555fcf5ef2aSThomas Huth } 556fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt) \ 557fcf5ef2aSThomas Huth VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element) \ 558fcf5ef2aSThomas Huth 
VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element) 559fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt) \ 560fcf5ef2aSThomas Huth VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element) \ 561fcf5ef2aSThomas Huth VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element) 562fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb) 563fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh) 564fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw) 565fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub) 566fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh) 567fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw) 568fcf5ef2aSThomas Huth #undef VARITHSAT_CASE 569fcf5ef2aSThomas Huth #undef VARITHSAT_DO 570fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED 571fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED 572fcf5ef2aSThomas Huth 573fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype) \ 574fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 575fcf5ef2aSThomas Huth { \ 576fcf5ef2aSThomas Huth int i; \ 577fcf5ef2aSThomas Huth \ 578fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 579fcf5ef2aSThomas Huth etype x = (etype)a->element[i] + (etype)b->element[i] + 1; \ 580fcf5ef2aSThomas Huth r->element[i] = x >> 1; \ 581fcf5ef2aSThomas Huth } \ 582fcf5ef2aSThomas Huth } 583fcf5ef2aSThomas Huth 584fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element, \ 585fcf5ef2aSThomas Huth unsigned_type) \ 586fcf5ef2aSThomas Huth VAVG_DO(avgs##type, signed_element, signed_type) \ 587fcf5ef2aSThomas Huth VAVG_DO(avgu##type, unsigned_element, unsigned_type) 588fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t) 589fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t) 590fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t) 591fcf5ef2aSThomas Huth #undef VAVG_DO 592fcf5ef2aSThomas Huth #undef VAVG 
593fcf5ef2aSThomas Huth 594fcf5ef2aSThomas Huth #define VABSDU_DO(name, element) \ 595fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 596fcf5ef2aSThomas Huth { \ 597fcf5ef2aSThomas Huth int i; \ 598fcf5ef2aSThomas Huth \ 599fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 600fcf5ef2aSThomas Huth r->element[i] = (a->element[i] > b->element[i]) ? \ 601fcf5ef2aSThomas Huth (a->element[i] - b->element[i]) : \ 602fcf5ef2aSThomas Huth (b->element[i] - a->element[i]); \ 603fcf5ef2aSThomas Huth } \ 604fcf5ef2aSThomas Huth } 605fcf5ef2aSThomas Huth 606b6cb41b2SDavid Gibson /* 607b6cb41b2SDavid Gibson * VABSDU - Vector absolute difference unsigned 608fcf5ef2aSThomas Huth * name - instruction mnemonic suffix (b: byte, h: halfword, w: word) 609fcf5ef2aSThomas Huth * element - element type to access from vector 610fcf5ef2aSThomas Huth */ 611fcf5ef2aSThomas Huth #define VABSDU(type, element) \ 612fcf5ef2aSThomas Huth VABSDU_DO(absdu##type, element) 613fcf5ef2aSThomas Huth VABSDU(b, u8) 614fcf5ef2aSThomas Huth VABSDU(h, u16) 615fcf5ef2aSThomas Huth VABSDU(w, u32) 616fcf5ef2aSThomas Huth #undef VABSDU_DO 617fcf5ef2aSThomas Huth #undef VABSDU 618fcf5ef2aSThomas Huth 619fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element) \ 620fcf5ef2aSThomas Huth void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r, \ 621fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 622fcf5ef2aSThomas Huth { \ 623fcf5ef2aSThomas Huth int i; \ 624fcf5ef2aSThomas Huth \ 62505ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 626fcf5ef2aSThomas Huth float32 t = cvt(b->element[i], &env->vec_status); \ 62705ee3e8aSMark Cave-Ayland r->f32[i] = float32_scalbn(t, -uim, &env->vec_status); \ 628fcf5ef2aSThomas Huth } \ 629fcf5ef2aSThomas Huth } 630fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32) 631fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32) 632fcf5ef2aSThomas Huth #undef VCF 633fcf5ef2aSThomas Huth 634eb936dc0SMatheus Ferst 
#define VCMPNEZ(NAME, ELEM) \ 635eb936dc0SMatheus Ferst void helper_##NAME(ppc_vsr_t *t, ppc_vsr_t *a, ppc_vsr_t *b, uint32_t desc) \ 636fcf5ef2aSThomas Huth { \ 637eb936dc0SMatheus Ferst for (int i = 0; i < ARRAY_SIZE(t->ELEM); i++) { \ 638eb936dc0SMatheus Ferst t->ELEM[i] = ((a->ELEM[i] == 0) || (b->ELEM[i] == 0) || \ 639eb936dc0SMatheus Ferst (a->ELEM[i] != b->ELEM[i])) ? -1 : 0; \ 640fcf5ef2aSThomas Huth } \ 641fcf5ef2aSThomas Huth } 642eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZB, u8) 643eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZH, u16) 644eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZW, u32) 645eb936dc0SMatheus Ferst #undef VCMPNEZ 646fcf5ef2aSThomas Huth 647fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record) \ 648fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 649fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 650fcf5ef2aSThomas Huth { \ 651fcf5ef2aSThomas Huth uint32_t ones = (uint32_t)-1; \ 652fcf5ef2aSThomas Huth uint32_t all = ones; \ 653fcf5ef2aSThomas Huth uint32_t none = 0; \ 654fcf5ef2aSThomas Huth int i; \ 655fcf5ef2aSThomas Huth \ 65605ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 657fcf5ef2aSThomas Huth uint32_t result; \ 65871bfd65cSRichard Henderson FloatRelation rel = \ 65971bfd65cSRichard Henderson float32_compare_quiet(a->f32[i], b->f32[i], \ 660fcf5ef2aSThomas Huth &env->vec_status); \ 661fcf5ef2aSThomas Huth if (rel == float_relation_unordered) { \ 662fcf5ef2aSThomas Huth result = 0; \ 663fcf5ef2aSThomas Huth } else if (rel compare order) { \ 664fcf5ef2aSThomas Huth result = ones; \ 665fcf5ef2aSThomas Huth } else { \ 666fcf5ef2aSThomas Huth result = 0; \ 667fcf5ef2aSThomas Huth } \ 668fcf5ef2aSThomas Huth r->u32[i] = result; \ 669fcf5ef2aSThomas Huth all &= result; \ 670fcf5ef2aSThomas Huth none |= result; \ 671fcf5ef2aSThomas Huth } \ 672fcf5ef2aSThomas Huth if (record) { \ 673fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 674fcf5ef2aSThomas Huth } \ 
675fcf5ef2aSThomas Huth } 676fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order) \ 677fcf5ef2aSThomas Huth VCMPFP_DO(suffix, compare, order, 0) \ 678fcf5ef2aSThomas Huth VCMPFP_DO(suffix##_dot, compare, order, 1) 679fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal) 680fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less) 681fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater) 682fcf5ef2aSThomas Huth #undef VCMPFP_DO 683fcf5ef2aSThomas Huth #undef VCMPFP 684fcf5ef2aSThomas Huth 685fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r, 686fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b, int record) 687fcf5ef2aSThomas Huth { 688fcf5ef2aSThomas Huth int i; 689fcf5ef2aSThomas Huth int all_in = 0; 690fcf5ef2aSThomas Huth 69105ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 69271bfd65cSRichard Henderson FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i], 69305ee3e8aSMark Cave-Ayland &env->vec_status); 694fcf5ef2aSThomas Huth if (le_rel == float_relation_unordered) { 695fcf5ef2aSThomas Huth r->u32[i] = 0xc0000000; 696fcf5ef2aSThomas Huth all_in = 1; 697fcf5ef2aSThomas Huth } else { 69805ee3e8aSMark Cave-Ayland float32 bneg = float32_chs(b->f32[i]); 69971bfd65cSRichard Henderson FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg, 70005ee3e8aSMark Cave-Ayland &env->vec_status); 701fcf5ef2aSThomas Huth int le = le_rel != float_relation_greater; 702fcf5ef2aSThomas Huth int ge = ge_rel != float_relation_less; 703fcf5ef2aSThomas Huth 704fcf5ef2aSThomas Huth r->u32[i] = ((!le) << 31) | ((!ge) << 30); 705fcf5ef2aSThomas Huth all_in |= (!le | !ge); 706fcf5ef2aSThomas Huth } 707fcf5ef2aSThomas Huth } 708fcf5ef2aSThomas Huth if (record) { 709fcf5ef2aSThomas Huth env->crf[6] = (all_in == 0) << 1; 710fcf5ef2aSThomas Huth } 711fcf5ef2aSThomas Huth } 712fcf5ef2aSThomas Huth 713fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 
714fcf5ef2aSThomas Huth { 715fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 0); 716fcf5ef2aSThomas Huth } 717fcf5ef2aSThomas Huth 718fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 719fcf5ef2aSThomas Huth ppc_avr_t *b) 720fcf5ef2aSThomas Huth { 721fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 1); 722fcf5ef2aSThomas Huth } 723fcf5ef2aSThomas Huth 724fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element) \ 725fcf5ef2aSThomas Huth void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r, \ 726fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 727fcf5ef2aSThomas Huth { \ 728fcf5ef2aSThomas Huth int i; \ 729fcf5ef2aSThomas Huth int sat = 0; \ 730fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 731fcf5ef2aSThomas Huth \ 732fcf5ef2aSThomas Huth set_float_rounding_mode(float_round_to_zero, &s); \ 73305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 73405ee3e8aSMark Cave-Ayland if (float32_is_any_nan(b->f32[i])) { \ 735fcf5ef2aSThomas Huth r->element[i] = 0; \ 736fcf5ef2aSThomas Huth } else { \ 73705ee3e8aSMark Cave-Ayland float64 t = float32_to_float64(b->f32[i], &s); \ 738fcf5ef2aSThomas Huth int64_t j; \ 739fcf5ef2aSThomas Huth \ 740fcf5ef2aSThomas Huth t = float64_scalbn(t, uim, &s); \ 741fcf5ef2aSThomas Huth j = float64_to_int64(t, &s); \ 742fcf5ef2aSThomas Huth r->element[i] = satcvt(j, &sat); \ 743fcf5ef2aSThomas Huth } \ 744fcf5ef2aSThomas Huth } \ 745fcf5ef2aSThomas Huth if (sat) { \ 7466175f5a0SRichard Henderson set_vscr_sat(env); \ 747fcf5ef2aSThomas Huth } \ 748fcf5ef2aSThomas Huth } 749fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32) 750fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32) 751fcf5ef2aSThomas Huth #undef VCT 752fcf5ef2aSThomas Huth 75334553153SLucas Mateus Castro (alqotel) typedef int64_t do_ger(uint32_t, uint32_t, uint32_t); 75434553153SLucas Mateus Castro (alqotel) 75534553153SLucas Mateus Castro (alqotel) static int64_t ger_rank8(uint32_t a, uint32_t b, uint32_t mask) 
75634553153SLucas Mateus Castro (alqotel) { 75734553153SLucas Mateus Castro (alqotel) int64_t psum = 0; 75834553153SLucas Mateus Castro (alqotel) for (int i = 0; i < 8; i++, mask >>= 1) { 75934553153SLucas Mateus Castro (alqotel) if (mask & 1) { 760feeef6b6SDaniel Henrique Barboza psum += (int64_t)sextract32(a, 4 * i, 4) * sextract32(b, 4 * i, 4); 76134553153SLucas Mateus Castro (alqotel) } 76234553153SLucas Mateus Castro (alqotel) } 76334553153SLucas Mateus Castro (alqotel) return psum; 76434553153SLucas Mateus Castro (alqotel) } 76534553153SLucas Mateus Castro (alqotel) 76634553153SLucas Mateus Castro (alqotel) static int64_t ger_rank4(uint32_t a, uint32_t b, uint32_t mask) 76734553153SLucas Mateus Castro (alqotel) { 76834553153SLucas Mateus Castro (alqotel) int64_t psum = 0; 76934553153SLucas Mateus Castro (alqotel) for (int i = 0; i < 4; i++, mask >>= 1) { 77034553153SLucas Mateus Castro (alqotel) if (mask & 1) { 77134553153SLucas Mateus Castro (alqotel) psum += sextract32(a, 8 * i, 8) * (int64_t)extract32(b, 8 * i, 8); 77234553153SLucas Mateus Castro (alqotel) } 77334553153SLucas Mateus Castro (alqotel) } 77434553153SLucas Mateus Castro (alqotel) return psum; 77534553153SLucas Mateus Castro (alqotel) } 77634553153SLucas Mateus Castro (alqotel) 77734553153SLucas Mateus Castro (alqotel) static int64_t ger_rank2(uint32_t a, uint32_t b, uint32_t mask) 77834553153SLucas Mateus Castro (alqotel) { 77934553153SLucas Mateus Castro (alqotel) int64_t psum = 0; 78034553153SLucas Mateus Castro (alqotel) for (int i = 0; i < 2; i++, mask >>= 1) { 78134553153SLucas Mateus Castro (alqotel) if (mask & 1) { 782feeef6b6SDaniel Henrique Barboza psum += (int64_t)sextract32(a, 16 * i, 16) * 783feeef6b6SDaniel Henrique Barboza sextract32(b, 16 * i, 16); 78434553153SLucas Mateus Castro (alqotel) } 78534553153SLucas Mateus Castro (alqotel) } 78634553153SLucas Mateus Castro (alqotel) return psum; 78734553153SLucas Mateus Castro (alqotel) } 78834553153SLucas Mateus Castro (alqotel) 
78934553153SLucas Mateus Castro (alqotel) static void xviger(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, ppc_acc_t *at, 79034553153SLucas Mateus Castro (alqotel) uint32_t mask, bool sat, bool acc, do_ger ger) 79134553153SLucas Mateus Castro (alqotel) { 79234553153SLucas Mateus Castro (alqotel) uint8_t pmsk = FIELD_EX32(mask, GER_MSK, PMSK), 79334553153SLucas Mateus Castro (alqotel) xmsk = FIELD_EX32(mask, GER_MSK, XMSK), 79434553153SLucas Mateus Castro (alqotel) ymsk = FIELD_EX32(mask, GER_MSK, YMSK); 79534553153SLucas Mateus Castro (alqotel) uint8_t xmsk_bit, ymsk_bit; 79634553153SLucas Mateus Castro (alqotel) int64_t psum; 79734553153SLucas Mateus Castro (alqotel) int i, j; 79834553153SLucas Mateus Castro (alqotel) for (i = 0, xmsk_bit = 1 << 3; i < 4; i++, xmsk_bit >>= 1) { 79934553153SLucas Mateus Castro (alqotel) for (j = 0, ymsk_bit = 1 << 3; j < 4; j++, ymsk_bit >>= 1) { 80034553153SLucas Mateus Castro (alqotel) if ((xmsk_bit & xmsk) && (ymsk_bit & ymsk)) { 80134553153SLucas Mateus Castro (alqotel) psum = ger(a->VsrW(i), b->VsrW(j), pmsk); 80234553153SLucas Mateus Castro (alqotel) if (acc) { 80334553153SLucas Mateus Castro (alqotel) psum += at[i].VsrSW(j); 80434553153SLucas Mateus Castro (alqotel) } 80534553153SLucas Mateus Castro (alqotel) if (sat && psum > INT32_MAX) { 80634553153SLucas Mateus Castro (alqotel) set_vscr_sat(env); 80734553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = INT32_MAX; 80834553153SLucas Mateus Castro (alqotel) } else if (sat && psum < INT32_MIN) { 80934553153SLucas Mateus Castro (alqotel) set_vscr_sat(env); 81034553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = INT32_MIN; 81134553153SLucas Mateus Castro (alqotel) } else { 81234553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = (int32_t) psum; 81334553153SLucas Mateus Castro (alqotel) } 81434553153SLucas Mateus Castro (alqotel) } else { 81534553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = 0; 81634553153SLucas Mateus Castro (alqotel) } 81734553153SLucas Mateus 
Castro (alqotel) } 81834553153SLucas Mateus Castro (alqotel) } 81934553153SLucas Mateus Castro (alqotel) } 82034553153SLucas Mateus Castro (alqotel) 82134553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 82234553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 82334553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 82434553153SLucas Mateus Castro (alqotel) { 82534553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, false, ger_rank8); 82634553153SLucas Mateus Castro (alqotel) } 82734553153SLucas Mateus Castro (alqotel) 82834553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 82934553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 83034553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 83134553153SLucas Mateus Castro (alqotel) { 83234553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, true, ger_rank8); 83334553153SLucas Mateus Castro (alqotel) } 83434553153SLucas Mateus Castro (alqotel) 83534553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 83634553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 83734553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 83834553153SLucas Mateus Castro (alqotel) { 83934553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, false, ger_rank4); 84034553153SLucas Mateus Castro (alqotel) } 84134553153SLucas Mateus Castro (alqotel) 84234553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 84334553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 84434553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 84534553153SLucas Mateus Castro (alqotel) { 84634553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, true, ger_rank4); 84734553153SLucas Mateus Castro (alqotel) } 84834553153SLucas Mateus Castro (alqotel) 
84934553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 85034553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4SPP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 85134553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 85234553153SLucas Mateus Castro (alqotel) { 85334553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, true, true, ger_rank4); 85434553153SLucas Mateus Castro (alqotel) } 85534553153SLucas Mateus Castro (alqotel) 85634553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 85734553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 85834553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 85934553153SLucas Mateus Castro (alqotel) { 86034553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, false, ger_rank2); 86134553153SLucas Mateus Castro (alqotel) } 86234553153SLucas Mateus Castro (alqotel) 86334553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 86434553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2S(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 86534553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 86634553153SLucas Mateus Castro (alqotel) { 86734553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, true, false, ger_rank2); 86834553153SLucas Mateus Castro (alqotel) } 86934553153SLucas Mateus Castro (alqotel) 87034553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 87134553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 87234553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 87334553153SLucas Mateus Castro (alqotel) { 87434553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, true, ger_rank2); 87534553153SLucas Mateus Castro (alqotel) } 87634553153SLucas Mateus Castro (alqotel) 87734553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 87834553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2SPP(CPUPPCState *env, 
ppc_vsr_t *a, ppc_vsr_t *b, 87934553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 88034553153SLucas Mateus Castro (alqotel) { 88134553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, true, true, ger_rank2); 88234553153SLucas Mateus Castro (alqotel) } 88334553153SLucas Mateus Castro (alqotel) 884fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r) 885fcf5ef2aSThomas Huth { 886fcf5ef2aSThomas Huth target_ulong count = 0; 887fcf5ef2aSThomas Huth int i; 88860594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 88960594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 890fcf5ef2aSThomas Huth break; 891fcf5ef2aSThomas Huth } 892fcf5ef2aSThomas Huth count++; 893fcf5ef2aSThomas Huth } 894fcf5ef2aSThomas Huth return count; 895fcf5ef2aSThomas Huth } 896fcf5ef2aSThomas Huth 897fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r) 898fcf5ef2aSThomas Huth { 899fcf5ef2aSThomas Huth target_ulong count = 0; 900fcf5ef2aSThomas Huth int i; 901fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 90260594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 903fcf5ef2aSThomas Huth break; 904fcf5ef2aSThomas Huth } 905fcf5ef2aSThomas Huth count++; 906fcf5ef2aSThomas Huth } 907fcf5ef2aSThomas Huth return count; 908fcf5ef2aSThomas Huth } 909fcf5ef2aSThomas Huth 910306e4753SLucas Mateus Castro (alqotel) void helper_VMHADDSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 911fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 912fcf5ef2aSThomas Huth { 913fcf5ef2aSThomas Huth int sat = 0; 914fcf5ef2aSThomas Huth int i; 915fcf5ef2aSThomas Huth 916fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 917fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 918fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 919fcf5ef2aSThomas Huth 920fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 921fcf5ef2aSThomas Huth } 922fcf5ef2aSThomas Huth 923fcf5ef2aSThomas Huth if (sat) { 9246175f5a0SRichard Henderson 
set_vscr_sat(env); 925fcf5ef2aSThomas Huth } 926fcf5ef2aSThomas Huth } 927fcf5ef2aSThomas Huth 928306e4753SLucas Mateus Castro (alqotel) void helper_VMHRADDSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 929fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 930fcf5ef2aSThomas Huth { 931fcf5ef2aSThomas Huth int sat = 0; 932fcf5ef2aSThomas Huth int i; 933fcf5ef2aSThomas Huth 934fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 935fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i] + 0x00004000; 936fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 937fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 938fcf5ef2aSThomas Huth } 939fcf5ef2aSThomas Huth 940fcf5ef2aSThomas Huth if (sat) { 9416175f5a0SRichard Henderson set_vscr_sat(env); 942fcf5ef2aSThomas Huth } 943fcf5ef2aSThomas Huth } 944fcf5ef2aSThomas Huth 945dc46167aSLucas Mateus Castro (alqotel) void helper_VMLADDUHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c, 946dc46167aSLucas Mateus Castro (alqotel) uint32_t v) 947fcf5ef2aSThomas Huth { 948fcf5ef2aSThomas Huth int i; 949fcf5ef2aSThomas Huth 950fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 951fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 952fcf5ef2aSThomas Huth r->s16[i] = (int16_t) (prod + c->s16[i]); 953fcf5ef2aSThomas Huth } 954fcf5ef2aSThomas Huth } 955fcf5ef2aSThomas Huth 956d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs) \ 957fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 958fcf5ef2aSThomas Huth { \ 959fcf5ef2aSThomas Huth ppc_avr_t result; \ 960d81c2040SMark Cave-Ayland int i, half = ARRAY_SIZE(r->element) / 2; \ 961fcf5ef2aSThomas Huth \ 962d81c2040SMark Cave-Ayland for (i = 0; i < half; i++) { \ 963d81c2040SMark Cave-Ayland result.access(i * 2 + 0) = a->access(i + ofs); \ 964d81c2040SMark Cave-Ayland result.access(i * 2 + 1) = b->access(i + ofs); \ 965fcf5ef2aSThomas Huth } \ 966fcf5ef2aSThomas Huth *r = result; \ 
967fcf5ef2aSThomas Huth } 968d81c2040SMark Cave-Ayland 969d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access) \ 970d81c2040SMark Cave-Ayland VMRG_DO(mrgl##suffix, element, access, half) \ 971d81c2040SMark Cave-Ayland VMRG_DO(mrgh##suffix, element, access, 0) 972d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB) 973d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH) 974d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW) 975fcf5ef2aSThomas Huth #undef VMRG_DO 976fcf5ef2aSThomas Huth #undef VMRG 977fcf5ef2aSThomas Huth 978b2dc03a5SMatheus Ferst void helper_VMSUMMBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 979fcf5ef2aSThomas Huth { 980fcf5ef2aSThomas Huth int32_t prod[16]; 981fcf5ef2aSThomas Huth int i; 982fcf5ef2aSThomas Huth 983fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s8); i++) { 984fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s8[i] * b->u8[i]; 985fcf5ef2aSThomas Huth } 986fcf5ef2aSThomas Huth 987fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 988fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] + 989fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 990fcf5ef2aSThomas Huth } 991fcf5ef2aSThomas Huth } 992fcf5ef2aSThomas Huth 9936f52f731SMatheus Ferst void helper_VMSUMSHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 994fcf5ef2aSThomas Huth { 995fcf5ef2aSThomas Huth int32_t prod[8]; 996fcf5ef2aSThomas Huth int i; 997fcf5ef2aSThomas Huth 998fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 999fcf5ef2aSThomas Huth prod[i] = a->s16[i] * b->s16[i]; 1000fcf5ef2aSThomas Huth } 1001fcf5ef2aSThomas Huth 1002fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1003fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1004fcf5ef2aSThomas Huth } 1005fcf5ef2aSThomas Huth } 1006fcf5ef2aSThomas Huth 10076f52f731SMatheus Ferst void helper_VMSUMSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1008fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1009fcf5ef2aSThomas Huth { 1010fcf5ef2aSThomas 
Huth int32_t prod[8]; 1011fcf5ef2aSThomas Huth int i; 1012fcf5ef2aSThomas Huth int sat = 0; 1013fcf5ef2aSThomas Huth 1014fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1015fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s16[i] * b->s16[i]; 1016fcf5ef2aSThomas Huth } 1017fcf5ef2aSThomas Huth 1018fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1019fcf5ef2aSThomas Huth int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1020fcf5ef2aSThomas Huth 1021fcf5ef2aSThomas Huth r->u32[i] = cvtsdsw(t, &sat); 1022fcf5ef2aSThomas Huth } 1023fcf5ef2aSThomas Huth 1024fcf5ef2aSThomas Huth if (sat) { 10256175f5a0SRichard Henderson set_vscr_sat(env); 1026fcf5ef2aSThomas Huth } 1027fcf5ef2aSThomas Huth } 1028fcf5ef2aSThomas Huth 1029b2dc03a5SMatheus Ferst void helper_VMSUMUBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1030fcf5ef2aSThomas Huth { 1031fcf5ef2aSThomas Huth uint16_t prod[16]; 1032fcf5ef2aSThomas Huth int i; 1033fcf5ef2aSThomas Huth 1034fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1035fcf5ef2aSThomas Huth prod[i] = a->u8[i] * b->u8[i]; 1036fcf5ef2aSThomas Huth } 1037fcf5ef2aSThomas Huth 1038fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1039fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] + 1040fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1041fcf5ef2aSThomas Huth } 1042fcf5ef2aSThomas Huth } 1043fcf5ef2aSThomas Huth 104489a5a1aeSMatheus Ferst void helper_VMSUMUHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1045fcf5ef2aSThomas Huth { 1046fcf5ef2aSThomas Huth uint32_t prod[8]; 1047fcf5ef2aSThomas Huth int i; 1048fcf5ef2aSThomas Huth 1049fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1050fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1051fcf5ef2aSThomas Huth } 1052fcf5ef2aSThomas Huth 1053fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1054fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1055fcf5ef2aSThomas Huth 
} 1056fcf5ef2aSThomas Huth } 1057fcf5ef2aSThomas Huth 105889a5a1aeSMatheus Ferst void helper_VMSUMUHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1059fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1060fcf5ef2aSThomas Huth { 1061fcf5ef2aSThomas Huth uint32_t prod[8]; 1062fcf5ef2aSThomas Huth int i; 1063fcf5ef2aSThomas Huth int sat = 0; 1064fcf5ef2aSThomas Huth 1065fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1066fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1067fcf5ef2aSThomas Huth } 1068fcf5ef2aSThomas Huth 1069fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1070fcf5ef2aSThomas Huth uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1071fcf5ef2aSThomas Huth 1072fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1073fcf5ef2aSThomas Huth } 1074fcf5ef2aSThomas Huth 1075fcf5ef2aSThomas Huth if (sat) { 10766175f5a0SRichard Henderson set_vscr_sat(env); 1077fcf5ef2aSThomas Huth } 1078fcf5ef2aSThomas Huth } 1079fcf5ef2aSThomas Huth 10804fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast) \ 108180eca687SLucas Mateus Castro (alqotel) void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1082fcf5ef2aSThomas Huth { \ 1083fcf5ef2aSThomas Huth int i; \ 1084fcf5ef2aSThomas Huth \ 10854fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 10864fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i) * \ 10874fbc89edSMark Cave-Ayland (cast)b->mul_access(i); \ 1088fcf5ef2aSThomas Huth } \ 1089fcf5ef2aSThomas Huth } 10904fbc89edSMark Cave-Ayland 10914fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast) \ 109280eca687SLucas Mateus Castro (alqotel) void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 10934fbc89edSMark Cave-Ayland { \ 10944fbc89edSMark Cave-Ayland int i; \ 10954fbc89edSMark Cave-Ayland \ 10964fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 
10974fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) * \ 10984fbc89edSMark Cave-Ayland (cast)b->mul_access(i + 1); \ 10994fbc89edSMark Cave-Ayland } \ 11004fbc89edSMark Cave-Ayland } 11014fbc89edSMark Cave-Ayland 11024fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast) \ 110380eca687SLucas Mateus Castro (alqotel) VMUL_DO_EVN(MULE##suffix, mul_element, mul_access, prod_access, cast) \ 110480eca687SLucas Mateus Castro (alqotel) VMUL_DO_ODD(MULO##suffix, mul_element, mul_access, prod_access, cast) 110580eca687SLucas Mateus Castro (alqotel) VMUL(SB, s8, VsrSB, VsrSH, int16_t) 110680eca687SLucas Mateus Castro (alqotel) VMUL(SH, s16, VsrSH, VsrSW, int32_t) 110780eca687SLucas Mateus Castro (alqotel) VMUL(SW, s32, VsrSW, VsrSD, int64_t) 110880eca687SLucas Mateus Castro (alqotel) VMUL(UB, u8, VsrB, VsrH, uint16_t) 110980eca687SLucas Mateus Castro (alqotel) VMUL(UH, u16, VsrH, VsrW, uint32_t) 111080eca687SLucas Mateus Castro (alqotel) VMUL(UW, u32, VsrW, VsrD, uint64_t) 11114fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN 11124fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD 1113fcf5ef2aSThomas Huth #undef VMUL 1114fcf5ef2aSThomas Huth 111541c2877fSMatheus Ferst void helper_XXPERMX(ppc_vsr_t *t, ppc_vsr_t *s0, ppc_vsr_t *s1, ppc_vsr_t *pcv, 111641c2877fSMatheus Ferst target_ulong uim) 111741c2877fSMatheus Ferst { 111841c2877fSMatheus Ferst int i, idx; 111941c2877fSMatheus Ferst ppc_vsr_t tmp = { .u64 = {0, 0} }; 112041c2877fSMatheus Ferst 112141c2877fSMatheus Ferst for (i = 0; i < ARRAY_SIZE(t->u8); i++) { 112241c2877fSMatheus Ferst if ((pcv->VsrB(i) >> 5) == uim) { 112341c2877fSMatheus Ferst idx = pcv->VsrB(i) & 0x1f; 112441c2877fSMatheus Ferst if (idx < ARRAY_SIZE(t->u8)) { 112541c2877fSMatheus Ferst tmp.VsrB(i) = s0->VsrB(idx); 112641c2877fSMatheus Ferst } else { 112741c2877fSMatheus Ferst tmp.VsrB(i) = s1->VsrB(idx - ARRAY_SIZE(t->u8)); 112841c2877fSMatheus Ferst } 112941c2877fSMatheus Ferst } 113041c2877fSMatheus 
Ferst } 113141c2877fSMatheus Ferst 113241c2877fSMatheus Ferst *t = tmp; 113341c2877fSMatheus Ferst } 113441c2877fSMatheus Ferst 11351700f2bfSLucas Mateus Castro (alqotel) void helper_VDIVSQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 11361700f2bfSLucas Mateus Castro (alqotel) { 11371700f2bfSLucas Mateus Castro (alqotel) Int128 neg1 = int128_makes64(-1); 11381700f2bfSLucas Mateus Castro (alqotel) Int128 int128_min = int128_make128(0, INT64_MIN); 11391700f2bfSLucas Mateus Castro (alqotel) if (likely(int128_nz(b->s128) && 11401700f2bfSLucas Mateus Castro (alqotel) (int128_ne(a->s128, int128_min) || int128_ne(b->s128, neg1)))) { 11411700f2bfSLucas Mateus Castro (alqotel) t->s128 = int128_divs(a->s128, b->s128); 11421700f2bfSLucas Mateus Castro (alqotel) } else { 11431700f2bfSLucas Mateus Castro (alqotel) t->s128 = a->s128; /* Undefined behavior */ 11441700f2bfSLucas Mateus Castro (alqotel) } 11451700f2bfSLucas Mateus Castro (alqotel) } 11461700f2bfSLucas Mateus Castro (alqotel) 11471700f2bfSLucas Mateus Castro (alqotel) void helper_VDIVUQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 11481700f2bfSLucas Mateus Castro (alqotel) { 11491700f2bfSLucas Mateus Castro (alqotel) if (int128_nz(b->s128)) { 11501700f2bfSLucas Mateus Castro (alqotel) t->s128 = int128_divu(a->s128, b->s128); 11511700f2bfSLucas Mateus Castro (alqotel) } else { 11521700f2bfSLucas Mateus Castro (alqotel) t->s128 = a->s128; /* Undefined behavior */ 11531700f2bfSLucas Mateus Castro (alqotel) } 11541700f2bfSLucas Mateus Castro (alqotel) } 11551700f2bfSLucas Mateus Castro (alqotel) 1156a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVESD(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1157a173ba88SLucas Mateus Castro (alqotel) { 1158a173ba88SLucas Mateus Castro (alqotel) int i; 1159a173ba88SLucas Mateus Castro (alqotel) int64_t high; 1160a173ba88SLucas Mateus Castro (alqotel) uint64_t low; 1161a173ba88SLucas Mateus Castro (alqotel) for (i = 0; i < 2; i++) { 1162a173ba88SLucas Mateus Castro (alqotel) high = 
a->s64[i]; 1163a173ba88SLucas Mateus Castro (alqotel) low = 0; 1164a173ba88SLucas Mateus Castro (alqotel) if (unlikely((high == INT64_MIN && b->s64[i] == -1) || !b->s64[i])) { 1165a173ba88SLucas Mateus Castro (alqotel) t->s64[i] = a->s64[i]; /* Undefined behavior */ 1166a173ba88SLucas Mateus Castro (alqotel) } else { 1167a173ba88SLucas Mateus Castro (alqotel) divs128(&low, &high, b->s64[i]); 1168a173ba88SLucas Mateus Castro (alqotel) t->s64[i] = low; 1169a173ba88SLucas Mateus Castro (alqotel) } 1170a173ba88SLucas Mateus Castro (alqotel) } 1171a173ba88SLucas Mateus Castro (alqotel) } 1172a173ba88SLucas Mateus Castro (alqotel) 1173a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVEUD(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1174a173ba88SLucas Mateus Castro (alqotel) { 1175a173ba88SLucas Mateus Castro (alqotel) int i; 1176a173ba88SLucas Mateus Castro (alqotel) uint64_t high, low; 1177a173ba88SLucas Mateus Castro (alqotel) for (i = 0; i < 2; i++) { 1178a173ba88SLucas Mateus Castro (alqotel) high = a->u64[i]; 1179a173ba88SLucas Mateus Castro (alqotel) low = 0; 1180a173ba88SLucas Mateus Castro (alqotel) if (unlikely(!b->u64[i])) { 1181a173ba88SLucas Mateus Castro (alqotel) t->u64[i] = a->u64[i]; /* Undefined behavior */ 1182a173ba88SLucas Mateus Castro (alqotel) } else { 1183a173ba88SLucas Mateus Castro (alqotel) divu128(&low, &high, b->u64[i]); 1184a173ba88SLucas Mateus Castro (alqotel) t->u64[i] = low; 1185a173ba88SLucas Mateus Castro (alqotel) } 1186a173ba88SLucas Mateus Castro (alqotel) } 1187a173ba88SLucas Mateus Castro (alqotel) } 1188a173ba88SLucas Mateus Castro (alqotel) 1189a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVESQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1190a173ba88SLucas Mateus Castro (alqotel) { 1191a173ba88SLucas Mateus Castro (alqotel) Int128 high, low; 1192a173ba88SLucas Mateus Castro (alqotel) Int128 int128_min = int128_make128(0, INT64_MIN); 1193a173ba88SLucas Mateus Castro (alqotel) Int128 neg1 = int128_makes64(-1); 
1194a173ba88SLucas Mateus Castro (alqotel) 1195a173ba88SLucas Mateus Castro (alqotel) high = a->s128; 1196a173ba88SLucas Mateus Castro (alqotel) low = int128_zero(); 1197a173ba88SLucas Mateus Castro (alqotel) if (unlikely(!int128_nz(b->s128) || 1198a173ba88SLucas Mateus Castro (alqotel) (int128_eq(b->s128, neg1) && int128_eq(high, int128_min)))) { 1199a173ba88SLucas Mateus Castro (alqotel) t->s128 = a->s128; /* Undefined behavior */ 1200a173ba88SLucas Mateus Castro (alqotel) } else { 1201a173ba88SLucas Mateus Castro (alqotel) divs256(&low, &high, b->s128); 1202a173ba88SLucas Mateus Castro (alqotel) t->s128 = low; 1203a173ba88SLucas Mateus Castro (alqotel) } 1204a173ba88SLucas Mateus Castro (alqotel) } 1205a173ba88SLucas Mateus Castro (alqotel) 1206a173ba88SLucas Mateus Castro (alqotel) void helper_VDIVEUQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1207a173ba88SLucas Mateus Castro (alqotel) { 1208a173ba88SLucas Mateus Castro (alqotel) Int128 high, low; 1209a173ba88SLucas Mateus Castro (alqotel) 1210a173ba88SLucas Mateus Castro (alqotel) high = a->s128; 1211a173ba88SLucas Mateus Castro (alqotel) low = int128_zero(); 1212a173ba88SLucas Mateus Castro (alqotel) if (unlikely(!int128_nz(b->s128))) { 1213a173ba88SLucas Mateus Castro (alqotel) t->s128 = a->s128; /* Undefined behavior */ 1214a173ba88SLucas Mateus Castro (alqotel) } else { 1215a173ba88SLucas Mateus Castro (alqotel) divu256(&low, &high, b->s128); 1216a173ba88SLucas Mateus Castro (alqotel) t->s128 = low; 1217a173ba88SLucas Mateus Castro (alqotel) } 1218a173ba88SLucas Mateus Castro (alqotel) } 1219a173ba88SLucas Mateus Castro (alqotel) 1220b80bec3aSLucas Mateus Castro (alqotel) void helper_VMODSQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1221b80bec3aSLucas Mateus Castro (alqotel) { 1222b80bec3aSLucas Mateus Castro (alqotel) Int128 neg1 = int128_makes64(-1); 1223b80bec3aSLucas Mateus Castro (alqotel) Int128 int128_min = int128_make128(0, INT64_MIN); 1224b80bec3aSLucas Mateus Castro (alqotel) if 
(likely(int128_nz(b->s128) && 1225b80bec3aSLucas Mateus Castro (alqotel) (int128_ne(a->s128, int128_min) || int128_ne(b->s128, neg1)))) { 1226b80bec3aSLucas Mateus Castro (alqotel) t->s128 = int128_rems(a->s128, b->s128); 1227b80bec3aSLucas Mateus Castro (alqotel) } else { 1228b80bec3aSLucas Mateus Castro (alqotel) t->s128 = int128_zero(); /* Undefined behavior */ 1229b80bec3aSLucas Mateus Castro (alqotel) } 1230b80bec3aSLucas Mateus Castro (alqotel) } 1231b80bec3aSLucas Mateus Castro (alqotel) 1232b80bec3aSLucas Mateus Castro (alqotel) void helper_VMODUQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1233b80bec3aSLucas Mateus Castro (alqotel) { 1234b80bec3aSLucas Mateus Castro (alqotel) if (likely(int128_nz(b->s128))) { 1235b80bec3aSLucas Mateus Castro (alqotel) t->s128 = int128_remu(a->s128, b->s128); 1236b80bec3aSLucas Mateus Castro (alqotel) } else { 1237b80bec3aSLucas Mateus Castro (alqotel) t->s128 = int128_zero(); /* Undefined behavior */ 1238b80bec3aSLucas Mateus Castro (alqotel) } 1239b80bec3aSLucas Mateus Castro (alqotel) } 1240b80bec3aSLucas Mateus Castro (alqotel) 124128347fe2SMatheus Ferst void helper_VPERM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1242fcf5ef2aSThomas Huth { 1243fcf5ef2aSThomas Huth ppc_avr_t result; 1244fcf5ef2aSThomas Huth int i; 1245fcf5ef2aSThomas Huth 124660594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 124760594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1248fcf5ef2aSThomas Huth int index = s & 0xf; 1249fcf5ef2aSThomas Huth 1250fcf5ef2aSThomas Huth if (s & 0x10) { 125160594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1252fcf5ef2aSThomas Huth } else { 125360594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1254fcf5ef2aSThomas Huth } 1255fcf5ef2aSThomas Huth } 1256fcf5ef2aSThomas Huth *r = result; 1257fcf5ef2aSThomas Huth } 1258fcf5ef2aSThomas Huth 125928347fe2SMatheus Ferst void helper_VPERMR(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1260fcf5ef2aSThomas Huth { 
1261fcf5ef2aSThomas Huth ppc_avr_t result; 1262fcf5ef2aSThomas Huth int i; 1263fcf5ef2aSThomas Huth 126460594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 126560594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1266fcf5ef2aSThomas Huth int index = 15 - (s & 0xf); 1267fcf5ef2aSThomas Huth 1268fcf5ef2aSThomas Huth if (s & 0x10) { 126960594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1270fcf5ef2aSThomas Huth } else { 127160594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1272fcf5ef2aSThomas Huth } 1273fcf5ef2aSThomas Huth } 1274fcf5ef2aSThomas Huth *r = result; 1275fcf5ef2aSThomas Huth } 1276fcf5ef2aSThomas Huth 1277618574ddSMatheus Ferst #define XXGENPCV_BE_EXP(NAME, SZ) \ 1278b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _be_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \ 1279b090f4f1SMatheus Ferst { \ 1280b090f4f1SMatheus Ferst ppc_vsr_t tmp; \ 1281b090f4f1SMatheus Ferst \ 1282b090f4f1SMatheus Ferst /* Initialize tmp with the result of an all-zeros mask */ \ 1283b090f4f1SMatheus Ferst tmp.VsrD(0) = 0x1011121314151617; \ 1284b090f4f1SMatheus Ferst tmp.VsrD(1) = 0x18191A1B1C1D1E1F; \ 1285b090f4f1SMatheus Ferst \ 1286b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1287b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1288b090f4f1SMatheus Ferst if (b->VsrB(i) & 0x80) { \ 1289b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1290b090f4f1SMatheus Ferst for (int k = 0; k < SZ; k++) { \ 1291b090f4f1SMatheus Ferst tmp.VsrB(i + k) = j + k; \ 1292b090f4f1SMatheus Ferst } \ 1293b090f4f1SMatheus Ferst j += SZ; \ 1294b090f4f1SMatheus Ferst } \ 1295b090f4f1SMatheus Ferst } \ 1296b090f4f1SMatheus Ferst \ 1297b090f4f1SMatheus Ferst *t = tmp; \ 1298618574ddSMatheus Ferst } 1299618574ddSMatheus Ferst 1300618574ddSMatheus Ferst #define XXGENPCV_BE_COMP(NAME, SZ) \ 1301b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _be_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\ 
1302b090f4f1SMatheus Ferst { \ 1303b090f4f1SMatheus Ferst ppc_vsr_t tmp = { .u64 = { 0, 0 } }; \ 1304b090f4f1SMatheus Ferst \ 1305b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1306b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1307b090f4f1SMatheus Ferst if (b->VsrB(i) & 0x80) { \ 1308b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1309b090f4f1SMatheus Ferst for (int k = 0; k < SZ; k++) { \ 1310b090f4f1SMatheus Ferst tmp.VsrB(j + k) = i + k; \ 1311b090f4f1SMatheus Ferst } \ 1312b090f4f1SMatheus Ferst j += SZ; \ 1313b090f4f1SMatheus Ferst } \ 1314b090f4f1SMatheus Ferst } \ 1315b090f4f1SMatheus Ferst \ 1316b090f4f1SMatheus Ferst *t = tmp; \ 1317618574ddSMatheus Ferst } 1318618574ddSMatheus Ferst 1319618574ddSMatheus Ferst #define XXGENPCV_LE_EXP(NAME, SZ) \ 1320b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _le_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \ 1321b090f4f1SMatheus Ferst { \ 1322b090f4f1SMatheus Ferst ppc_vsr_t tmp; \ 1323b090f4f1SMatheus Ferst \ 1324b090f4f1SMatheus Ferst /* Initialize tmp with the result of an all-zeros mask */ \ 1325b090f4f1SMatheus Ferst tmp.VsrD(0) = 0x1F1E1D1C1B1A1918; \ 1326b090f4f1SMatheus Ferst tmp.VsrD(1) = 0x1716151413121110; \ 1327b090f4f1SMatheus Ferst \ 1328b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1329b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1330b090f4f1SMatheus Ferst /* Reverse indexing of "i" */ \ 1331b090f4f1SMatheus Ferst const int idx = ARRAY_SIZE(b->u8) - i - SZ; \ 1332b090f4f1SMatheus Ferst if (b->VsrB(idx) & 0x80) { \ 1333b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1334b090f4f1SMatheus Ferst for (int k = 0, rk = SZ - 1; k < SZ; k++, rk--) { \ 1335b090f4f1SMatheus Ferst tmp.VsrB(idx + rk) = j + k; \ 1336b090f4f1SMatheus Ferst } \ 1337b090f4f1SMatheus Ferst j += SZ; \ 1338b090f4f1SMatheus Ferst } \ 1339b090f4f1SMatheus Ferst } \ 
1340b090f4f1SMatheus Ferst \ 1341b090f4f1SMatheus Ferst *t = tmp; \ 1342618574ddSMatheus Ferst } 1343618574ddSMatheus Ferst 1344618574ddSMatheus Ferst #define XXGENPCV_LE_COMP(NAME, SZ) \ 1345b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _le_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\ 1346b090f4f1SMatheus Ferst { \ 1347b090f4f1SMatheus Ferst ppc_vsr_t tmp = { .u64 = { 0, 0 } }; \ 1348b090f4f1SMatheus Ferst \ 1349b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1350b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1351b090f4f1SMatheus Ferst if (b->VsrB(ARRAY_SIZE(b->u8) - i - SZ) & 0x80) { \ 1352b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1353b090f4f1SMatheus Ferst for (int k = 0, rk = SZ - 1; k < SZ; k++, rk--) { \ 1354b090f4f1SMatheus Ferst /* Reverse indexing of "j" */ \ 1355b090f4f1SMatheus Ferst const int idx = ARRAY_SIZE(b->u8) - j - SZ; \ 1356b090f4f1SMatheus Ferst tmp.VsrB(idx + rk) = i + k; \ 1357b090f4f1SMatheus Ferst } \ 1358b090f4f1SMatheus Ferst j += SZ; \ 1359b090f4f1SMatheus Ferst } \ 1360b090f4f1SMatheus Ferst } \ 1361b090f4f1SMatheus Ferst \ 1362b090f4f1SMatheus Ferst *t = tmp; \ 1363b090f4f1SMatheus Ferst } 1364b090f4f1SMatheus Ferst 1365618574ddSMatheus Ferst #define XXGENPCV(NAME, SZ) \ 1366618574ddSMatheus Ferst XXGENPCV_BE_EXP(NAME, SZ) \ 1367618574ddSMatheus Ferst XXGENPCV_BE_COMP(NAME, SZ) \ 1368618574ddSMatheus Ferst XXGENPCV_LE_EXP(NAME, SZ) \ 1369618574ddSMatheus Ferst XXGENPCV_LE_COMP(NAME, SZ) \ 1370618574ddSMatheus Ferst 1371b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVBM, 1) 1372b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVHM, 2) 1373b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVWM, 4) 1374b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVDM, 8) 1375618574ddSMatheus Ferst 1376618574ddSMatheus Ferst #undef XXGENPCV_BE_EXP 1377618574ddSMatheus Ferst #undef XXGENPCV_BE_COMP 1378618574ddSMatheus Ferst #undef XXGENPCV_LE_EXP 1379618574ddSMatheus Ferst #undef XXGENPCV_LE_COMP 
1380b090f4f1SMatheus Ferst #undef XXGENPCV 1381b090f4f1SMatheus Ferst 1382e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1383fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)]) 1384fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (i) 1385fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) != 0) 1386fcf5ef2aSThomas Huth #else 1387fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)]) 1388fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (1 - i) 1389fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) == 0) 1390fcf5ef2aSThomas Huth #endif 13918f7d41e0SMatheus Ferst #define EXTRACT_BIT(avr, i, index) \ 13928f7d41e0SMatheus Ferst (extract64((avr)->VsrD(i), 63 - index, 1)) 1393fcf5ef2aSThomas Huth 1394fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1395fcf5ef2aSThomas Huth { 1396fcf5ef2aSThomas Huth int i, j; 1397fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 1398fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1399fcf5ef2aSThomas Huth for (j = 0; j < 8; j++) { 1400fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, (i * 8) + j); 1401fcf5ef2aSThomas Huth if (index < 64 && EXTRACT_BIT(a, i, index)) { 1402fcf5ef2aSThomas Huth result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j); 1403fcf5ef2aSThomas Huth } 1404fcf5ef2aSThomas Huth } 1405fcf5ef2aSThomas Huth } 1406fcf5ef2aSThomas Huth *r = result; 1407fcf5ef2aSThomas Huth } 1408fcf5ef2aSThomas Huth 1409fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1410fcf5ef2aSThomas Huth { 1411fcf5ef2aSThomas Huth int i; 1412fcf5ef2aSThomas Huth uint64_t perm = 0; 1413fcf5ef2aSThomas Huth 1414fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1415fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, i); 1416fcf5ef2aSThomas Huth 1417fcf5ef2aSThomas Huth if (index < 128) { 1418fcf5ef2aSThomas Huth uint64_t mask = (1ull << (63 - (index & 0x3F))); 1419fcf5ef2aSThomas Huth if (a->u64[VBPERMQ_DW(index)] & mask) { 
1420fcf5ef2aSThomas Huth perm |= (0x8000 >> i); 1421fcf5ef2aSThomas Huth } 1422fcf5ef2aSThomas Huth } 1423fcf5ef2aSThomas Huth } 1424fcf5ef2aSThomas Huth 14253c385a93SMark Cave-Ayland r->VsrD(0) = perm; 14263c385a93SMark Cave-Ayland r->VsrD(1) = 0; 1427fcf5ef2aSThomas Huth } 1428fcf5ef2aSThomas Huth 1429fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX 1430fcf5ef2aSThomas Huth #undef VBPERMQ_DW 1431fcf5ef2aSThomas Huth 1432fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp) \ 1433fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1434fcf5ef2aSThomas Huth { \ 1435fcf5ef2aSThomas Huth int i, j; \ 1436fcf5ef2aSThomas Huth trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])]; \ 1437fcf5ef2aSThomas Huth \ 1438fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, srcfld) { \ 1439fcf5ef2aSThomas Huth prod[i] = 0; \ 1440fcf5ef2aSThomas Huth for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) { \ 1441fcf5ef2aSThomas Huth if (a->srcfld[i] & (1ull << j)) { \ 1442fcf5ef2aSThomas Huth prod[i] ^= ((trgtyp)b->srcfld[i] << j); \ 1443fcf5ef2aSThomas Huth } \ 1444fcf5ef2aSThomas Huth } \ 1445fcf5ef2aSThomas Huth } \ 1446fcf5ef2aSThomas Huth \ 1447fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, trgfld) { \ 1448fcf5ef2aSThomas Huth r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1]; \ 1449fcf5ef2aSThomas Huth } \ 1450fcf5ef2aSThomas Huth } 1451fcf5ef2aSThomas Huth 1452fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t) 1453fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t) 1454fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t) 1455fcf5ef2aSThomas Huth 1456e82ca8acSMatheus Ferst void helper_VPMSUMD(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1457fcf5ef2aSThomas Huth { 1458fcf5ef2aSThomas Huth int i, j; 1459e82ca8acSMatheus Ferst Int128 tmp, prod[2] = {int128_zero(), int128_zero()}; 1460fcf5ef2aSThomas Huth 1461fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1462e82ca8acSMatheus Ferst for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 1463e82ca8acSMatheus Ferst if 
(a->VsrD(i) & (1ull << j)) { 1464e82ca8acSMatheus Ferst tmp = int128_make64(b->VsrD(i)); 1465e82ca8acSMatheus Ferst tmp = int128_lshift(tmp, j); 1466e82ca8acSMatheus Ferst prod[i] = int128_xor(prod[i], tmp); 1467fcf5ef2aSThomas Huth } 1468fcf5ef2aSThomas Huth } 1469fcf5ef2aSThomas Huth } 1470fcf5ef2aSThomas Huth 1471e82ca8acSMatheus Ferst r->s128 = int128_xor(prod[0], prod[1]); 1472fcf5ef2aSThomas Huth } 1473fcf5ef2aSThomas Huth 1474e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1475fcf5ef2aSThomas Huth #define PKBIG 1 1476fcf5ef2aSThomas Huth #else 1477fcf5ef2aSThomas Huth #define PKBIG 0 1478fcf5ef2aSThomas Huth #endif 1479fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1480fcf5ef2aSThomas Huth { 1481fcf5ef2aSThomas Huth int i, j; 1482fcf5ef2aSThomas Huth ppc_avr_t result; 1483e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1484fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { a, b }; 1485fcf5ef2aSThomas Huth #else 1486fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { b, a }; 1487fcf5ef2aSThomas Huth #endif 1488fcf5ef2aSThomas Huth 1489fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1490fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(j, u32) { 1491fcf5ef2aSThomas Huth uint32_t e = x[i]->u32[j]; 1492fcf5ef2aSThomas Huth 1493fcf5ef2aSThomas Huth result.u16[4 * i + j] = (((e >> 9) & 0xfc00) | 1494fcf5ef2aSThomas Huth ((e >> 6) & 0x3e0) | 1495fcf5ef2aSThomas Huth ((e >> 3) & 0x1f)); 1496fcf5ef2aSThomas Huth } 1497fcf5ef2aSThomas Huth } 1498fcf5ef2aSThomas Huth *r = result; 1499fcf5ef2aSThomas Huth } 1500fcf5ef2aSThomas Huth 1501fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat) \ 1502fcf5ef2aSThomas Huth void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1503fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 1504fcf5ef2aSThomas Huth { \ 1505fcf5ef2aSThomas Huth int i; \ 1506fcf5ef2aSThomas Huth int sat = 0; \ 1507fcf5ef2aSThomas Huth ppc_avr_t result; \ 1508fcf5ef2aSThomas Huth ppc_avr_t *a0 = PKBIG ? 
a : b; \ 1509fcf5ef2aSThomas Huth ppc_avr_t *a1 = PKBIG ? b : a; \ 1510fcf5ef2aSThomas Huth \ 1511fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, from) { \ 1512fcf5ef2aSThomas Huth result.to[i] = cvt(a0->from[i], &sat); \ 1513fcf5ef2aSThomas Huth result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\ 1514fcf5ef2aSThomas Huth } \ 1515fcf5ef2aSThomas Huth *r = result; \ 1516fcf5ef2aSThomas Huth if (dosat && sat) { \ 15176175f5a0SRichard Henderson set_vscr_sat(env); \ 1518fcf5ef2aSThomas Huth } \ 1519fcf5ef2aSThomas Huth } 1520fcf5ef2aSThomas Huth #define I(x, y) (x) 1521fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1) 1522fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1) 1523fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1) 1524fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1) 1525fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1) 1526fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1) 1527fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1) 1528fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1) 1529fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1) 1530fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0) 1531fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0) 1532fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0) 1533fcf5ef2aSThomas Huth #undef I 1534fcf5ef2aSThomas Huth #undef VPK 1535fcf5ef2aSThomas Huth #undef PKBIG 1536fcf5ef2aSThomas Huth 1537fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1538fcf5ef2aSThomas Huth { 1539fcf5ef2aSThomas Huth int i; 1540fcf5ef2aSThomas Huth 154105ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 154205ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status); 1543fcf5ef2aSThomas Huth } 1544fcf5ef2aSThomas Huth } 1545fcf5ef2aSThomas Huth 1546fcf5ef2aSThomas Huth #define VRFI(suffix, rounding) \ 1547fcf5ef2aSThomas Huth void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1548fcf5ef2aSThomas Huth ppc_avr_t *b) \ 1549fcf5ef2aSThomas Huth 
{ \ 1550fcf5ef2aSThomas Huth int i; \ 1551fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 1552fcf5ef2aSThomas Huth \ 1553fcf5ef2aSThomas Huth set_float_rounding_mode(rounding, &s); \ 155405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 155505ee3e8aSMark Cave-Ayland r->f32[i] = float32_round_to_int (b->f32[i], &s); \ 1556fcf5ef2aSThomas Huth } \ 1557fcf5ef2aSThomas Huth } 1558fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even) 1559fcf5ef2aSThomas Huth VRFI(m, float_round_down) 1560fcf5ef2aSThomas Huth VRFI(p, float_round_up) 1561fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero) 1562fcf5ef2aSThomas Huth #undef VRFI 1563fcf5ef2aSThomas Huth 1564fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1565fcf5ef2aSThomas Huth { 1566fcf5ef2aSThomas Huth int i; 1567fcf5ef2aSThomas Huth 156805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 156905ee3e8aSMark Cave-Ayland float32 t = float32_sqrt(b->f32[i], &env->vec_status); 1570fcf5ef2aSThomas Huth 157105ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, t, &env->vec_status); 1572fcf5ef2aSThomas Huth } 1573fcf5ef2aSThomas Huth } 1574fcf5ef2aSThomas Huth 1575fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert) \ 157602c74f0eSMatheus Ferst void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \ 1577fcf5ef2aSThomas Huth { \ 1578fcf5ef2aSThomas Huth int i; \ 1579fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1580fcf5ef2aSThomas Huth uint##size##_t src1 = a->element[i]; \ 1581fcf5ef2aSThomas Huth uint##size##_t src2 = b->element[i]; \ 1582fcf5ef2aSThomas Huth uint##size##_t src3 = r->element[i]; \ 1583fcf5ef2aSThomas Huth uint##size##_t begin, end, shift, mask, rot_val; \ 1584fcf5ef2aSThomas Huth \ 1585fcf5ef2aSThomas Huth shift = extract##size(src2, 0, 6); \ 1586fcf5ef2aSThomas Huth end = extract##size(src2, 8, 6); \ 1587fcf5ef2aSThomas Huth begin = extract##size(src2, 16, 6); \ 
1588fcf5ef2aSThomas Huth rot_val = rol##size(src1, shift); \ 1589fcf5ef2aSThomas Huth mask = mask_u##size(begin, end); \ 1590fcf5ef2aSThomas Huth if (insert) { \ 1591fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask) | (src3 & ~mask); \ 1592fcf5ef2aSThomas Huth } else { \ 1593fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask); \ 1594fcf5ef2aSThomas Huth } \ 1595fcf5ef2aSThomas Huth } \ 1596fcf5ef2aSThomas Huth } 1597fcf5ef2aSThomas Huth 159802c74f0eSMatheus Ferst VRLMI(VRLDMI, 64, u64, 1); 159902c74f0eSMatheus Ferst VRLMI(VRLWMI, 32, u32, 1); 160002c74f0eSMatheus Ferst VRLMI(VRLDNM, 64, u64, 0); 160102c74f0eSMatheus Ferst VRLMI(VRLWNM, 32, u32, 0); 1602fcf5ef2aSThomas Huth 1603fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1604fcf5ef2aSThomas Huth { 1605fcf5ef2aSThomas Huth int i; 1606fcf5ef2aSThomas Huth 160705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 160805ee3e8aSMark Cave-Ayland r->f32[i] = float32_exp2(b->f32[i], &env->vec_status); 1609fcf5ef2aSThomas Huth } 1610fcf5ef2aSThomas Huth } 1611fcf5ef2aSThomas Huth 1612fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1613fcf5ef2aSThomas Huth { 1614fcf5ef2aSThomas Huth int i; 1615fcf5ef2aSThomas Huth 161605ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 161705ee3e8aSMark Cave-Ayland r->f32[i] = float32_log2(b->f32[i], &env->vec_status); 1618fcf5ef2aSThomas Huth } 1619fcf5ef2aSThomas Huth } 1620fcf5ef2aSThomas Huth 162160caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 162260caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 162360caf221SAvinesh Kumar { \ 1624f297c4c6SMatheus Ferst int index = (a & 0xf) * 8; \ 162560caf221SAvinesh Kumar if (left) { \ 1626f297c4c6SMatheus Ferst index = 128 - index - size; \ 162760caf221SAvinesh Kumar } \ 162860caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 162960caf221SAvinesh Kumar 
MAKE_64BIT_MASK(0, size); \ 163060caf221SAvinesh Kumar } 163160caf221SAvinesh Kumar VEXTU_X_DO(vextublx, 8, 1) 163260caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1) 163360caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1) 163460caf221SAvinesh Kumar VEXTU_X_DO(vextubrx, 8, 0) 163560caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0) 163660caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0) 163760caf221SAvinesh Kumar #undef VEXTU_X_DO 163860caf221SAvinesh Kumar 1639fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1640fcf5ef2aSThomas Huth { 1641fcf5ef2aSThomas Huth int i; 1642fcf5ef2aSThomas Huth unsigned int shift, bytes, size; 1643fcf5ef2aSThomas Huth 1644fcf5ef2aSThomas Huth size = ARRAY_SIZE(r->u8); 1645fcf5ef2aSThomas Huth for (i = 0; i < size; i++) { 164663be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 164763be02fcSAnton Blanchard bytes = (a->VsrB(i) << 8) + /* extract adjacent bytes */ 164863be02fcSAnton Blanchard (((i + 1) < size) ? a->VsrB(i + 1) : 0); 164963be02fcSAnton Blanchard r->VsrB(i) = (bytes << shift) >> 8; /* shift and store result */ 1650fcf5ef2aSThomas Huth } 1651fcf5ef2aSThomas Huth } 1652fcf5ef2aSThomas Huth 1653fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1654fcf5ef2aSThomas Huth { 1655fcf5ef2aSThomas Huth int i; 1656fcf5ef2aSThomas Huth unsigned int shift, bytes; 1657fcf5ef2aSThomas Huth 1658b6cb41b2SDavid Gibson /* 1659b6cb41b2SDavid Gibson * Use reverse order, as destination and source register can be 1660b6cb41b2SDavid Gibson * same. Its being modified in place saving temporary, reverse 1661b6cb41b2SDavid Gibson * order will guarantee that computed result is not fed back. 1662fcf5ef2aSThomas Huth */ 1663fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 166463be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 166563be02fcSAnton Blanchard bytes = ((i ? 
a->VsrB(i - 1) : 0) << 8) + a->VsrB(i); 1666fcf5ef2aSThomas Huth /* extract adjacent bytes */ 166763be02fcSAnton Blanchard r->VsrB(i) = (bytes >> shift) & 0xFF; /* shift and store result */ 1668fcf5ef2aSThomas Huth } 1669fcf5ef2aSThomas Huth } 1670fcf5ef2aSThomas Huth 1671fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift) 1672fcf5ef2aSThomas Huth { 1673fcf5ef2aSThomas Huth int sh = shift & 0xf; 1674fcf5ef2aSThomas Huth int i; 1675fcf5ef2aSThomas Huth ppc_avr_t result; 1676fcf5ef2aSThomas Huth 1677fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1678fcf5ef2aSThomas Huth int index = sh + i; 1679fcf5ef2aSThomas Huth if (index > 0xf) { 168060594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index - 0x10); 1681fcf5ef2aSThomas Huth } else { 168260594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1683fcf5ef2aSThomas Huth } 1684fcf5ef2aSThomas Huth } 1685fcf5ef2aSThomas Huth *r = result; 1686fcf5ef2aSThomas Huth } 1687fcf5ef2aSThomas Huth 1688fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1689fcf5ef2aSThomas Huth { 16903c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1691fcf5ef2aSThomas Huth 1692e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1693fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1694fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1695fcf5ef2aSThomas Huth #else 1696fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1697fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1698fcf5ef2aSThomas Huth #endif 1699fcf5ef2aSThomas Huth } 1700fcf5ef2aSThomas Huth 1701e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 17022cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[IDX]) 17032cc12af3SMatheus Ferst #else 17042cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[15 - (IDX)] - (SIZE) + 1) 17052cc12af3SMatheus Ferst #endif 17062cc12af3SMatheus Ferst 17072cc12af3SMatheus Ferst #define VINSX(SUFFIX, TYPE) \ 
17082cc12af3SMatheus Ferst void glue(glue(helper_VINS, SUFFIX), LX)(CPUPPCState *env, ppc_avr_t *t, \ 17092cc12af3SMatheus Ferst uint64_t val, target_ulong index) \ 17102cc12af3SMatheus Ferst { \ 17112cc12af3SMatheus Ferst const int maxidx = ARRAY_SIZE(t->u8) - sizeof(TYPE); \ 17122cc12af3SMatheus Ferst target_long idx = index; \ 17132cc12af3SMatheus Ferst \ 17142cc12af3SMatheus Ferst if (idx < 0 || idx > maxidx) { \ 17152cc12af3SMatheus Ferst idx = idx < 0 ? sizeof(TYPE) - idx : idx; \ 17162cc12af3SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, \ 17172cc12af3SMatheus Ferst "Invalid index for Vector Insert Element after 0x" TARGET_FMT_lx \ 17182cc12af3SMatheus Ferst ", RA = " TARGET_FMT_ld " > %d\n", env->nip, idx, maxidx); \ 17192cc12af3SMatheus Ferst } else { \ 17202cc12af3SMatheus Ferst TYPE src = val; \ 17212cc12af3SMatheus Ferst memcpy(ELEM_ADDR(t, idx, sizeof(TYPE)), &src, sizeof(TYPE)); \ 17222cc12af3SMatheus Ferst } \ 17232cc12af3SMatheus Ferst } 17242cc12af3SMatheus Ferst VINSX(B, uint8_t) 17252cc12af3SMatheus Ferst VINSX(H, uint16_t) 17262cc12af3SMatheus Ferst VINSX(W, uint32_t) 17272cc12af3SMatheus Ferst VINSX(D, uint64_t) 17282cc12af3SMatheus Ferst #undef ELEM_ADDR 17292cc12af3SMatheus Ferst #undef VINSX 1730e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 173128110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \ 173228110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 173328110b72SMatheus Ferst target_ulong index) \ 173428110b72SMatheus Ferst { \ 173528110b72SMatheus Ferst const target_long idx = index; \ 173628110b72SMatheus Ferst ppc_avr_t tmp[2] = { *a, *b }; \ 173728110b72SMatheus Ferst memset(t, 0, sizeof(*t)); \ 173828110b72SMatheus Ferst if (idx >= 0 && idx + SIZE <= sizeof(tmp)) { \ 173928110b72SMatheus Ferst memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2 - SIZE], (void *)tmp + idx, SIZE); \ 174028110b72SMatheus Ferst } else { \ 174128110b72SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " 
#NAME " after 0x" \ 174228110b72SMatheus Ferst TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n", \ 174328110b72SMatheus Ferst env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE); \ 174428110b72SMatheus Ferst } \ 174528110b72SMatheus Ferst } 174628110b72SMatheus Ferst #else 174728110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \ 174828110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 174928110b72SMatheus Ferst target_ulong index) \ 175028110b72SMatheus Ferst { \ 175128110b72SMatheus Ferst const target_long idx = index; \ 175228110b72SMatheus Ferst ppc_avr_t tmp[2] = { *b, *a }; \ 175328110b72SMatheus Ferst memset(t, 0, sizeof(*t)); \ 175428110b72SMatheus Ferst if (idx >= 0 && idx + SIZE <= sizeof(tmp)) { \ 175528110b72SMatheus Ferst memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2], \ 175628110b72SMatheus Ferst (void *)tmp + sizeof(tmp) - SIZE - idx, SIZE); \ 175728110b72SMatheus Ferst } else { \ 175828110b72SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x" \ 175928110b72SMatheus Ferst TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n", \ 176028110b72SMatheus Ferst env->nip, idx < 0 ? 
SIZE - idx : idx, 32 - SIZE); \ 176128110b72SMatheus Ferst } \ 176228110b72SMatheus Ferst } 176328110b72SMatheus Ferst #endif 176428110b72SMatheus Ferst VEXTDVLX(VEXTDUBVLX, 1) 176528110b72SMatheus Ferst VEXTDVLX(VEXTDUHVLX, 2) 176628110b72SMatheus Ferst VEXTDVLX(VEXTDUWVLX, 4) 176728110b72SMatheus Ferst VEXTDVLX(VEXTDDVLX, 8) 176828110b72SMatheus Ferst #undef VEXTDVLX 1769e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1770fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1771fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1772fcf5ef2aSThomas Huth { \ 1773fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1774fcf5ef2aSThomas Huth memmove(&r->u8[8 - es], &b->u8[index], es); \ 1775fcf5ef2aSThomas Huth memset(&r->u8[8], 0, 8); \ 1776fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8 - es); \ 1777fcf5ef2aSThomas Huth } 1778fcf5ef2aSThomas Huth #else 1779fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1780fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1781fcf5ef2aSThomas Huth { \ 1782fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1783fcf5ef2aSThomas Huth uint32_t s = (16 - index) - es; \ 1784fcf5ef2aSThomas Huth memmove(&r->u8[8], &b->u8[s], es); \ 1785fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8); \ 1786fcf5ef2aSThomas Huth memset(&r->u8[8 + es], 0, 8 - es); \ 1787fcf5ef2aSThomas Huth } 1788fcf5ef2aSThomas Huth #endif 1789fcf5ef2aSThomas Huth VEXTRACT(ub, u8) 1790fcf5ef2aSThomas Huth VEXTRACT(uh, u16) 1791fcf5ef2aSThomas Huth VEXTRACT(uw, u32) 1792fcf5ef2aSThomas Huth VEXTRACT(d, u64) 1793fcf5ef2aSThomas Huth #undef VEXTRACT 1794fcf5ef2aSThomas Huth 1795fb5303ccSMatheus Ferst #define VSTRI(NAME, ELEM, NUM_ELEMS, LEFT) \ 1796fb5303ccSMatheus Ferst uint32_t helper_##NAME(ppc_avr_t *t, ppc_avr_t *b) \ 1797fb5303ccSMatheus Ferst { \ 1798fb5303ccSMatheus Ferst int i, idx, crf = 0; \ 1799fb5303ccSMatheus Ferst \ 1800fb5303ccSMatheus Ferst for (i = 0; 
i < NUM_ELEMS; i++) { \ 1801fb5303ccSMatheus Ferst idx = LEFT ? i : NUM_ELEMS - i - 1; \ 1802fb5303ccSMatheus Ferst if (b->Vsr##ELEM(idx)) { \ 1803fb5303ccSMatheus Ferst t->Vsr##ELEM(idx) = b->Vsr##ELEM(idx); \ 1804fb5303ccSMatheus Ferst } else { \ 1805fb5303ccSMatheus Ferst crf = 0b0010; \ 1806fb5303ccSMatheus Ferst break; \ 1807fb5303ccSMatheus Ferst } \ 1808fb5303ccSMatheus Ferst } \ 1809fb5303ccSMatheus Ferst \ 1810fb5303ccSMatheus Ferst for (; i < NUM_ELEMS; i++) { \ 1811fb5303ccSMatheus Ferst idx = LEFT ? i : NUM_ELEMS - i - 1; \ 1812fb5303ccSMatheus Ferst t->Vsr##ELEM(idx) = 0; \ 1813fb5303ccSMatheus Ferst } \ 1814fb5303ccSMatheus Ferst \ 1815fb5303ccSMatheus Ferst return crf; \ 1816fb5303ccSMatheus Ferst } 1817fb5303ccSMatheus Ferst VSTRI(VSTRIBL, B, 16, true) 1818fb5303ccSMatheus Ferst VSTRI(VSTRIBR, B, 16, false) 1819fb5303ccSMatheus Ferst VSTRI(VSTRIHL, H, 8, true) 1820fb5303ccSMatheus Ferst VSTRI(VSTRIHR, H, 8, false) 1821fb5303ccSMatheus Ferst #undef VSTRI 1822fb5303ccSMatheus Ferst 18238f5eeee3SMatheus Ferst void helper_XXEXTRACTUW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index) 18248ad901e5SNikunj A Dadhania { 182503b32c09SMark Cave-Ayland ppc_vsr_t t = { }; 18268ad901e5SNikunj A Dadhania size_t es = sizeof(uint32_t); 18278ad901e5SNikunj A Dadhania uint32_t ext_index; 18288ad901e5SNikunj A Dadhania int i; 18298ad901e5SNikunj A Dadhania 18308ad901e5SNikunj A Dadhania ext_index = index; 18318ad901e5SNikunj A Dadhania for (i = 0; i < es; i++, ext_index++) { 183203b32c09SMark Cave-Ayland t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16); 18338ad901e5SNikunj A Dadhania } 18348ad901e5SNikunj A Dadhania 183503b32c09SMark Cave-Ayland *xt = t; 18368ad901e5SNikunj A Dadhania } 18378ad901e5SNikunj A Dadhania 18388f5eeee3SMatheus Ferst void helper_XXINSERTW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index) 18393398b742SNikunj A Dadhania { 184003b32c09SMark Cave-Ayland ppc_vsr_t t = *xt; 18413398b742SNikunj A Dadhania size_t es = sizeof(uint32_t); 18423398b742SNikunj A 
Dadhania int ins_index, i = 0; 18433398b742SNikunj A Dadhania 18443398b742SNikunj A Dadhania ins_index = index; 18453398b742SNikunj A Dadhania for (i = 0; i < es && ins_index < 16; i++, ins_index++) { 184603b32c09SMark Cave-Ayland t.VsrB(ins_index) = xb->VsrB(8 - es + i); 18473398b742SNikunj A Dadhania } 18483398b742SNikunj A Dadhania 184903b32c09SMark Cave-Ayland *xt = t; 18503398b742SNikunj A Dadhania } 18513398b742SNikunj A Dadhania 18521015fcabSMatheus Ferst void helper_XXEVAL(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c, 18531015fcabSMatheus Ferst uint32_t desc) 18541015fcabSMatheus Ferst { 18551015fcabSMatheus Ferst /* 18561015fcabSMatheus Ferst * Instead of processing imm bit-by-bit, we'll skip the computation of 18571015fcabSMatheus Ferst * conjunctions whose corresponding bit is unset. 18581015fcabSMatheus Ferst */ 18591015fcabSMatheus Ferst int bit, imm = simd_data(desc); 18601015fcabSMatheus Ferst Int128 conj, disj = int128_zero(); 18611015fcabSMatheus Ferst 18621015fcabSMatheus Ferst /* Iterate over set bits from the least to the most significant bit */ 18631015fcabSMatheus Ferst while (imm) { 18641015fcabSMatheus Ferst /* 18651015fcabSMatheus Ferst * Get the next bit to be processed with ctz64. Invert the result of 18661015fcabSMatheus Ferst * ctz64 to match the indexing used by PowerISA. 
18671015fcabSMatheus Ferst */ 18681015fcabSMatheus Ferst bit = 7 - ctzl(imm); 18691015fcabSMatheus Ferst if (bit & 0x4) { 18701015fcabSMatheus Ferst conj = a->s128; 18711015fcabSMatheus Ferst } else { 18721015fcabSMatheus Ferst conj = int128_not(a->s128); 18731015fcabSMatheus Ferst } 18741015fcabSMatheus Ferst if (bit & 0x2) { 18751015fcabSMatheus Ferst conj = int128_and(conj, b->s128); 18761015fcabSMatheus Ferst } else { 18771015fcabSMatheus Ferst conj = int128_and(conj, int128_not(b->s128)); 18781015fcabSMatheus Ferst } 18791015fcabSMatheus Ferst if (bit & 0x1) { 18801015fcabSMatheus Ferst conj = int128_and(conj, c->s128); 18811015fcabSMatheus Ferst } else { 18821015fcabSMatheus Ferst conj = int128_and(conj, int128_not(c->s128)); 18831015fcabSMatheus Ferst } 18841015fcabSMatheus Ferst disj = int128_or(disj, conj); 18851015fcabSMatheus Ferst 18861015fcabSMatheus Ferst /* Unset the least significant bit that is set */ 18871015fcabSMatheus Ferst imm &= imm - 1; 18881015fcabSMatheus Ferst } 18891015fcabSMatheus Ferst 18901015fcabSMatheus Ferst t->s128 = disj; 18911015fcabSMatheus Ferst } 18921015fcabSMatheus Ferst 1893788c6399SMatheus Ferst #define XXBLEND(name, sz) \ 1894788c6399SMatheus Ferst void glue(helper_XXBLENDV, name)(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 1895788c6399SMatheus Ferst ppc_avr_t *c, uint32_t desc) \ 1896788c6399SMatheus Ferst { \ 1897788c6399SMatheus Ferst for (int i = 0; i < ARRAY_SIZE(t->glue(u, sz)); i++) { \ 1898788c6399SMatheus Ferst t->glue(u, sz)[i] = (c->glue(s, sz)[i] >> (sz - 1)) ? 
\ 1899788c6399SMatheus Ferst b->glue(u, sz)[i] : a->glue(u, sz)[i]; \ 1900788c6399SMatheus Ferst } \ 1901788c6399SMatheus Ferst } 1902788c6399SMatheus Ferst XXBLEND(B, 8) 1903788c6399SMatheus Ferst XXBLEND(H, 16) 1904788c6399SMatheus Ferst XXBLEND(W, 32) 1905788c6399SMatheus Ferst XXBLEND(D, 64) 1906788c6399SMatheus Ferst #undef XXBLEND 1907788c6399SMatheus Ferst 1908fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1909fcf5ef2aSThomas Huth { 19103c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1911fcf5ef2aSThomas Huth 1912e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1913fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1914fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1915fcf5ef2aSThomas Huth #else 1916fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1917fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1918fcf5ef2aSThomas Huth #endif 1919fcf5ef2aSThomas Huth } 1920fcf5ef2aSThomas Huth 1921fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1922fcf5ef2aSThomas Huth { 1923fcf5ef2aSThomas Huth int64_t t; 1924fcf5ef2aSThomas Huth int i, upper; 1925fcf5ef2aSThomas Huth ppc_avr_t result; 1926fcf5ef2aSThomas Huth int sat = 0; 1927fcf5ef2aSThomas Huth 1928fcf5ef2aSThomas Huth upper = ARRAY_SIZE(r->s32) - 1; 192960594feaSMark Cave-Ayland t = (int64_t)b->VsrSW(upper); 1930fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 193160594feaSMark Cave-Ayland t += a->VsrSW(i); 193260594feaSMark Cave-Ayland result.VsrSW(i) = 0; 1933fcf5ef2aSThomas Huth } 193460594feaSMark Cave-Ayland result.VsrSW(upper) = cvtsdsw(t, &sat); 1935fcf5ef2aSThomas Huth *r = result; 1936fcf5ef2aSThomas Huth 1937fcf5ef2aSThomas Huth if (sat) { 19386175f5a0SRichard Henderson set_vscr_sat(env); 1939fcf5ef2aSThomas Huth } 1940fcf5ef2aSThomas Huth } 1941fcf5ef2aSThomas Huth 1942fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t 
*b) 1943fcf5ef2aSThomas Huth { 1944fcf5ef2aSThomas Huth int i, j, upper; 1945fcf5ef2aSThomas Huth ppc_avr_t result; 1946fcf5ef2aSThomas Huth int sat = 0; 1947fcf5ef2aSThomas Huth 1948fcf5ef2aSThomas Huth upper = 1; 1949fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 195060594feaSMark Cave-Ayland int64_t t = (int64_t)b->VsrSW(upper + i * 2); 1951fcf5ef2aSThomas Huth 19527fa0ddc1SAnton Blanchard result.VsrD(i) = 0; 1953fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u64); j++) { 195460594feaSMark Cave-Ayland t += a->VsrSW(2 * i + j); 1955fcf5ef2aSThomas Huth } 195660594feaSMark Cave-Ayland result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat); 1957fcf5ef2aSThomas Huth } 1958fcf5ef2aSThomas Huth 1959fcf5ef2aSThomas Huth *r = result; 1960fcf5ef2aSThomas Huth if (sat) { 19616175f5a0SRichard Henderson set_vscr_sat(env); 1962fcf5ef2aSThomas Huth } 1963fcf5ef2aSThomas Huth } 1964fcf5ef2aSThomas Huth 1965fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1966fcf5ef2aSThomas Huth { 1967fcf5ef2aSThomas Huth int i, j; 1968fcf5ef2aSThomas Huth int sat = 0; 1969fcf5ef2aSThomas Huth 1970fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1971fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1972fcf5ef2aSThomas Huth 1973fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->s32); j++) { 1974fcf5ef2aSThomas Huth t += a->s8[4 * i + j]; 1975fcf5ef2aSThomas Huth } 1976fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1977fcf5ef2aSThomas Huth } 1978fcf5ef2aSThomas Huth 1979fcf5ef2aSThomas Huth if (sat) { 19806175f5a0SRichard Henderson set_vscr_sat(env); 1981fcf5ef2aSThomas Huth } 1982fcf5ef2aSThomas Huth } 1983fcf5ef2aSThomas Huth 1984fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1985fcf5ef2aSThomas Huth { 1986fcf5ef2aSThomas Huth int sat = 0; 1987fcf5ef2aSThomas Huth int i; 1988fcf5ef2aSThomas Huth 1989fcf5ef2aSThomas Huth for (i = 0; i < 
ARRAY_SIZE(r->s32); i++) { 1990fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1991fcf5ef2aSThomas Huth 1992fcf5ef2aSThomas Huth t += a->s16[2 * i] + a->s16[2 * i + 1]; 1993fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1994fcf5ef2aSThomas Huth } 1995fcf5ef2aSThomas Huth 1996fcf5ef2aSThomas Huth if (sat) { 19976175f5a0SRichard Henderson set_vscr_sat(env); 1998fcf5ef2aSThomas Huth } 1999fcf5ef2aSThomas Huth } 2000fcf5ef2aSThomas Huth 2001fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2002fcf5ef2aSThomas Huth { 2003fcf5ef2aSThomas Huth int i, j; 2004fcf5ef2aSThomas Huth int sat = 0; 2005fcf5ef2aSThomas Huth 2006fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 2007fcf5ef2aSThomas Huth uint64_t t = (uint64_t)b->u32[i]; 2008fcf5ef2aSThomas Huth 2009fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u32); j++) { 2010fcf5ef2aSThomas Huth t += a->u8[4 * i + j]; 2011fcf5ef2aSThomas Huth } 2012fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 2013fcf5ef2aSThomas Huth } 2014fcf5ef2aSThomas Huth 2015fcf5ef2aSThomas Huth if (sat) { 20166175f5a0SRichard Henderson set_vscr_sat(env); 2017fcf5ef2aSThomas Huth } 2018fcf5ef2aSThomas Huth } 2019fcf5ef2aSThomas Huth 2020e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 2021fcf5ef2aSThomas Huth #define UPKHI 1 2022fcf5ef2aSThomas Huth #define UPKLO 0 2023fcf5ef2aSThomas Huth #else 2024fcf5ef2aSThomas Huth #define UPKHI 0 2025fcf5ef2aSThomas Huth #define UPKLO 1 2026fcf5ef2aSThomas Huth #endif 2027fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi) \ 2028fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 2029fcf5ef2aSThomas Huth { \ 2030fcf5ef2aSThomas Huth int i; \ 2031fcf5ef2aSThomas Huth ppc_avr_t result; \ 2032fcf5ef2aSThomas Huth \ 2033fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { \ 2034fcf5ef2aSThomas Huth uint16_t e = b->u16[hi ? i : i + 4]; \ 2035fcf5ef2aSThomas Huth uint8_t a = (e >> 15) ? 
0xff : 0; \ 2036fcf5ef2aSThomas Huth uint8_t r = (e >> 10) & 0x1f; \ 2037fcf5ef2aSThomas Huth uint8_t g = (e >> 5) & 0x1f; \ 2038fcf5ef2aSThomas Huth uint8_t b = e & 0x1f; \ 2039fcf5ef2aSThomas Huth \ 2040fcf5ef2aSThomas Huth result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b; \ 2041fcf5ef2aSThomas Huth } \ 2042fcf5ef2aSThomas Huth *r = result; \ 2043fcf5ef2aSThomas Huth } 2044fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO) 2045fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI) 2046fcf5ef2aSThomas Huth #undef VUPKPX 2047fcf5ef2aSThomas Huth 2048fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi) \ 2049fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 2050fcf5ef2aSThomas Huth { \ 2051fcf5ef2aSThomas Huth int i; \ 2052fcf5ef2aSThomas Huth ppc_avr_t result; \ 2053fcf5ef2aSThomas Huth \ 2054fcf5ef2aSThomas Huth if (hi) { \ 2055fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) { \ 2056fcf5ef2aSThomas Huth result.unpacked[i] = b->packee[i]; \ 2057fcf5ef2aSThomas Huth } \ 2058fcf5ef2aSThomas Huth } else { \ 2059fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \ 2060fcf5ef2aSThomas Huth i++) { \ 2061fcf5ef2aSThomas Huth result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \ 2062fcf5ef2aSThomas Huth } \ 2063fcf5ef2aSThomas Huth } \ 2064fcf5ef2aSThomas Huth *r = result; \ 2065fcf5ef2aSThomas Huth } 2066fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI) 2067fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI) 2068fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI) 2069fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO) 2070fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO) 2071fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO) 2072fcf5ef2aSThomas Huth #undef VUPK 2073fcf5ef2aSThomas Huth #undef UPKHI 2074fcf5ef2aSThomas Huth #undef UPKLO 2075fcf5ef2aSThomas Huth 2076fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element) \ 2077fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *b) \ 2078fcf5ef2aSThomas Huth 
{ \ 2079fcf5ef2aSThomas Huth int i; \ 2080fcf5ef2aSThomas Huth \ 208160594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 2082fcf5ef2aSThomas Huth r->element[i] = name(b->element[i]); \ 2083fcf5ef2aSThomas Huth } \ 2084fcf5ef2aSThomas Huth } 2085fcf5ef2aSThomas Huth 2086fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8) 2087fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16) 2088fcf5ef2aSThomas Huth 2089fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8) 2090fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16) 2091fcf5ef2aSThomas Huth 2092fcf5ef2aSThomas Huth #undef clzb 2093fcf5ef2aSThomas Huth #undef clzh 2094fcf5ef2aSThomas Huth 2095fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8) 2096fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16) 2097fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v)) 2098fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v)) 2099fcf5ef2aSThomas Huth 2100fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8) 2101fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16) 2102fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32) 2103fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64) 2104fcf5ef2aSThomas Huth 2105fcf5ef2aSThomas Huth #undef ctzb 2106fcf5ef2aSThomas Huth #undef ctzh 2107fcf5ef2aSThomas Huth #undef ctzw 2108fcf5ef2aSThomas Huth #undef ctzd 2109fcf5ef2aSThomas Huth 2110fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v) 2111fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v) 2112fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v) 2113fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v) 2114fcf5ef2aSThomas Huth 2115fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8) 2116fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16) 2117fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32) 2118fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64) 2119fcf5ef2aSThomas Huth 2120fcf5ef2aSThomas Huth #undef popcntb 2121fcf5ef2aSThomas Huth #undef popcnth 2122fcf5ef2aSThomas Huth #undef popcntw 2123fcf5ef2aSThomas Huth #undef popcntd 2124fcf5ef2aSThomas Huth 
2125fcf5ef2aSThomas Huth #undef VGENERIC_DO 2126fcf5ef2aSThomas Huth 21277ca04286SMatheus Ferst void helper_VADDUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2128fcf5ef2aSThomas Huth { 21297ca04286SMatheus Ferst r->s128 = int128_add(a->s128, b->s128); 2130fcf5ef2aSThomas Huth } 2131fcf5ef2aSThomas Huth 2132896d92c8SMatheus Ferst void helper_VADDEUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2133fcf5ef2aSThomas Huth { 2134896d92c8SMatheus Ferst r->s128 = int128_add(int128_add(a->s128, b->s128), 2135896d92c8SMatheus Ferst int128_make64(int128_getlo(c->s128) & 1)); 2136fcf5ef2aSThomas Huth } 2137fcf5ef2aSThomas Huth 21388290ea50SMatheus Ferst void helper_VADDCUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2139fcf5ef2aSThomas Huth { 21408290ea50SMatheus Ferst r->VsrD(1) = int128_ult(int128_not(a->s128), b->s128); 21413c385a93SMark Cave-Ayland r->VsrD(0) = 0; 2142fcf5ef2aSThomas Huth } 2143fcf5ef2aSThomas Huth 2144896d92c8SMatheus Ferst void helper_VADDECUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2145fcf5ef2aSThomas Huth { 2146896d92c8SMatheus Ferst bool carry_out = int128_ult(int128_not(a->s128), b->s128), 2147896d92c8SMatheus Ferst carry_in = int128_getlo(c->s128) & 1; 2148fcf5ef2aSThomas Huth 2149fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2150896d92c8SMatheus Ferst carry_out = (int128_nz(a->s128) || int128_nz(b->s128)) && 2151896d92c8SMatheus Ferst int128_eq(int128_add(a->s128, b->s128), int128_makes64(-1)); 2152fcf5ef2aSThomas Huth } 2153896d92c8SMatheus Ferst 21543c385a93SMark Cave-Ayland r->VsrD(0) = 0; 21553c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2156fcf5ef2aSThomas Huth } 2157fcf5ef2aSThomas Huth 2158b132be53SMatheus Ferst void helper_VSUBUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2159fcf5ef2aSThomas Huth { 2160b132be53SMatheus Ferst r->s128 = int128_sub(a->s128, b->s128); 2161fcf5ef2aSThomas Huth } 2162fcf5ef2aSThomas Huth 2163e6a5ad43SMatheus Ferst void helper_VSUBEUQM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 
ppc_avr_t *c) 2164fcf5ef2aSThomas Huth { 2165e6a5ad43SMatheus Ferst r->s128 = int128_add(int128_add(a->s128, int128_not(b->s128)), 2166e6a5ad43SMatheus Ferst int128_make64(int128_getlo(c->s128) & 1)); 2167fcf5ef2aSThomas Huth } 2168fcf5ef2aSThomas Huth 2169b7d30faeSMatheus Ferst void helper_VSUBCUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2170fcf5ef2aSThomas Huth { 2171b7d30faeSMatheus Ferst Int128 tmp = int128_not(b->s128); 2172b7d30faeSMatheus Ferst 2173b7d30faeSMatheus Ferst r->VsrD(1) = int128_ult(int128_not(a->s128), tmp) || 2174b7d30faeSMatheus Ferst int128_eq(int128_add(a->s128, tmp), int128_makes64(-1)); 21753c385a93SMark Cave-Ayland r->VsrD(0) = 0; 2176fcf5ef2aSThomas Huth } 2177fcf5ef2aSThomas Huth 2178e6a5ad43SMatheus Ferst void helper_VSUBECUQ(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2179fcf5ef2aSThomas Huth { 2180e6a5ad43SMatheus Ferst Int128 tmp = int128_not(b->s128); 2181e6a5ad43SMatheus Ferst bool carry_out = int128_ult(int128_not(a->s128), tmp), 2182e6a5ad43SMatheus Ferst carry_in = int128_getlo(c->s128) & 1; 2183fcf5ef2aSThomas Huth 2184e6a5ad43SMatheus Ferst r->VsrD(1) = carry_out || (carry_in && int128_eq(int128_add(a->s128, tmp), 2185e6a5ad43SMatheus Ferst int128_makes64(-1))); 21863c385a93SMark Cave-Ayland r->VsrD(0) = 0; 2187fcf5ef2aSThomas Huth } 2188fcf5ef2aSThomas Huth 2189fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_1 0xC 2190fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_2 0xF 2191fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_1 0xA 2192fcf5ef2aSThomas Huth #define BCD_NEG_PREF 0xD 2193fcf5ef2aSThomas Huth #define BCD_NEG_ALT 0xB 2194fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_2 0xE 2195fcf5ef2aSThomas Huth #define NATIONAL_PLUS 0x2B 2196fcf5ef2aSThomas Huth #define NATIONAL_NEG 0x2D 2197fcf5ef2aSThomas Huth 2198365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) (15 - ((n) / 2)) 2199fcf5ef2aSThomas Huth 2200fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd) 2201fcf5ef2aSThomas Huth { 2202428115c3SMark Cave-Ayland switch 
(bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) { 2203fcf5ef2aSThomas Huth case BCD_PLUS_PREF_1: 2204fcf5ef2aSThomas Huth case BCD_PLUS_PREF_2: 2205fcf5ef2aSThomas Huth case BCD_PLUS_ALT_1: 2206fcf5ef2aSThomas Huth case BCD_PLUS_ALT_2: 2207fcf5ef2aSThomas Huth { 2208fcf5ef2aSThomas Huth return 1; 2209fcf5ef2aSThomas Huth } 2210fcf5ef2aSThomas Huth 2211fcf5ef2aSThomas Huth case BCD_NEG_PREF: 2212fcf5ef2aSThomas Huth case BCD_NEG_ALT: 2213fcf5ef2aSThomas Huth { 2214fcf5ef2aSThomas Huth return -1; 2215fcf5ef2aSThomas Huth } 2216fcf5ef2aSThomas Huth 2217fcf5ef2aSThomas Huth default: 2218fcf5ef2aSThomas Huth { 2219fcf5ef2aSThomas Huth return 0; 2220fcf5ef2aSThomas Huth } 2221fcf5ef2aSThomas Huth } 2222fcf5ef2aSThomas Huth } 2223fcf5ef2aSThomas Huth 2224fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps) 2225fcf5ef2aSThomas Huth { 2226fcf5ef2aSThomas Huth if (sgn >= 0) { 2227fcf5ef2aSThomas Huth return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2; 2228fcf5ef2aSThomas Huth } else { 2229fcf5ef2aSThomas Huth return BCD_NEG_PREF; 2230fcf5ef2aSThomas Huth } 2231fcf5ef2aSThomas Huth } 2232fcf5ef2aSThomas Huth 2233fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid) 2234fcf5ef2aSThomas Huth { 2235fcf5ef2aSThomas Huth uint8_t result; 2236fcf5ef2aSThomas Huth if (n & 1) { 2237428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4; 2238fcf5ef2aSThomas Huth } else { 2239428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF; 2240fcf5ef2aSThomas Huth } 2241fcf5ef2aSThomas Huth 2242fcf5ef2aSThomas Huth if (unlikely(result > 9)) { 2243fcf5ef2aSThomas Huth *invalid = true; 2244fcf5ef2aSThomas Huth } 2245fcf5ef2aSThomas Huth return result; 2246fcf5ef2aSThomas Huth } 2247fcf5ef2aSThomas Huth 2248fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n) 2249fcf5ef2aSThomas Huth { 2250fcf5ef2aSThomas Huth if (n & 1) { 2251428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F; 2252428115c3SMark 
Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4); 2253fcf5ef2aSThomas Huth } else { 2254428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0; 2255428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= digit; 2256fcf5ef2aSThomas Huth } 2257fcf5ef2aSThomas Huth } 2258fcf5ef2aSThomas Huth 2259071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd) 2260071663dfSJose Ricardo Ziviani { 2261071663dfSJose Ricardo Ziviani int i; 2262071663dfSJose Ricardo Ziviani int invalid = 0; 2263071663dfSJose Ricardo Ziviani 2264071663dfSJose Ricardo Ziviani if (bcd_get_sgn(bcd) == 0) { 2265071663dfSJose Ricardo Ziviani return false; 2266071663dfSJose Ricardo Ziviani } 2267071663dfSJose Ricardo Ziviani 2268071663dfSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2269071663dfSJose Ricardo Ziviani bcd_get_digit(bcd, i, &invalid); 2270071663dfSJose Ricardo Ziviani if (unlikely(invalid)) { 2271071663dfSJose Ricardo Ziviani return false; 2272071663dfSJose Ricardo Ziviani } 2273071663dfSJose Ricardo Ziviani } 2274071663dfSJose Ricardo Ziviani return true; 2275071663dfSJose Ricardo Ziviani } 2276071663dfSJose Ricardo Ziviani 2277fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd) 2278fcf5ef2aSThomas Huth { 22793c385a93SMark Cave-Ayland if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) { 2280efa73196SNikunj A Dadhania return CRF_EQ; 2281fcf5ef2aSThomas Huth } else { 2282efa73196SNikunj A Dadhania return (bcd_get_sgn(bcd) == 1) ? 
CRF_GT : CRF_LT; 2283fcf5ef2aSThomas Huth } 2284fcf5ef2aSThomas Huth } 2285fcf5ef2aSThomas Huth 2286fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n) 2287fcf5ef2aSThomas Huth { 228860594feaSMark Cave-Ayland return reg->VsrH(7 - n); 2289fcf5ef2aSThomas Huth } 2290fcf5ef2aSThomas Huth 2291fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n) 2292fcf5ef2aSThomas Huth { 229360594feaSMark Cave-Ayland reg->VsrH(7 - n) = val; 2294fcf5ef2aSThomas Huth } 2295fcf5ef2aSThomas Huth 2296fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b) 2297fcf5ef2aSThomas Huth { 2298fcf5ef2aSThomas Huth int i; 2299fcf5ef2aSThomas Huth int invalid = 0; 2300fcf5ef2aSThomas Huth for (i = 31; i > 0; i--) { 2301fcf5ef2aSThomas Huth uint8_t dig_a = bcd_get_digit(a, i, &invalid); 2302fcf5ef2aSThomas Huth uint8_t dig_b = bcd_get_digit(b, i, &invalid); 2303fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2304fcf5ef2aSThomas Huth return 0; /* doesn't matter */ 2305fcf5ef2aSThomas Huth } else if (dig_a > dig_b) { 2306fcf5ef2aSThomas Huth return 1; 2307fcf5ef2aSThomas Huth } else if (dig_a < dig_b) { 2308fcf5ef2aSThomas Huth return -1; 2309fcf5ef2aSThomas Huth } 2310fcf5ef2aSThomas Huth } 2311fcf5ef2aSThomas Huth 2312fcf5ef2aSThomas Huth return 0; 2313fcf5ef2aSThomas Huth } 2314fcf5ef2aSThomas Huth 2315936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2316fcf5ef2aSThomas Huth int *overflow) 2317fcf5ef2aSThomas Huth { 2318fcf5ef2aSThomas Huth int carry = 0; 2319fcf5ef2aSThomas Huth int i; 2320936fda4dSFabiano Rosas int is_zero = 1; 2321936fda4dSFabiano Rosas 2322fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2323fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) + 2324fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2325936fda4dSFabiano Rosas is_zero &= (digit == 0); 2326fcf5ef2aSThomas Huth if (digit > 9) { 2327fcf5ef2aSThomas Huth carry = 1; 
2328fcf5ef2aSThomas Huth digit -= 10; 2329fcf5ef2aSThomas Huth } else { 2330fcf5ef2aSThomas Huth carry = 0; 2331fcf5ef2aSThomas Huth } 2332fcf5ef2aSThomas Huth 2333fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2334fcf5ef2aSThomas Huth } 2335fcf5ef2aSThomas Huth 2336fcf5ef2aSThomas Huth *overflow = carry; 2337936fda4dSFabiano Rosas return is_zero; 2338fcf5ef2aSThomas Huth } 2339fcf5ef2aSThomas Huth 2340d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2341fcf5ef2aSThomas Huth int *overflow) 2342fcf5ef2aSThomas Huth { 2343fcf5ef2aSThomas Huth int carry = 0; 2344fcf5ef2aSThomas Huth int i; 2345d03b174aSYasmin Beatriz 2346fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2347fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) - 2348fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2349fcf5ef2aSThomas Huth if (digit & 0x80) { 2350fcf5ef2aSThomas Huth carry = -1; 2351fcf5ef2aSThomas Huth digit += 10; 2352fcf5ef2aSThomas Huth } else { 2353fcf5ef2aSThomas Huth carry = 0; 2354fcf5ef2aSThomas Huth } 2355fcf5ef2aSThomas Huth 2356fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2357fcf5ef2aSThomas Huth } 2358fcf5ef2aSThomas Huth 2359fcf5ef2aSThomas Huth *overflow = carry; 2360fcf5ef2aSThomas Huth } 2361fcf5ef2aSThomas Huth 2362fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2363fcf5ef2aSThomas Huth { 2364fcf5ef2aSThomas Huth 2365fcf5ef2aSThomas Huth int sgna = bcd_get_sgn(a); 2366fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2367fcf5ef2aSThomas Huth int invalid = (sgna == 0) || (sgnb == 0); 2368fcf5ef2aSThomas Huth int overflow = 0; 2369936fda4dSFabiano Rosas int zero = 0; 2370fcf5ef2aSThomas Huth uint32_t cr = 0; 2371fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 2372fcf5ef2aSThomas Huth 2373fcf5ef2aSThomas Huth if (!invalid) { 2374fcf5ef2aSThomas Huth if (sgna == sgnb) { 2375428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = 
bcd_preferred_sgn(sgna, ps); 2376936fda4dSFabiano Rosas zero = bcd_add_mag(&result, a, b, &invalid, &overflow); 2377936fda4dSFabiano Rosas cr = (sgna > 0) ? CRF_GT : CRF_LT; 2378fcf5ef2aSThomas Huth } else { 2379d03b174aSYasmin Beatriz int magnitude = bcd_cmp_mag(a, b); 2380d03b174aSYasmin Beatriz if (magnitude > 0) { 2381428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2382d03b174aSYasmin Beatriz bcd_sub_mag(&result, a, b, &invalid, &overflow); 2383d03b174aSYasmin Beatriz cr = (sgna > 0) ? CRF_GT : CRF_LT; 2384d03b174aSYasmin Beatriz } else if (magnitude < 0) { 2385428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps); 2386d03b174aSYasmin Beatriz bcd_sub_mag(&result, b, a, &invalid, &overflow); 2387efa73196SNikunj A Dadhania cr = (sgnb > 0) ? CRF_GT : CRF_LT; 2388d03b174aSYasmin Beatriz } else { 2389428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps); 2390d03b174aSYasmin Beatriz cr = CRF_EQ; 2391d03b174aSYasmin Beatriz } 2392fcf5ef2aSThomas Huth } 2393fcf5ef2aSThomas Huth } 2394fcf5ef2aSThomas Huth 2395fcf5ef2aSThomas Huth if (unlikely(invalid)) { 23963c385a93SMark Cave-Ayland result.VsrD(0) = result.VsrD(1) = -1; 2397efa73196SNikunj A Dadhania cr = CRF_SO; 2398fcf5ef2aSThomas Huth } else if (overflow) { 2399efa73196SNikunj A Dadhania cr |= CRF_SO; 2400936fda4dSFabiano Rosas } else if (zero) { 2401936fda4dSFabiano Rosas cr |= CRF_EQ; 2402fcf5ef2aSThomas Huth } 2403fcf5ef2aSThomas Huth 2404fcf5ef2aSThomas Huth *r = result; 2405fcf5ef2aSThomas Huth 2406fcf5ef2aSThomas Huth return cr; 2407fcf5ef2aSThomas Huth } 2408fcf5ef2aSThomas Huth 2409fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2410fcf5ef2aSThomas Huth { 2411fcf5ef2aSThomas Huth ppc_avr_t bcopy = *b; 2412fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2413fcf5ef2aSThomas Huth if (sgnb < 0) { 2414fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0); 
2415fcf5ef2aSThomas Huth } else if (sgnb > 0) { 2416fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_NEG_PREF, 0); 2417fcf5ef2aSThomas Huth } 2418fcf5ef2aSThomas Huth /* else invalid ... defer to bcdadd code for proper handling */ 2419fcf5ef2aSThomas Huth 2420fcf5ef2aSThomas Huth return helper_bcdadd(r, a, &bcopy, ps); 2421fcf5ef2aSThomas Huth } 2422fcf5ef2aSThomas Huth 2423fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2424fcf5ef2aSThomas Huth { 2425fcf5ef2aSThomas Huth int i; 2426fcf5ef2aSThomas Huth int cr = 0; 2427fcf5ef2aSThomas Huth uint16_t national = 0; 2428fcf5ef2aSThomas Huth uint16_t sgnb = get_national_digit(b, 0); 2429fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2430fcf5ef2aSThomas Huth int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG); 2431fcf5ef2aSThomas Huth 2432fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2433fcf5ef2aSThomas Huth national = get_national_digit(b, i); 2434fcf5ef2aSThomas Huth if (unlikely(national < 0x30 || national > 0x39)) { 2435fcf5ef2aSThomas Huth invalid = 1; 2436fcf5ef2aSThomas Huth break; 2437fcf5ef2aSThomas Huth } 2438fcf5ef2aSThomas Huth 2439fcf5ef2aSThomas Huth bcd_put_digit(&ret, national & 0xf, i); 2440fcf5ef2aSThomas Huth } 2441fcf5ef2aSThomas Huth 2442fcf5ef2aSThomas Huth if (sgnb == NATIONAL_PLUS) { 2443fcf5ef2aSThomas Huth bcd_put_digit(&ret, (ps == 0) ? 
BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0); 2444fcf5ef2aSThomas Huth } else { 2445fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2446fcf5ef2aSThomas Huth } 2447fcf5ef2aSThomas Huth 2448fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2449fcf5ef2aSThomas Huth 2450fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2451efa73196SNikunj A Dadhania cr = CRF_SO; 2452fcf5ef2aSThomas Huth } 2453fcf5ef2aSThomas Huth 2454fcf5ef2aSThomas Huth *r = ret; 2455fcf5ef2aSThomas Huth 2456fcf5ef2aSThomas Huth return cr; 2457fcf5ef2aSThomas Huth } 2458fcf5ef2aSThomas Huth 2459fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2460fcf5ef2aSThomas Huth { 2461fcf5ef2aSThomas Huth int i; 2462fcf5ef2aSThomas Huth int cr = 0; 2463fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2464fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2465fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2466fcf5ef2aSThomas Huth 24673c385a93SMark Cave-Ayland int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0); 2468fcf5ef2aSThomas Huth 2469fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2470fcf5ef2aSThomas Huth set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i); 2471fcf5ef2aSThomas Huth 2472fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2473fcf5ef2aSThomas Huth break; 2474fcf5ef2aSThomas Huth } 2475fcf5ef2aSThomas Huth } 2476fcf5ef2aSThomas Huth set_national_digit(&ret, (sgnb == -1) ? 
NATIONAL_NEG : NATIONAL_PLUS, 0); 2477fcf5ef2aSThomas Huth 2478fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2479fcf5ef2aSThomas Huth 2480fcf5ef2aSThomas Huth if (ox_flag) { 2481efa73196SNikunj A Dadhania cr |= CRF_SO; 2482fcf5ef2aSThomas Huth } 2483fcf5ef2aSThomas Huth 2484fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2485efa73196SNikunj A Dadhania cr = CRF_SO; 2486fcf5ef2aSThomas Huth } 2487fcf5ef2aSThomas Huth 2488fcf5ef2aSThomas Huth *r = ret; 2489fcf5ef2aSThomas Huth 2490fcf5ef2aSThomas Huth return cr; 2491fcf5ef2aSThomas Huth } 2492fcf5ef2aSThomas Huth 2493fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2494fcf5ef2aSThomas Huth { 2495fcf5ef2aSThomas Huth int i; 2496fcf5ef2aSThomas Huth int cr = 0; 2497fcf5ef2aSThomas Huth int invalid = 0; 2498fcf5ef2aSThomas Huth int zone_digit = 0; 2499fcf5ef2aSThomas Huth int zone_lead = ps ? 0xF : 0x3; 2500fcf5ef2aSThomas Huth int digit = 0; 2501fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2502428115c3SMark Cave-Ayland int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4; 2503fcf5ef2aSThomas Huth 2504fcf5ef2aSThomas Huth if (unlikely((sgnb < 0xA) && ps)) { 2505fcf5ef2aSThomas Huth invalid = 1; 2506fcf5ef2aSThomas Huth } 2507fcf5ef2aSThomas Huth 2508fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2509428115c3SMark Cave-Ayland zone_digit = i ? 
b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead; 2510428115c3SMark Cave-Ayland digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF; 2511fcf5ef2aSThomas Huth if (unlikely(zone_digit != zone_lead || digit > 0x9)) { 2512fcf5ef2aSThomas Huth invalid = 1; 2513fcf5ef2aSThomas Huth break; 2514fcf5ef2aSThomas Huth } 2515fcf5ef2aSThomas Huth 2516fcf5ef2aSThomas Huth bcd_put_digit(&ret, digit, i + 1); 2517fcf5ef2aSThomas Huth } 2518fcf5ef2aSThomas Huth 2519fcf5ef2aSThomas Huth if ((ps && (sgnb == 0xB || sgnb == 0xD)) || 2520fcf5ef2aSThomas Huth (!ps && (sgnb & 0x4))) { 2521fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2522fcf5ef2aSThomas Huth } else { 2523fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0); 2524fcf5ef2aSThomas Huth } 2525fcf5ef2aSThomas Huth 2526fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2527fcf5ef2aSThomas Huth 2528fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2529efa73196SNikunj A Dadhania cr = CRF_SO; 2530fcf5ef2aSThomas Huth } 2531fcf5ef2aSThomas Huth 2532fcf5ef2aSThomas Huth *r = ret; 2533fcf5ef2aSThomas Huth 2534fcf5ef2aSThomas Huth return cr; 2535fcf5ef2aSThomas Huth } 2536fcf5ef2aSThomas Huth 2537fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2538fcf5ef2aSThomas Huth { 2539fcf5ef2aSThomas Huth int i; 2540fcf5ef2aSThomas Huth int cr = 0; 2541fcf5ef2aSThomas Huth uint8_t digit = 0; 2542fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2543fcf5ef2aSThomas Huth int zone_lead = (ps) ? 
0xF0 : 0x30; 2544fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2545fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2546fcf5ef2aSThomas Huth 25473c385a93SMark Cave-Ayland int ox_flag = ((b->VsrD(0) >> 4) != 0); 2548fcf5ef2aSThomas Huth 2549fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2550fcf5ef2aSThomas Huth digit = bcd_get_digit(b, i + 1, &invalid); 2551fcf5ef2aSThomas Huth 2552fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2553fcf5ef2aSThomas Huth break; 2554fcf5ef2aSThomas Huth } 2555fcf5ef2aSThomas Huth 2556428115c3SMark Cave-Ayland ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit; 2557fcf5ef2aSThomas Huth } 2558fcf5ef2aSThomas Huth 2559fcf5ef2aSThomas Huth if (ps) { 2560fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1); 2561fcf5ef2aSThomas Huth } else { 2562fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1); 2563fcf5ef2aSThomas Huth } 2564fcf5ef2aSThomas Huth 2565fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2566fcf5ef2aSThomas Huth 2567fcf5ef2aSThomas Huth if (ox_flag) { 2568efa73196SNikunj A Dadhania cr |= CRF_SO; 2569fcf5ef2aSThomas Huth } 2570fcf5ef2aSThomas Huth 2571fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2572efa73196SNikunj A Dadhania cr = CRF_SO; 2573fcf5ef2aSThomas Huth } 2574fcf5ef2aSThomas Huth 2575fcf5ef2aSThomas Huth *r = ret; 2576fcf5ef2aSThomas Huth 2577fcf5ef2aSThomas Huth return cr; 2578fcf5ef2aSThomas Huth } 2579fcf5ef2aSThomas Huth 2580a3d67f3eSLuis Pires /** 2581a3d67f3eSLuis Pires * Compare 2 128-bit unsigned integers, passed in as unsigned 64-bit pairs 2582a3d67f3eSLuis Pires * 2583a3d67f3eSLuis Pires * Returns: 2584a3d67f3eSLuis Pires * > 0 if ahi|alo > bhi|blo, 2585a3d67f3eSLuis Pires * 0 if ahi|alo == bhi|blo, 2586a3d67f3eSLuis Pires * < 0 if ahi|alo < bhi|blo 2587a3d67f3eSLuis Pires */ 2588a3d67f3eSLuis Pires static inline int ucmp128(uint64_t alo, uint64_t ahi, 2589a3d67f3eSLuis Pires uint64_t blo, uint64_t bhi) 2590a3d67f3eSLuis Pires { 2591a3d67f3eSLuis Pires return (ahi == bhi) 
? 2592a3d67f3eSLuis Pires (alo > blo ? 1 : (alo == blo ? 0 : -1)) : 2593a3d67f3eSLuis Pires (ahi > bhi ? 1 : -1); 2594a3d67f3eSLuis Pires } 2595a3d67f3eSLuis Pires 2596a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2597a406c058SJose Ricardo Ziviani { 2598a406c058SJose Ricardo Ziviani int i; 2599a3d67f3eSLuis Pires int cr; 2600a406c058SJose Ricardo Ziviani uint64_t lo_value; 2601a406c058SJose Ricardo Ziviani uint64_t hi_value; 260240f3e79aSLuis Pires uint64_t rem; 2603a406c058SJose Ricardo Ziviani ppc_avr_t ret = { .u64 = { 0, 0 } }; 2604a406c058SJose Ricardo Ziviani 26053c385a93SMark Cave-Ayland if (b->VsrSD(0) < 0) { 26063c385a93SMark Cave-Ayland lo_value = -b->VsrSD(1); 26073c385a93SMark Cave-Ayland hi_value = ~b->VsrD(0) + !lo_value; 2608a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, 0xD, 0); 2609a3d67f3eSLuis Pires 2610a3d67f3eSLuis Pires cr = CRF_LT; 2611a406c058SJose Ricardo Ziviani } else { 26123c385a93SMark Cave-Ayland lo_value = b->VsrD(1); 26133c385a93SMark Cave-Ayland hi_value = b->VsrD(0); 2614a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0); 2615a3d67f3eSLuis Pires 2616a3d67f3eSLuis Pires if (hi_value == 0 && lo_value == 0) { 2617a3d67f3eSLuis Pires cr = CRF_EQ; 2618a3d67f3eSLuis Pires } else { 2619a3d67f3eSLuis Pires cr = CRF_GT; 2620a3d67f3eSLuis Pires } 2621a406c058SJose Ricardo Ziviani } 2622a406c058SJose Ricardo Ziviani 2623a3d67f3eSLuis Pires /* 2624a3d67f3eSLuis Pires * Check src limits: abs(src) <= 10^31 - 1 2625a3d67f3eSLuis Pires * 2626a3d67f3eSLuis Pires * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff 2627a3d67f3eSLuis Pires */ 2628a3d67f3eSLuis Pires if (ucmp128(lo_value, hi_value, 2629a3d67f3eSLuis Pires 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) { 2630a3d67f3eSLuis Pires cr |= CRF_SO; 2631a3d67f3eSLuis Pires 2632a3d67f3eSLuis Pires /* 2633a3d67f3eSLuis Pires * According to the ISA, if src wouldn't fit in the destination 2634a3d67f3eSLuis Pires * register, 
the result is undefined. 2635a3d67f3eSLuis Pires * In that case, we leave r unchanged. 2636a3d67f3eSLuis Pires */ 2637a3d67f3eSLuis Pires } else { 263840f3e79aSLuis Pires rem = divu128(&lo_value, &hi_value, 1000000000000000ULL); 2639a406c058SJose Ricardo Ziviani 264040f3e79aSLuis Pires for (i = 1; i < 16; rem /= 10, i++) { 264140f3e79aSLuis Pires bcd_put_digit(&ret, rem % 10, i); 2642a406c058SJose Ricardo Ziviani } 2643a406c058SJose Ricardo Ziviani 2644a406c058SJose Ricardo Ziviani for (; i < 32; lo_value /= 10, i++) { 2645a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, lo_value % 10, i); 2646a406c058SJose Ricardo Ziviani } 2647a406c058SJose Ricardo Ziviani 2648a406c058SJose Ricardo Ziviani *r = ret; 2649a3d67f3eSLuis Pires } 2650a406c058SJose Ricardo Ziviani 2651a406c058SJose Ricardo Ziviani return cr; 2652a406c058SJose Ricardo Ziviani } 2653a406c058SJose Ricardo Ziviani 2654c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2655c85bc7ddSJose Ricardo Ziviani { 2656c85bc7ddSJose Ricardo Ziviani uint8_t i; 2657c85bc7ddSJose Ricardo Ziviani int cr; 2658c85bc7ddSJose Ricardo Ziviani uint64_t carry; 2659c85bc7ddSJose Ricardo Ziviani uint64_t unused; 2660c85bc7ddSJose Ricardo Ziviani uint64_t lo_value; 2661c85bc7ddSJose Ricardo Ziviani uint64_t hi_value = 0; 2662c85bc7ddSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2663c85bc7ddSJose Ricardo Ziviani int invalid = (sgnb == 0); 2664c85bc7ddSJose Ricardo Ziviani 2665c85bc7ddSJose Ricardo Ziviani lo_value = bcd_get_digit(b, 31, &invalid); 2666c85bc7ddSJose Ricardo Ziviani for (i = 30; i > 0; i--) { 2667c85bc7ddSJose Ricardo Ziviani mulu64(&lo_value, &carry, lo_value, 10ULL); 2668c85bc7ddSJose Ricardo Ziviani mulu64(&hi_value, &unused, hi_value, 10ULL); 2669c85bc7ddSJose Ricardo Ziviani lo_value += bcd_get_digit(b, i, &invalid); 2670c85bc7ddSJose Ricardo Ziviani hi_value += carry; 2671c85bc7ddSJose Ricardo Ziviani 2672c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 
2673c85bc7ddSJose Ricardo Ziviani break; 2674c85bc7ddSJose Ricardo Ziviani } 2675c85bc7ddSJose Ricardo Ziviani } 2676c85bc7ddSJose Ricardo Ziviani 2677c85bc7ddSJose Ricardo Ziviani if (sgnb == -1) { 26783c385a93SMark Cave-Ayland r->VsrSD(1) = -lo_value; 26793c385a93SMark Cave-Ayland r->VsrSD(0) = ~hi_value + !r->VsrSD(1); 2680c85bc7ddSJose Ricardo Ziviani } else { 26813c385a93SMark Cave-Ayland r->VsrSD(1) = lo_value; 26823c385a93SMark Cave-Ayland r->VsrSD(0) = hi_value; 2683c85bc7ddSJose Ricardo Ziviani } 2684c85bc7ddSJose Ricardo Ziviani 2685c85bc7ddSJose Ricardo Ziviani cr = bcd_cmp_zero(b); 2686c85bc7ddSJose Ricardo Ziviani 2687c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2688c85bc7ddSJose Ricardo Ziviani cr = CRF_SO; 2689c85bc7ddSJose Ricardo Ziviani } 2690c85bc7ddSJose Ricardo Ziviani 2691c85bc7ddSJose Ricardo Ziviani return cr; 2692c85bc7ddSJose Ricardo Ziviani } 2693c85bc7ddSJose Ricardo Ziviani 2694c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2695c3025c3bSJose Ricardo Ziviani { 2696c3025c3bSJose Ricardo Ziviani int i; 2697c3025c3bSJose Ricardo Ziviani int invalid = 0; 2698c3025c3bSJose Ricardo Ziviani 2699c3025c3bSJose Ricardo Ziviani if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) { 2700c3025c3bSJose Ricardo Ziviani return CRF_SO; 2701c3025c3bSJose Ricardo Ziviani } 2702c3025c3bSJose Ricardo Ziviani 2703c3025c3bSJose Ricardo Ziviani *r = *a; 2704428115c3SMark Cave-Ayland bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0); 2705c3025c3bSJose Ricardo Ziviani 2706c3025c3bSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2707c3025c3bSJose Ricardo Ziviani bcd_get_digit(a, i, &invalid); 2708c3025c3bSJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2709c3025c3bSJose Ricardo Ziviani if (unlikely(invalid)) { 2710c3025c3bSJose Ricardo Ziviani return CRF_SO; 2711c3025c3bSJose Ricardo Ziviani } 2712c3025c3bSJose Ricardo Ziviani } 2713c3025c3bSJose Ricardo Ziviani 2714c3025c3bSJose Ricardo 
Ziviani return bcd_cmp_zero(r); 2715c3025c3bSJose Ricardo Ziviani } 2716c3025c3bSJose Ricardo Ziviani 2717466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2718466a3f9cSJose Ricardo Ziviani { 2719466a3f9cSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2720466a3f9cSJose Ricardo Ziviani 2721466a3f9cSJose Ricardo Ziviani *r = *b; 2722466a3f9cSJose Ricardo Ziviani bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0); 2723466a3f9cSJose Ricardo Ziviani 2724071663dfSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2725466a3f9cSJose Ricardo Ziviani return CRF_SO; 2726466a3f9cSJose Ricardo Ziviani } 2727466a3f9cSJose Ricardo Ziviani 2728466a3f9cSJose Ricardo Ziviani return bcd_cmp_zero(r); 2729466a3f9cSJose Ricardo Ziviani } 2730466a3f9cSJose Ricardo Ziviani 2731e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2732e04797f7SJose Ricardo Ziviani { 2733e04797f7SJose Ricardo Ziviani int cr; 2734428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2735e04797f7SJose Ricardo Ziviani bool ox_flag = false; 2736e04797f7SJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2737e04797f7SJose Ricardo Ziviani ppc_avr_t ret = *b; 27383c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2739e04797f7SJose Ricardo Ziviani 2740e04797f7SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2741e04797f7SJose Ricardo Ziviani return CRF_SO; 2742e04797f7SJose Ricardo Ziviani } 2743e04797f7SJose Ricardo Ziviani 2744e04797f7SJose Ricardo Ziviani if (unlikely(i > 31)) { 2745e04797f7SJose Ricardo Ziviani i = 31; 2746e04797f7SJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2747e04797f7SJose Ricardo Ziviani i = -31; 2748e04797f7SJose Ricardo Ziviani } 2749e04797f7SJose Ricardo Ziviani 2750e04797f7SJose Ricardo Ziviani if (i > 0) { 27513c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2752e04797f7SJose Ricardo Ziviani } else { 27533c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), 
&ret.VsrD(0), -i * 4); 2754e04797f7SJose Ricardo Ziviani } 2755e04797f7SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2756e04797f7SJose Ricardo Ziviani 2757e04797f7SJose Ricardo Ziviani *r = ret; 2758e04797f7SJose Ricardo Ziviani 2759e04797f7SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2760e04797f7SJose Ricardo Ziviani if (ox_flag) { 2761e04797f7SJose Ricardo Ziviani cr |= CRF_SO; 2762e04797f7SJose Ricardo Ziviani } 2763e04797f7SJose Ricardo Ziviani 2764e04797f7SJose Ricardo Ziviani return cr; 2765e04797f7SJose Ricardo Ziviani } 2766e04797f7SJose Ricardo Ziviani 2767a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2768a49a95e9SJose Ricardo Ziviani { 2769a49a95e9SJose Ricardo Ziviani int cr; 2770a49a95e9SJose Ricardo Ziviani int i; 2771a49a95e9SJose Ricardo Ziviani int invalid = 0; 2772a49a95e9SJose Ricardo Ziviani bool ox_flag = false; 2773a49a95e9SJose Ricardo Ziviani ppc_avr_t ret = *b; 2774a49a95e9SJose Ricardo Ziviani 2775a49a95e9SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 2776a49a95e9SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2777a49a95e9SJose Ricardo Ziviani 2778a49a95e9SJose Ricardo Ziviani if (unlikely(invalid)) { 2779a49a95e9SJose Ricardo Ziviani return CRF_SO; 2780a49a95e9SJose Ricardo Ziviani } 2781a49a95e9SJose Ricardo Ziviani } 2782a49a95e9SJose Ricardo Ziviani 2783428115c3SMark Cave-Ayland i = a->VsrSB(7); 2784a49a95e9SJose Ricardo Ziviani if (i >= 32) { 2785a49a95e9SJose Ricardo Ziviani ox_flag = true; 27863c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2787a49a95e9SJose Ricardo Ziviani } else if (i <= -32) { 27883c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2789a49a95e9SJose Ricardo Ziviani } else if (i > 0) { 27903c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2791a49a95e9SJose Ricardo Ziviani } else { 27923c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2793a49a95e9SJose 
Ricardo Ziviani } 2794a49a95e9SJose Ricardo Ziviani *r = ret; 2795a49a95e9SJose Ricardo Ziviani 2796a49a95e9SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2797a49a95e9SJose Ricardo Ziviani if (ox_flag) { 2798a49a95e9SJose Ricardo Ziviani cr |= CRF_SO; 2799a49a95e9SJose Ricardo Ziviani } 2800a49a95e9SJose Ricardo Ziviani 2801a49a95e9SJose Ricardo Ziviani return cr; 2802a49a95e9SJose Ricardo Ziviani } 2803a49a95e9SJose Ricardo Ziviani 2804a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2805a54238adSJose Ricardo Ziviani { 2806a54238adSJose Ricardo Ziviani int cr; 2807a54238adSJose Ricardo Ziviani int unused = 0; 2808a54238adSJose Ricardo Ziviani int invalid = 0; 2809a54238adSJose Ricardo Ziviani bool ox_flag = false; 2810a54238adSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2811a54238adSJose Ricardo Ziviani ppc_avr_t ret = *b; 28123c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2813a54238adSJose Ricardo Ziviani 2814428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2815428115c3SMark Cave-Ayland ppc_avr_t bcd_one; 2816428115c3SMark Cave-Ayland 2817428115c3SMark Cave-Ayland bcd_one.VsrD(0) = 0; 2818428115c3SMark Cave-Ayland bcd_one.VsrD(1) = 0x10; 2819a54238adSJose Ricardo Ziviani 2820a54238adSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2821a54238adSJose Ricardo Ziviani return CRF_SO; 2822a54238adSJose Ricardo Ziviani } 2823a54238adSJose Ricardo Ziviani 2824a54238adSJose Ricardo Ziviani if (unlikely(i > 31)) { 2825a54238adSJose Ricardo Ziviani i = 31; 2826a54238adSJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2827a54238adSJose Ricardo Ziviani i = -31; 2828a54238adSJose Ricardo Ziviani } 2829a54238adSJose Ricardo Ziviani 2830a54238adSJose Ricardo Ziviani if (i > 0) { 28313c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2832a54238adSJose Ricardo Ziviani } else { 28333c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2834a54238adSJose Ricardo Ziviani 
2835a54238adSJose Ricardo Ziviani if (bcd_get_digit(&ret, 0, &invalid) >= 5) { 2836a54238adSJose Ricardo Ziviani bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused); 2837a54238adSJose Ricardo Ziviani } 2838a54238adSJose Ricardo Ziviani } 2839a54238adSJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2840a54238adSJose Ricardo Ziviani 2841a54238adSJose Ricardo Ziviani cr = bcd_cmp_zero(&ret); 2842a54238adSJose Ricardo Ziviani if (ox_flag) { 2843a54238adSJose Ricardo Ziviani cr |= CRF_SO; 2844a54238adSJose Ricardo Ziviani } 2845a54238adSJose Ricardo Ziviani *r = ret; 2846a54238adSJose Ricardo Ziviani 2847a54238adSJose Ricardo Ziviani return cr; 2848a54238adSJose Ricardo Ziviani } 2849a54238adSJose Ricardo Ziviani 285031bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 285131bc4d11SJose Ricardo Ziviani { 285231bc4d11SJose Ricardo Ziviani uint64_t mask; 285331bc4d11SJose Ricardo Ziviani uint32_t ox_flag = 0; 2854428115c3SMark Cave-Ayland int i = a->VsrSH(3) + 1; 285531bc4d11SJose Ricardo Ziviani ppc_avr_t ret = *b; 285631bc4d11SJose Ricardo Ziviani 285731bc4d11SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 285831bc4d11SJose Ricardo Ziviani return CRF_SO; 285931bc4d11SJose Ricardo Ziviani } 286031bc4d11SJose Ricardo Ziviani 286131bc4d11SJose Ricardo Ziviani if (i > 16 && i < 32) { 286231bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 28633c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 286431bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 286531bc4d11SJose Ricardo Ziviani } 286631bc4d11SJose Ricardo Ziviani 28673c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 286831bc4d11SJose Ricardo Ziviani } else if (i >= 0 && i <= 16) { 286931bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 28703c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 287131bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 287231bc4d11SJose Ricardo Ziviani } 
287331bc4d11SJose Ricardo Ziviani 28743c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 28753c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 287631bc4d11SJose Ricardo Ziviani } 287731bc4d11SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0); 287831bc4d11SJose Ricardo Ziviani *r = ret; 287931bc4d11SJose Ricardo Ziviani 288031bc4d11SJose Ricardo Ziviani return bcd_cmp_zero(&ret) | ox_flag; 288131bc4d11SJose Ricardo Ziviani } 288231bc4d11SJose Ricardo Ziviani 28835c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 28845c32e2e4SJose Ricardo Ziviani { 28855c32e2e4SJose Ricardo Ziviani int i; 28865c32e2e4SJose Ricardo Ziviani uint64_t mask; 28875c32e2e4SJose Ricardo Ziviani uint32_t ox_flag = 0; 28885c32e2e4SJose Ricardo Ziviani int invalid = 0; 28895c32e2e4SJose Ricardo Ziviani ppc_avr_t ret = *b; 28905c32e2e4SJose Ricardo Ziviani 28915c32e2e4SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 28925c32e2e4SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 28935c32e2e4SJose Ricardo Ziviani 28945c32e2e4SJose Ricardo Ziviani if (unlikely(invalid)) { 28955c32e2e4SJose Ricardo Ziviani return CRF_SO; 28965c32e2e4SJose Ricardo Ziviani } 28975c32e2e4SJose Ricardo Ziviani } 28985c32e2e4SJose Ricardo Ziviani 2899428115c3SMark Cave-Ayland i = a->VsrSH(3); 29005c32e2e4SJose Ricardo Ziviani if (i > 16 && i < 33) { 29015c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 29023c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 29035c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 29045c32e2e4SJose Ricardo Ziviani } 29055c32e2e4SJose Ricardo Ziviani 29063c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 29075c32e2e4SJose Ricardo Ziviani } else if (i > 0 && i <= 16) { 29085c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 29093c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 29105c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 29115c32e2e4SJose Ricardo Ziviani } 
29125c32e2e4SJose Ricardo Ziviani 29133c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 29143c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 29155c32e2e4SJose Ricardo Ziviani } else if (i == 0) { 29163c385a93SMark Cave-Ayland if (ret.VsrD(0) || ret.VsrD(1)) { 29175c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 29185c32e2e4SJose Ricardo Ziviani } 29193c385a93SMark Cave-Ayland ret.VsrD(0) = ret.VsrD(1) = 0; 29205c32e2e4SJose Ricardo Ziviani } 29215c32e2e4SJose Ricardo Ziviani 29225c32e2e4SJose Ricardo Ziviani *r = ret; 29233c385a93SMark Cave-Ayland if (r->VsrD(0) == 0 && r->VsrD(1) == 0) { 29245c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_EQ; 29255c32e2e4SJose Ricardo Ziviani } 29265c32e2e4SJose Ricardo Ziviani 29275c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_GT; 29285c32e2e4SJose Ricardo Ziviani } 29295c32e2e4SJose Ricardo Ziviani 2930fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a) 2931fcf5ef2aSThomas Huth { 2932fcf5ef2aSThomas Huth int i; 2933fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 2934fcf5ef2aSThomas Huth r->u8[i] = AES_sbox[a->u8[i]]; 2935fcf5ef2aSThomas Huth } 2936fcf5ef2aSThomas Huth } 2937fcf5ef2aSThomas Huth 2938fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2939fcf5ef2aSThomas Huth { 2940fcf5ef2aSThomas Huth ppc_avr_t result; 2941fcf5ef2aSThomas Huth int i; 2942fcf5ef2aSThomas Huth 2943fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 29442dea57dbSMark Cave-Ayland result.VsrW(i) = b->VsrW(i) ^ 29452dea57dbSMark Cave-Ayland (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^ 29462dea57dbSMark Cave-Ayland AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^ 29472dea57dbSMark Cave-Ayland AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^ 29482dea57dbSMark Cave-Ayland AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]); 2949fcf5ef2aSThomas Huth } 2950fcf5ef2aSThomas Huth *r = result; 2951fcf5ef2aSThomas Huth } 2952fcf5ef2aSThomas Huth 2953fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 
2954fcf5ef2aSThomas Huth { 2955fcf5ef2aSThomas Huth ppc_avr_t result; 2956fcf5ef2aSThomas Huth int i; 2957fcf5ef2aSThomas Huth 2958fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 29592dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]); 2960fcf5ef2aSThomas Huth } 2961fcf5ef2aSThomas Huth *r = result; 2962fcf5ef2aSThomas Huth } 2963fcf5ef2aSThomas Huth 2964fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2965fcf5ef2aSThomas Huth { 2966fcf5ef2aSThomas Huth /* This differs from what is written in ISA V2.07. The RTL is */ 2967fcf5ef2aSThomas Huth /* incorrect and will be fixed in V2.07B. */ 2968fcf5ef2aSThomas Huth int i; 2969fcf5ef2aSThomas Huth ppc_avr_t tmp; 2970fcf5ef2aSThomas Huth 2971fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 29722dea57dbSMark Cave-Ayland tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])]; 2973fcf5ef2aSThomas Huth } 2974fcf5ef2aSThomas Huth 2975fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 29762dea57dbSMark Cave-Ayland r->VsrW(i) = 29772dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 0)][0] ^ 29782dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 1)][1] ^ 29792dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 2)][2] ^ 29802dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 3)][3]; 2981fcf5ef2aSThomas Huth } 2982fcf5ef2aSThomas Huth } 2983fcf5ef2aSThomas Huth 2984fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2985fcf5ef2aSThomas Huth { 2986fcf5ef2aSThomas Huth ppc_avr_t result; 2987fcf5ef2aSThomas Huth int i; 2988fcf5ef2aSThomas Huth 2989fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 29902dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]); 2991fcf5ef2aSThomas Huth } 2992fcf5ef2aSThomas Huth *r = result; 2993fcf5ef2aSThomas Huth } 2994fcf5ef2aSThomas Huth 2995fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 
2996fcf5ef2aSThomas Huth { 2997fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 2998fcf5ef2aSThomas Huth int six = st_six & 0xF; 2999fcf5ef2aSThomas Huth int i; 3000fcf5ef2aSThomas Huth 3001730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 3002fcf5ef2aSThomas Huth if (st == 0) { 3003fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 30040ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 7) ^ 30050ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 18) ^ 3006730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 3); 3007fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 30080ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 17) ^ 30090ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 19) ^ 3010730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 10); 3011fcf5ef2aSThomas Huth } 3012fcf5ef2aSThomas Huth } else { /* st == 1 */ 3013fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 30140ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 2) ^ 30150ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 13) ^ 30160ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 22); 3017fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 30180ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 6) ^ 30190ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 11) ^ 30200ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 25); 3021fcf5ef2aSThomas Huth } 3022fcf5ef2aSThomas Huth } 3023fcf5ef2aSThomas Huth } 3024fcf5ef2aSThomas Huth } 3025fcf5ef2aSThomas Huth 3026fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 3027fcf5ef2aSThomas Huth { 3028fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 3029fcf5ef2aSThomas Huth int six = st_six & 0xF; 3030fcf5ef2aSThomas Huth int i; 3031fcf5ef2aSThomas Huth 3032730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 3033fcf5ef2aSThomas Huth if (st == 0) { 3034fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 30350ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 1) ^ 30360ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 8) ^ 
3037730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 7); 3038fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 30390ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 19) ^ 30400ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 61) ^ 3041730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 6); 3042fcf5ef2aSThomas Huth } 3043fcf5ef2aSThomas Huth } else { /* st == 1 */ 3044fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 30450ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 28) ^ 30460ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 34) ^ 30470ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 39); 3048fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 30490ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 14) ^ 30500ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 18) ^ 30510ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 41); 3052fcf5ef2aSThomas Huth } 3053fcf5ef2aSThomas Huth } 3054fcf5ef2aSThomas Huth } 3055fcf5ef2aSThomas Huth } 3056fcf5ef2aSThomas Huth 3057fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 3058fcf5ef2aSThomas Huth { 3059fcf5ef2aSThomas Huth ppc_avr_t result; 3060fcf5ef2aSThomas Huth int i; 3061fcf5ef2aSThomas Huth 306260594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 306360594feaSMark Cave-Ayland int indexA = c->VsrB(i) >> 4; 306460594feaSMark Cave-Ayland int indexB = c->VsrB(i) & 0xF; 306560594feaSMark Cave-Ayland 306660594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB); 3067fcf5ef2aSThomas Huth } 3068fcf5ef2aSThomas Huth *r = result; 3069fcf5ef2aSThomas Huth } 3070fcf5ef2aSThomas Huth 3071fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I 3072fcf5ef2aSThomas Huth 3073fcf5ef2aSThomas Huth /*****************************************************************************/ 3074fcf5ef2aSThomas Huth /* SPE extension helpers */ 3075fcf5ef2aSThomas Huth /* Use a table to make this quicker */ 3076fcf5ef2aSThomas Huth static const uint8_t hbrev[16] = { 3077fcf5ef2aSThomas Huth 0x0, 0x8, 
0x4, 0xC, 0x2, 0xA, 0x6, 0xE, 3078fcf5ef2aSThomas Huth 0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF, 3079fcf5ef2aSThomas Huth }; 3080fcf5ef2aSThomas Huth 3081fcf5ef2aSThomas Huth static inline uint8_t byte_reverse(uint8_t val) 3082fcf5ef2aSThomas Huth { 3083fcf5ef2aSThomas Huth return hbrev[val >> 4] | (hbrev[val & 0xF] << 4); 3084fcf5ef2aSThomas Huth } 3085fcf5ef2aSThomas Huth 3086fcf5ef2aSThomas Huth static inline uint32_t word_reverse(uint32_t val) 3087fcf5ef2aSThomas Huth { 3088fcf5ef2aSThomas Huth return byte_reverse(val >> 24) | (byte_reverse(val >> 16) << 8) | 3089fcf5ef2aSThomas Huth (byte_reverse(val >> 8) << 16) | (byte_reverse(val) << 24); 3090fcf5ef2aSThomas Huth } 3091fcf5ef2aSThomas Huth 3092fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */ 3093fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2) 3094fcf5ef2aSThomas Huth { 3095fcf5ef2aSThomas Huth uint32_t a, b, d, mask; 3096fcf5ef2aSThomas Huth 3097fcf5ef2aSThomas Huth mask = UINT32_MAX >> (32 - MASKBITS); 3098fcf5ef2aSThomas Huth a = arg1 & mask; 3099fcf5ef2aSThomas Huth b = arg2 & mask; 3100fcf5ef2aSThomas Huth d = word_reverse(1 + word_reverse(a | ~b)); 3101fcf5ef2aSThomas Huth return (arg1 & ~mask) | (d & b); 3102fcf5ef2aSThomas Huth } 3103fcf5ef2aSThomas Huth 3104fcf5ef2aSThomas Huth uint32_t helper_cntlsw32(uint32_t val) 3105fcf5ef2aSThomas Huth { 3106fcf5ef2aSThomas Huth if (val & 0x80000000) { 3107fcf5ef2aSThomas Huth return clz32(~val); 3108fcf5ef2aSThomas Huth } else { 3109fcf5ef2aSThomas Huth return clz32(val); 3110fcf5ef2aSThomas Huth } 3111fcf5ef2aSThomas Huth } 3112fcf5ef2aSThomas Huth 3113fcf5ef2aSThomas Huth uint32_t helper_cntlzw32(uint32_t val) 3114fcf5ef2aSThomas Huth { 3115fcf5ef2aSThomas Huth return clz32(val); 3116fcf5ef2aSThomas Huth } 3117fcf5ef2aSThomas Huth 3118fcf5ef2aSThomas Huth /* 440 specific */ 3119fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high, 
3120fcf5ef2aSThomas Huth target_ulong low, uint32_t update_Rc) 3121fcf5ef2aSThomas Huth { 3122fcf5ef2aSThomas Huth target_ulong mask; 3123fcf5ef2aSThomas Huth int i; 3124fcf5ef2aSThomas Huth 3125fcf5ef2aSThomas Huth i = 1; 3126fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3127fcf5ef2aSThomas Huth if ((high & mask) == 0) { 3128fcf5ef2aSThomas Huth if (update_Rc) { 3129fcf5ef2aSThomas Huth env->crf[0] = 0x4; 3130fcf5ef2aSThomas Huth } 3131fcf5ef2aSThomas Huth goto done; 3132fcf5ef2aSThomas Huth } 3133fcf5ef2aSThomas Huth i++; 3134fcf5ef2aSThomas Huth } 3135fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3136fcf5ef2aSThomas Huth if ((low & mask) == 0) { 3137fcf5ef2aSThomas Huth if (update_Rc) { 3138fcf5ef2aSThomas Huth env->crf[0] = 0x8; 3139fcf5ef2aSThomas Huth } 3140fcf5ef2aSThomas Huth goto done; 3141fcf5ef2aSThomas Huth } 3142fcf5ef2aSThomas Huth i++; 3143fcf5ef2aSThomas Huth } 3144fcf5ef2aSThomas Huth i = 8; 3145fcf5ef2aSThomas Huth if (update_Rc) { 3146fcf5ef2aSThomas Huth env->crf[0] = 0x2; 3147fcf5ef2aSThomas Huth } 3148fcf5ef2aSThomas Huth done: 3149fcf5ef2aSThomas Huth env->xer = (env->xer & ~0x7F) | i; 3150fcf5ef2aSThomas Huth if (update_Rc) { 3151fcf5ef2aSThomas Huth env->crf[0] |= xer_so; 3152fcf5ef2aSThomas Huth } 3153fcf5ef2aSThomas Huth return i; 3154fcf5ef2aSThomas Huth } 3155