1fcf5ef2aSThomas Huth /* 2fcf5ef2aSThomas Huth * PowerPC integer and vector emulation helpers for QEMU. 3fcf5ef2aSThomas Huth * 4fcf5ef2aSThomas Huth * Copyright (c) 2003-2007 Jocelyn Mayer 5fcf5ef2aSThomas Huth * 6fcf5ef2aSThomas Huth * This library is free software; you can redistribute it and/or 7fcf5ef2aSThomas Huth * modify it under the terms of the GNU Lesser General Public 8fcf5ef2aSThomas Huth * License as published by the Free Software Foundation; either 96bd039cdSChetan Pant * version 2.1 of the License, or (at your option) any later version. 10fcf5ef2aSThomas Huth * 11fcf5ef2aSThomas Huth * This library is distributed in the hope that it will be useful, 12fcf5ef2aSThomas Huth * but WITHOUT ANY WARRANTY; without even the implied warranty of 13fcf5ef2aSThomas Huth * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14fcf5ef2aSThomas Huth * Lesser General Public License for more details. 15fcf5ef2aSThomas Huth * 16fcf5ef2aSThomas Huth * You should have received a copy of the GNU Lesser General Public 17fcf5ef2aSThomas Huth * License along with this library; if not, see <http://www.gnu.org/licenses/>. 18fcf5ef2aSThomas Huth */ 19db725815SMarkus Armbruster 20fcf5ef2aSThomas Huth #include "qemu/osdep.h" 21fcf5ef2aSThomas Huth #include "cpu.h" 22fcf5ef2aSThomas Huth #include "internal.h" 23fcf5ef2aSThomas Huth #include "qemu/host-utils.h" 24db725815SMarkus Armbruster #include "qemu/main-loop.h" 258a05fd9aSRichard Henderson #include "qemu/log.h" 26fcf5ef2aSThomas Huth #include "exec/helper-proto.h" 27fcf5ef2aSThomas Huth #include "crypto/aes.h" 2824f91e81SAlex Bennée #include "fpu/softfloat.h" 293f74b632SRichard Henderson #include "qapi/error.h" 303f74b632SRichard Henderson #include "qemu/guest-random.h" 311015fcabSMatheus Ferst #include "tcg/tcg-gvec-desc.h" 32fcf5ef2aSThomas Huth 33fcf5ef2aSThomas Huth #include "helper_regs.h" 34fcf5ef2aSThomas Huth /*****************************************************************************/ 35fcf5ef2aSThomas Huth /* Fixed point operations helpers */ 36fcf5ef2aSThomas Huth 37f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov) 38f32899deSNikunj A Dadhania { 39f32899deSNikunj A Dadhania if (unlikely(ov)) { 40f32899deSNikunj A Dadhania env->so = env->ov = 1; 41f32899deSNikunj A Dadhania } else { 42f32899deSNikunj A Dadhania env->ov = 0; 43f32899deSNikunj A Dadhania } 44f32899deSNikunj A Dadhania } 45f32899deSNikunj A Dadhania 46fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb, 47fcf5ef2aSThomas Huth uint32_t oe) 48fcf5ef2aSThomas Huth { 49fcf5ef2aSThomas Huth uint64_t rt = 0; 50fcf5ef2aSThomas Huth int overflow = 0; 51fcf5ef2aSThomas Huth 52fcf5ef2aSThomas Huth uint64_t dividend = (uint64_t)ra << 32; 53fcf5ef2aSThomas Huth uint64_t divisor = (uint32_t)rb; 54fcf5ef2aSThomas Huth 55fcf5ef2aSThomas Huth if (unlikely(divisor == 0)) { 56fcf5ef2aSThomas Huth overflow = 1; 57fcf5ef2aSThomas Huth } else { 58fcf5ef2aSThomas Huth rt = dividend / divisor; 59fcf5ef2aSThomas Huth overflow = rt > UINT32_MAX; 60fcf5ef2aSThomas Huth } 61fcf5ef2aSThomas Huth 62fcf5ef2aSThomas Huth if (unlikely(overflow)) { 63fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 64fcf5ef2aSThomas Huth } 65fcf5ef2aSThomas Huth 66fcf5ef2aSThomas Huth if (oe) { 67f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 68fcf5ef2aSThomas Huth } 69fcf5ef2aSThomas Huth 70fcf5ef2aSThomas Huth return (target_ulong)rt; 71fcf5ef2aSThomas Huth } 72fcf5ef2aSThomas Huth 73fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb, 74fcf5ef2aSThomas Huth uint32_t oe) 75fcf5ef2aSThomas Huth { 76fcf5ef2aSThomas Huth int64_t rt = 0; 77fcf5ef2aSThomas Huth int overflow = 0; 78fcf5ef2aSThomas Huth 79fcf5ef2aSThomas Huth int64_t dividend = (int64_t)ra << 32; 80fcf5ef2aSThomas Huth int64_t divisor = (int64_t)((int32_t)rb); 81fcf5ef2aSThomas Huth 82fcf5ef2aSThomas Huth if (unlikely((divisor == 0) || 83fcf5ef2aSThomas Huth ((divisor == -1ull) && (dividend == INT64_MIN)))) { 84fcf5ef2aSThomas Huth overflow = 1; 85fcf5ef2aSThomas Huth } else { 86fcf5ef2aSThomas Huth rt = dividend / divisor; 87fcf5ef2aSThomas Huth overflow = rt != (int32_t)rt; 88fcf5ef2aSThomas Huth } 89fcf5ef2aSThomas Huth 90fcf5ef2aSThomas Huth if (unlikely(overflow)) { 91fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 92fcf5ef2aSThomas Huth } 93fcf5ef2aSThomas Huth 94fcf5ef2aSThomas Huth if (oe) { 95f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 96fcf5ef2aSThomas Huth } 97fcf5ef2aSThomas Huth 98fcf5ef2aSThomas Huth return (target_ulong)rt; 99fcf5ef2aSThomas Huth } 100fcf5ef2aSThomas Huth 101fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 102fcf5ef2aSThomas Huth 103fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe) 104fcf5ef2aSThomas Huth { 105fcf5ef2aSThomas Huth uint64_t rt = 0; 106fcf5ef2aSThomas Huth int overflow = 0; 107fcf5ef2aSThomas Huth 1089276a31cSLuis Pires if (unlikely(rb == 0 || ra >= rb)) { 1099276a31cSLuis Pires overflow = 1; 110fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 1119276a31cSLuis Pires } else { 1129276a31cSLuis Pires divu128(&rt, &ra, rb); 113fcf5ef2aSThomas Huth } 114fcf5ef2aSThomas Huth 115fcf5ef2aSThomas Huth if (oe) { 116f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 117fcf5ef2aSThomas Huth } 118fcf5ef2aSThomas Huth 119fcf5ef2aSThomas Huth return rt; 120fcf5ef2aSThomas Huth } 121fcf5ef2aSThomas Huth 122fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe) 123fcf5ef2aSThomas Huth { 12440f3e79aSLuis Pires uint64_t rt = 0; 125fcf5ef2aSThomas Huth int64_t ra = (int64_t)rau; 126fcf5ef2aSThomas Huth int64_t rb = (int64_t)rbu; 1279276a31cSLuis Pires int overflow = 0; 128fcf5ef2aSThomas Huth 1299276a31cSLuis Pires if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) { 1309276a31cSLuis Pires overflow = 1; 131fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 1329276a31cSLuis Pires } else { 1339276a31cSLuis Pires divs128(&rt, &ra, rb); 134fcf5ef2aSThomas Huth } 135fcf5ef2aSThomas Huth 136fcf5ef2aSThomas Huth if (oe) { 137f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 138fcf5ef2aSThomas Huth } 139fcf5ef2aSThomas Huth 140fcf5ef2aSThomas Huth return rt; 141fcf5ef2aSThomas Huth } 142fcf5ef2aSThomas Huth 143fcf5ef2aSThomas Huth #endif 144fcf5ef2aSThomas Huth 145fcf5ef2aSThomas Huth 146fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 147fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */ 148fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff)) 149fcf5ef2aSThomas Huth 150b6cb41b2SDavid Gibson /* 151b6cb41b2SDavid Gibson * subtract 1 from each byte, and with inverse, check if MSB is set at each 152fcf5ef2aSThomas Huth * byte. 153fcf5ef2aSThomas Huth * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80 154fcf5ef2aSThomas Huth * (0xFF & 0xFF) & 0x80 = 0x80 (zero found) 155fcf5ef2aSThomas Huth */ 156fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80)) 157fcf5ef2aSThomas Huth 158fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */ 159fcf5ef2aSThomas Huth #define hasvalue(x, n) (haszero((x) ^ pattern(n))) 160fcf5ef2aSThomas Huth 161fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb) 162fcf5ef2aSThomas Huth { 163efa73196SNikunj A Dadhania return hasvalue(rb, ra) ? CRF_GT : 0; 164fcf5ef2aSThomas Huth } 165fcf5ef2aSThomas Huth 166fcf5ef2aSThomas Huth #undef pattern 167fcf5ef2aSThomas Huth #undef haszero 168fcf5ef2aSThomas Huth #undef hasvalue 169fcf5ef2aSThomas Huth 170b6cb41b2SDavid Gibson /* 1713f74b632SRichard Henderson * Return a random number. 172fcf5ef2aSThomas Huth */ 1733f74b632SRichard Henderson uint64_t helper_darn32(void) 174fcf5ef2aSThomas Huth { 1753f74b632SRichard Henderson Error *err = NULL; 1763f74b632SRichard Henderson uint32_t ret; 1773f74b632SRichard Henderson 1783f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1793f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1803f74b632SRichard Henderson error_get_pretty(err)); 1813f74b632SRichard Henderson error_free(err); 182fcf5ef2aSThomas Huth return -1; 183fcf5ef2aSThomas Huth } 184fcf5ef2aSThomas Huth 1853f74b632SRichard Henderson return ret; 1863f74b632SRichard Henderson } 1873f74b632SRichard Henderson 1883f74b632SRichard Henderson uint64_t helper_darn64(void) 189fcf5ef2aSThomas Huth { 1903f74b632SRichard Henderson Error *err = NULL; 1913f74b632SRichard Henderson uint64_t ret; 1923f74b632SRichard Henderson 1933f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1943f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1953f74b632SRichard Henderson error_get_pretty(err)); 1963f74b632SRichard Henderson error_free(err); 197fcf5ef2aSThomas Huth return -1; 198fcf5ef2aSThomas Huth } 199fcf5ef2aSThomas Huth 2003f74b632SRichard Henderson return ret; 2013f74b632SRichard Henderson } 202fcf5ef2aSThomas Huth 203fcf5ef2aSThomas Huth uint64_t helper_bpermd(uint64_t rs, uint64_t rb) 204fcf5ef2aSThomas Huth { 205fcf5ef2aSThomas Huth int i; 206fcf5ef2aSThomas Huth uint64_t ra = 0; 207fcf5ef2aSThomas Huth 208fcf5ef2aSThomas Huth for (i = 0; i < 8; i++) { 209fcf5ef2aSThomas Huth int index = (rs >> (i * 8)) & 0xFF; 210fcf5ef2aSThomas Huth if (index < 64) { 211a6a444a8SCédric Le Goater if (rb & PPC_BIT(index)) { 212fcf5ef2aSThomas Huth ra |= 1 << i; 213fcf5ef2aSThomas Huth } 214fcf5ef2aSThomas Huth } 215fcf5ef2aSThomas Huth } 216fcf5ef2aSThomas Huth return ra; 217fcf5ef2aSThomas Huth } 218fcf5ef2aSThomas Huth 219fcf5ef2aSThomas Huth #endif 220fcf5ef2aSThomas Huth 221fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb) 222fcf5ef2aSThomas Huth { 223fcf5ef2aSThomas Huth target_ulong mask = 0xff; 224fcf5ef2aSThomas Huth target_ulong ra = 0; 225fcf5ef2aSThomas Huth int i; 226fcf5ef2aSThomas Huth 227fcf5ef2aSThomas Huth for (i = 0; i < sizeof(target_ulong); i++) { 228fcf5ef2aSThomas Huth if ((rs & mask) == (rb & mask)) { 229fcf5ef2aSThomas Huth ra |= mask; 230fcf5ef2aSThomas Huth } 231fcf5ef2aSThomas Huth mask <<= 8; 232fcf5ef2aSThomas Huth } 233fcf5ef2aSThomas Huth return ra; 234fcf5ef2aSThomas Huth } 235fcf5ef2aSThomas Huth 236fcf5ef2aSThomas Huth /* shift right arithmetic helper */ 237fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value, 238fcf5ef2aSThomas Huth target_ulong shift) 239fcf5ef2aSThomas Huth { 240fcf5ef2aSThomas Huth int32_t ret; 241fcf5ef2aSThomas Huth 242fcf5ef2aSThomas Huth if (likely(!(shift & 0x20))) { 243fcf5ef2aSThomas Huth if (likely((uint32_t)shift != 0)) { 244fcf5ef2aSThomas Huth shift &= 0x1f; 245fcf5ef2aSThomas Huth ret = (int32_t)value >> shift; 246fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) { 247af1c259fSSandipan Das env->ca32 = env->ca = 0; 248fcf5ef2aSThomas Huth } else { 249af1c259fSSandipan Das env->ca32 = env->ca = 1; 250fcf5ef2aSThomas Huth } 251fcf5ef2aSThomas Huth } else { 252fcf5ef2aSThomas Huth ret = (int32_t)value; 253af1c259fSSandipan Das env->ca32 = env->ca = 0; 254fcf5ef2aSThomas Huth } 255fcf5ef2aSThomas Huth } else { 256fcf5ef2aSThomas Huth ret = (int32_t)value >> 31; 257af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 258fcf5ef2aSThomas Huth } 259fcf5ef2aSThomas Huth return (target_long)ret; 260fcf5ef2aSThomas Huth } 261fcf5ef2aSThomas Huth 262fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 263fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value, 264fcf5ef2aSThomas Huth target_ulong shift) 265fcf5ef2aSThomas Huth { 266fcf5ef2aSThomas Huth int64_t ret; 267fcf5ef2aSThomas Huth 268fcf5ef2aSThomas Huth if (likely(!(shift & 0x40))) { 269fcf5ef2aSThomas Huth if (likely((uint64_t)shift != 0)) { 270fcf5ef2aSThomas Huth shift &= 0x3f; 271fcf5ef2aSThomas Huth ret = (int64_t)value >> shift; 272fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) { 273af1c259fSSandipan Das env->ca32 = env->ca = 0; 274fcf5ef2aSThomas Huth } else { 275af1c259fSSandipan Das env->ca32 = env->ca = 1; 276fcf5ef2aSThomas Huth } 277fcf5ef2aSThomas Huth } else { 278fcf5ef2aSThomas Huth ret = (int64_t)value; 279af1c259fSSandipan Das env->ca32 = env->ca = 0; 280fcf5ef2aSThomas Huth } 281fcf5ef2aSThomas Huth } else { 282fcf5ef2aSThomas Huth ret = (int64_t)value >> 63; 283af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 284fcf5ef2aSThomas Huth } 285fcf5ef2aSThomas Huth return ret; 286fcf5ef2aSThomas Huth } 287fcf5ef2aSThomas Huth #endif 288fcf5ef2aSThomas Huth 289fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 290fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 291fcf5ef2aSThomas Huth { 29279770002SRichard Henderson /* Note that we don't fold past bytes */ 293fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 294fcf5ef2aSThomas Huth 0x5555555555555555ULL); 295fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 296fcf5ef2aSThomas Huth 0x3333333333333333ULL); 297fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 298fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 299fcf5ef2aSThomas Huth return val; 300fcf5ef2aSThomas Huth } 301fcf5ef2aSThomas Huth 302fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val) 303fcf5ef2aSThomas Huth { 30479770002SRichard Henderson /* Note that we don't fold past words. */ 305fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 306fcf5ef2aSThomas Huth 0x5555555555555555ULL); 307fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 308fcf5ef2aSThomas Huth 0x3333333333333333ULL); 309fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 310fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 311fcf5ef2aSThomas Huth val = (val & 0x00ff00ff00ff00ffULL) + ((val >> 8) & 312fcf5ef2aSThomas Huth 0x00ff00ff00ff00ffULL); 313fcf5ef2aSThomas Huth val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) & 314fcf5ef2aSThomas Huth 0x0000ffff0000ffffULL); 315fcf5ef2aSThomas Huth return val; 316fcf5ef2aSThomas Huth } 317fcf5ef2aSThomas Huth #else 318fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 319fcf5ef2aSThomas Huth { 32079770002SRichard Henderson /* Note that we don't fold past bytes */ 321fcf5ef2aSThomas Huth val = (val & 0x55555555) + ((val >> 1) & 0x55555555); 322fcf5ef2aSThomas Huth val = (val & 0x33333333) + ((val >> 2) & 0x33333333); 323fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f) + ((val >> 4) & 0x0f0f0f0f); 324fcf5ef2aSThomas Huth return val; 325fcf5ef2aSThomas Huth } 326fcf5ef2aSThomas Huth #endif 327fcf5ef2aSThomas Huth 3286e0bbc40SMatheus Ferst uint64_t helper_CFUGED(uint64_t src, uint64_t mask) 32989ccd7dcSMatheus Ferst { 33089ccd7dcSMatheus Ferst /* 33189ccd7dcSMatheus Ferst * Instead of processing the mask bit-by-bit from the most significant to 33289ccd7dcSMatheus Ferst * the least significant bit, as described in PowerISA, we'll handle it in 33389ccd7dcSMatheus Ferst * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use 33489ccd7dcSMatheus Ferst * ctz or cto, we negate the mask at the end of the loop. 33589ccd7dcSMatheus Ferst */ 33689ccd7dcSMatheus Ferst target_ulong m, left = 0, right = 0; 33789ccd7dcSMatheus Ferst unsigned int n, i = 64; 33889ccd7dcSMatheus Ferst bool bit = false; /* tracks if we are processing zeros or ones */ 33989ccd7dcSMatheus Ferst 34089ccd7dcSMatheus Ferst if (mask == 0 || mask == -1) { 34189ccd7dcSMatheus Ferst return src; 34289ccd7dcSMatheus Ferst } 34389ccd7dcSMatheus Ferst 34489ccd7dcSMatheus Ferst /* Processes the mask in blocks, from LSB to MSB */ 34589ccd7dcSMatheus Ferst while (i) { 34689ccd7dcSMatheus Ferst /* Find how many bits we should take */ 34789ccd7dcSMatheus Ferst n = ctz64(mask); 34889ccd7dcSMatheus Ferst if (n > i) { 34989ccd7dcSMatheus Ferst n = i; 35089ccd7dcSMatheus Ferst } 35189ccd7dcSMatheus Ferst 35289ccd7dcSMatheus Ferst /* 35389ccd7dcSMatheus Ferst * Extracts 'n' trailing bits of src and put them on the leading 'n' 35489ccd7dcSMatheus Ferst * bits of 'right' or 'left', pushing down the previously extracted 35589ccd7dcSMatheus Ferst * values. 35689ccd7dcSMatheus Ferst */ 35789ccd7dcSMatheus Ferst m = (1ll << n) - 1; 35889ccd7dcSMatheus Ferst if (bit) { 35989ccd7dcSMatheus Ferst right = ror64(right | (src & m), n); 36089ccd7dcSMatheus Ferst } else { 36189ccd7dcSMatheus Ferst left = ror64(left | (src & m), n); 36289ccd7dcSMatheus Ferst } 36389ccd7dcSMatheus Ferst 36489ccd7dcSMatheus Ferst /* 36589ccd7dcSMatheus Ferst * Discards the processed bits from 'src' and 'mask'. Note that we are 36689ccd7dcSMatheus Ferst * removing 'n' trailing zeros from 'mask', but the logical shift will 36789ccd7dcSMatheus Ferst * add 'n' leading zeros back, so the population count of 'mask' is kept 36889ccd7dcSMatheus Ferst * the same. 36989ccd7dcSMatheus Ferst */ 37089ccd7dcSMatheus Ferst src >>= n; 37189ccd7dcSMatheus Ferst mask >>= n; 37289ccd7dcSMatheus Ferst i -= n; 37389ccd7dcSMatheus Ferst bit = !bit; 37489ccd7dcSMatheus Ferst mask = ~mask; 37589ccd7dcSMatheus Ferst } 37689ccd7dcSMatheus Ferst 37789ccd7dcSMatheus Ferst /* 37889ccd7dcSMatheus Ferst * At the end, right was ror'ed ctpop(mask) times. To put it back in place, 37989ccd7dcSMatheus Ferst * we'll shift it more 64-ctpop(mask) times. 38089ccd7dcSMatheus Ferst */ 38189ccd7dcSMatheus Ferst if (bit) { 38289ccd7dcSMatheus Ferst n = ctpop64(mask); 38389ccd7dcSMatheus Ferst } else { 38489ccd7dcSMatheus Ferst n = 64 - ctpop64(mask); 38589ccd7dcSMatheus Ferst } 38689ccd7dcSMatheus Ferst 38789ccd7dcSMatheus Ferst return left | (right >> n); 38889ccd7dcSMatheus Ferst } 38989ccd7dcSMatheus Ferst 39021ba6e58SMatheus Ferst uint64_t helper_PDEPD(uint64_t src, uint64_t mask) 39121ba6e58SMatheus Ferst { 39221ba6e58SMatheus Ferst int i, o; 39321ba6e58SMatheus Ferst uint64_t result = 0; 39421ba6e58SMatheus Ferst 39521ba6e58SMatheus Ferst if (mask == -1) { 39621ba6e58SMatheus Ferst return src; 39721ba6e58SMatheus Ferst } 39821ba6e58SMatheus Ferst 39921ba6e58SMatheus Ferst for (i = 0; mask != 0; i++) { 40021ba6e58SMatheus Ferst o = ctz64(mask); 40121ba6e58SMatheus Ferst mask &= mask - 1; 40221ba6e58SMatheus Ferst result |= ((src >> i) & 1) << o; 40321ba6e58SMatheus Ferst } 40421ba6e58SMatheus Ferst 40521ba6e58SMatheus Ferst return result; 40621ba6e58SMatheus Ferst } 4078bdb7606SMatheus Ferst 4088bdb7606SMatheus Ferst uint64_t helper_PEXTD(uint64_t src, uint64_t mask) 4098bdb7606SMatheus Ferst { 4108bdb7606SMatheus Ferst int i, o; 4118bdb7606SMatheus Ferst uint64_t result = 0; 4128bdb7606SMatheus Ferst 4138bdb7606SMatheus Ferst if (mask == -1) { 4148bdb7606SMatheus Ferst return src; 4158bdb7606SMatheus Ferst } 4168bdb7606SMatheus Ferst 4178bdb7606SMatheus Ferst for (o = 0; mask != 0; o++) { 4188bdb7606SMatheus Ferst i = ctz64(mask); 4198bdb7606SMatheus Ferst mask &= mask - 1; 4208bdb7606SMatheus Ferst result |= ((src >> i) & 1) << o; 4218bdb7606SMatheus Ferst } 4228bdb7606SMatheus Ferst 4238bdb7606SMatheus Ferst return result; 4248bdb7606SMatheus Ferst } 42521ba6e58SMatheus Ferst 426fcf5ef2aSThomas Huth /*****************************************************************************/ 427fcf5ef2aSThomas Huth /* Altivec extension helpers */ 428e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 429fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 430fcf5ef2aSThomas Huth for (index = 0; index < ARRAY_SIZE(r->element); index++) 431fcf5ef2aSThomas Huth #else 432fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 433fcf5ef2aSThomas Huth for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--) 434fcf5ef2aSThomas Huth #endif 435fcf5ef2aSThomas Huth 436fcf5ef2aSThomas Huth /* Saturating arithmetic helpers. */ 437fcf5ef2aSThomas Huth #define SATCVT(from, to, from_type, to_type, min, max) \ 438fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 439fcf5ef2aSThomas Huth { \ 440fcf5ef2aSThomas Huth to_type r; \ 441fcf5ef2aSThomas Huth \ 442fcf5ef2aSThomas Huth if (x < (from_type)min) { \ 443fcf5ef2aSThomas Huth r = min; \ 444fcf5ef2aSThomas Huth *sat = 1; \ 445fcf5ef2aSThomas Huth } else if (x > (from_type)max) { \ 446fcf5ef2aSThomas Huth r = max; \ 447fcf5ef2aSThomas Huth *sat = 1; \ 448fcf5ef2aSThomas Huth } else { \ 449fcf5ef2aSThomas Huth r = x; \ 450fcf5ef2aSThomas Huth } \ 451fcf5ef2aSThomas Huth return r; \ 452fcf5ef2aSThomas Huth } 453fcf5ef2aSThomas Huth #define SATCVTU(from, to, from_type, to_type, min, max) \ 454fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 455fcf5ef2aSThomas Huth { \ 456fcf5ef2aSThomas Huth to_type r; \ 457fcf5ef2aSThomas Huth \ 458fcf5ef2aSThomas Huth if (x > (from_type)max) { \ 459fcf5ef2aSThomas Huth r = max; \ 460fcf5ef2aSThomas Huth *sat = 1; \ 461fcf5ef2aSThomas Huth } else { \ 462fcf5ef2aSThomas Huth r = x; \ 463fcf5ef2aSThomas Huth } \ 464fcf5ef2aSThomas Huth return r; \ 465fcf5ef2aSThomas Huth } 466fcf5ef2aSThomas Huth SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX) 467fcf5ef2aSThomas Huth SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX) 468fcf5ef2aSThomas Huth SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX) 469fcf5ef2aSThomas Huth 470fcf5ef2aSThomas Huth SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX) 471fcf5ef2aSThomas Huth SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX) 472fcf5ef2aSThomas Huth SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX) 473fcf5ef2aSThomas Huth SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX) 474fcf5ef2aSThomas Huth SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX) 475fcf5ef2aSThomas Huth SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX) 476fcf5ef2aSThomas Huth #undef SATCVT 477fcf5ef2aSThomas Huth #undef SATCVTU 478fcf5ef2aSThomas Huth 479dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr) 480fcf5ef2aSThomas Huth { 481c19940dbSBruno Larsen (billionai) ppc_store_vscr(env, vscr); 482fcf5ef2aSThomas Huth } 483fcf5ef2aSThomas Huth 484cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env) 485cc2b90d7SRichard Henderson { 486c19940dbSBruno Larsen (billionai) return ppc_get_vscr(env); 487cc2b90d7SRichard Henderson } 488cc2b90d7SRichard Henderson 4896175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env) 4906175f5a0SRichard Henderson { 4919b5b74daSRichard Henderson /* The choice of non-zero value is arbitrary. */ 4929b5b74daSRichard Henderson env->vscr_sat.u32[0] = 1; 4936175f5a0SRichard Henderson } 4946175f5a0SRichard Henderson 495fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 496fcf5ef2aSThomas Huth { 497fcf5ef2aSThomas Huth int i; 498fcf5ef2aSThomas Huth 499fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 500fcf5ef2aSThomas Huth r->u32[i] = ~a->u32[i] < b->u32[i]; 501fcf5ef2aSThomas Huth } 502fcf5ef2aSThomas Huth } 503fcf5ef2aSThomas Huth 504fcf5ef2aSThomas Huth /* vprtybw */ 505fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b) 506fcf5ef2aSThomas Huth { 507fcf5ef2aSThomas Huth int i; 508fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 509fcf5ef2aSThomas Huth uint64_t res = b->u32[i] ^ (b->u32[i] >> 16); 510fcf5ef2aSThomas Huth res ^= res >> 8; 511fcf5ef2aSThomas Huth r->u32[i] = res & 1; 512fcf5ef2aSThomas Huth } 513fcf5ef2aSThomas Huth } 514fcf5ef2aSThomas Huth 515fcf5ef2aSThomas Huth /* vprtybd */ 516fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b) 517fcf5ef2aSThomas Huth { 518fcf5ef2aSThomas Huth int i; 519fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 520fcf5ef2aSThomas Huth uint64_t res = b->u64[i] ^ (b->u64[i] >> 32); 521fcf5ef2aSThomas Huth res ^= res >> 16; 522fcf5ef2aSThomas Huth res ^= res >> 8; 523fcf5ef2aSThomas Huth r->u64[i] = res & 1; 524fcf5ef2aSThomas Huth } 525fcf5ef2aSThomas Huth } 526fcf5ef2aSThomas Huth 527fcf5ef2aSThomas Huth /* vprtybq */ 528fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b) 529fcf5ef2aSThomas Huth { 530fcf5ef2aSThomas Huth uint64_t res = b->u64[0] ^ b->u64[1]; 531fcf5ef2aSThomas Huth res ^= res >> 32; 532fcf5ef2aSThomas Huth res ^= res >> 16; 533fcf5ef2aSThomas Huth res ^= res >> 8; 5343c385a93SMark Cave-Ayland r->VsrD(1) = res & 1; 5353c385a93SMark Cave-Ayland r->VsrD(0) = 0; 536fcf5ef2aSThomas Huth } 537fcf5ef2aSThomas Huth 538fcf5ef2aSThomas Huth #define VARITHFP(suffix, func) \ 539fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 540fcf5ef2aSThomas Huth ppc_avr_t *b) \ 541fcf5ef2aSThomas Huth { \ 542fcf5ef2aSThomas Huth int i; \ 543fcf5ef2aSThomas Huth \ 54405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 54505ee3e8aSMark Cave-Ayland r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status); \ 546fcf5ef2aSThomas Huth } \ 547fcf5ef2aSThomas Huth } 548fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add) 549fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub) 550fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min) 551fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max) 552fcf5ef2aSThomas Huth #undef VARITHFP 553fcf5ef2aSThomas Huth 554fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type) \ 555fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 556fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) \ 557fcf5ef2aSThomas Huth { \ 558fcf5ef2aSThomas Huth int i; \ 55905ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 56005ee3e8aSMark Cave-Ayland r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \ 561fcf5ef2aSThomas Huth type, &env->vec_status); \ 562fcf5ef2aSThomas Huth } \ 563fcf5ef2aSThomas Huth } 564fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0); 565fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c); 566fcf5ef2aSThomas Huth #undef VARITHFPFMA 567fcf5ef2aSThomas Huth 568fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element) \ 569fcf5ef2aSThomas Huth { \ 570fcf5ef2aSThomas Huth type result = (type)a->element[i] op (type)b->element[i]; \ 571fcf5ef2aSThomas Huth r->element[i] = cvt(result, &sat); \ 572fcf5ef2aSThomas Huth } 573fcf5ef2aSThomas Huth 574fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element) \ 575fb11ae7dSRichard Henderson void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat, \ 576fb11ae7dSRichard Henderson ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \ 577fcf5ef2aSThomas Huth { \ 578fcf5ef2aSThomas Huth int sat = 0; \ 579fcf5ef2aSThomas Huth int i; \ 580fcf5ef2aSThomas Huth \ 581fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 582fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 583fcf5ef2aSThomas Huth } \ 584fcf5ef2aSThomas Huth if (sat) { \ 585fb11ae7dSRichard Henderson vscr_sat->u32[0] = 1; \ 586fcf5ef2aSThomas Huth } \ 587fcf5ef2aSThomas Huth } 588fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt) \ 589fcf5ef2aSThomas Huth VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element) \ 590fcf5ef2aSThomas Huth VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element) 591fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt) \ 592fcf5ef2aSThomas Huth VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element) \ 593fcf5ef2aSThomas Huth VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element) 594fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb) 595fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh) 596fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw) 597fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub) 598fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh) 599fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw) 600fcf5ef2aSThomas Huth #undef VARITHSAT_CASE 601fcf5ef2aSThomas Huth #undef VARITHSAT_DO 602fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED 603fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED 604fcf5ef2aSThomas Huth 605fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype) \ 606fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 607fcf5ef2aSThomas Huth { \ 608fcf5ef2aSThomas Huth int i; \ 609fcf5ef2aSThomas Huth \ 610fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 611fcf5ef2aSThomas Huth etype x = (etype)a->element[i] + (etype)b->element[i] + 1; \ 612fcf5ef2aSThomas Huth r->element[i] = x >> 1; \ 613fcf5ef2aSThomas Huth } \ 614fcf5ef2aSThomas Huth } 615fcf5ef2aSThomas Huth 616fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element, \ 617fcf5ef2aSThomas Huth unsigned_type) \ 618fcf5ef2aSThomas Huth VAVG_DO(avgs##type, signed_element, signed_type) \ 619fcf5ef2aSThomas Huth VAVG_DO(avgu##type, unsigned_element, unsigned_type) 620fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t) 621fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t) 622fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t) 623fcf5ef2aSThomas Huth #undef VAVG_DO 624fcf5ef2aSThomas Huth #undef VAVG 625fcf5ef2aSThomas Huth 626fcf5ef2aSThomas Huth #define VABSDU_DO(name, element) \ 627fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 628fcf5ef2aSThomas Huth { \ 629fcf5ef2aSThomas Huth int i; \ 630fcf5ef2aSThomas Huth \ 631fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 632fcf5ef2aSThomas Huth r->element[i] = (a->element[i] > b->element[i]) ? \ 633fcf5ef2aSThomas Huth (a->element[i] - b->element[i]) : \ 634fcf5ef2aSThomas Huth (b->element[i] - a->element[i]); \ 635fcf5ef2aSThomas Huth } \ 636fcf5ef2aSThomas Huth } 637fcf5ef2aSThomas Huth 638b6cb41b2SDavid Gibson /* 639b6cb41b2SDavid Gibson * VABSDU - Vector absolute difference unsigned 640fcf5ef2aSThomas Huth * name - instruction mnemonic suffix (b: byte, h: halfword, w: word) 641fcf5ef2aSThomas Huth * element - element type to access from vector 642fcf5ef2aSThomas Huth */ 643fcf5ef2aSThomas Huth #define VABSDU(type, element) \ 644fcf5ef2aSThomas Huth VABSDU_DO(absdu##type, element) 645fcf5ef2aSThomas Huth VABSDU(b, u8) 646fcf5ef2aSThomas Huth VABSDU(h, u16) 647fcf5ef2aSThomas Huth VABSDU(w, u32) 648fcf5ef2aSThomas Huth #undef VABSDU_DO 649fcf5ef2aSThomas Huth #undef VABSDU 650fcf5ef2aSThomas Huth 651fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element) \ 652fcf5ef2aSThomas Huth void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r, \ 653fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 654fcf5ef2aSThomas Huth { \ 655fcf5ef2aSThomas Huth int i; \ 656fcf5ef2aSThomas Huth \ 65705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 658fcf5ef2aSThomas Huth float32 t = cvt(b->element[i], &env->vec_status); \ 65905ee3e8aSMark Cave-Ayland r->f32[i] = float32_scalbn(t, -uim, &env->vec_status); \ 660fcf5ef2aSThomas Huth } \ 661fcf5ef2aSThomas Huth } 662fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32) 663fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32) 664fcf5ef2aSThomas Huth #undef VCF 665fcf5ef2aSThomas Huth 666eb936dc0SMatheus Ferst #define VCMPNEZ(NAME, ELEM) \ 667eb936dc0SMatheus Ferst void helper_##NAME(ppc_vsr_t *t, ppc_vsr_t *a, ppc_vsr_t *b, uint32_t desc) \ 668fcf5ef2aSThomas Huth { \ 669eb936dc0SMatheus Ferst for (int i = 0; i < ARRAY_SIZE(t->ELEM); i++) { \ 670eb936dc0SMatheus Ferst t->ELEM[i] = ((a->ELEM[i] == 0) || (b->ELEM[i] == 0) || \ 671eb936dc0SMatheus Ferst (a->ELEM[i] != b->ELEM[i])) ? -1 : 0; \ 672fcf5ef2aSThomas Huth } \ 673fcf5ef2aSThomas Huth } 674eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZB, u8) 675eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZH, u16) 676eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZW, u32) 677eb936dc0SMatheus Ferst #undef VCMPNEZ 678fcf5ef2aSThomas Huth 679fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record) \ 680fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 681fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 682fcf5ef2aSThomas Huth { \ 683fcf5ef2aSThomas Huth uint32_t ones = (uint32_t)-1; \ 684fcf5ef2aSThomas Huth uint32_t all = ones; \ 685fcf5ef2aSThomas Huth uint32_t none = 0; \ 686fcf5ef2aSThomas Huth int i; \ 687fcf5ef2aSThomas Huth \ 68805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 689fcf5ef2aSThomas Huth uint32_t result; \ 69071bfd65cSRichard Henderson FloatRelation rel = \ 69171bfd65cSRichard Henderson float32_compare_quiet(a->f32[i], b->f32[i], \ 692fcf5ef2aSThomas Huth &env->vec_status); \ 693fcf5ef2aSThomas Huth if (rel == float_relation_unordered) { \ 694fcf5ef2aSThomas Huth result = 0; \ 695fcf5ef2aSThomas Huth } else if (rel compare order) { \ 696fcf5ef2aSThomas Huth result = ones; \ 697fcf5ef2aSThomas Huth } else { \ 698fcf5ef2aSThomas Huth result = 0; \ 699fcf5ef2aSThomas Huth } \ 700fcf5ef2aSThomas Huth r->u32[i] = result; \ 701fcf5ef2aSThomas Huth all &= result; \ 702fcf5ef2aSThomas Huth none |= result; \ 703fcf5ef2aSThomas Huth } \ 704fcf5ef2aSThomas Huth if (record) { \ 705fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 706fcf5ef2aSThomas Huth } \ 707fcf5ef2aSThomas Huth } 708fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order) \ 709fcf5ef2aSThomas Huth VCMPFP_DO(suffix, compare, order, 0) \ 710fcf5ef2aSThomas Huth VCMPFP_DO(suffix##_dot, compare, order, 1) 711fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal) 712fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less) 713fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater) 714fcf5ef2aSThomas Huth #undef VCMPFP_DO 715fcf5ef2aSThomas Huth #undef VCMPFP 716fcf5ef2aSThomas Huth 717fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r, 718fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b, int record) 719fcf5ef2aSThomas Huth { 720fcf5ef2aSThomas Huth int i; 721fcf5ef2aSThomas Huth int all_in = 0; 722fcf5ef2aSThomas Huth 72305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 72471bfd65cSRichard Henderson FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i], 72505ee3e8aSMark Cave-Ayland &env->vec_status); 726fcf5ef2aSThomas Huth if (le_rel == float_relation_unordered) { 727fcf5ef2aSThomas Huth r->u32[i] = 0xc0000000; 728fcf5ef2aSThomas Huth all_in = 1; 729fcf5ef2aSThomas Huth } else { 73005ee3e8aSMark Cave-Ayland float32 bneg = float32_chs(b->f32[i]); 73171bfd65cSRichard Henderson FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg, 73205ee3e8aSMark Cave-Ayland &env->vec_status); 733fcf5ef2aSThomas Huth int le = le_rel != float_relation_greater; 734fcf5ef2aSThomas Huth int ge = ge_rel != float_relation_less; 735fcf5ef2aSThomas Huth 736fcf5ef2aSThomas Huth r->u32[i] = ((!le) << 31) | ((!ge) << 30); 737fcf5ef2aSThomas Huth all_in |= (!le | !ge); 738fcf5ef2aSThomas Huth } 739fcf5ef2aSThomas Huth } 740fcf5ef2aSThomas Huth if (record) { 741fcf5ef2aSThomas Huth env->crf[6] = (all_in == 0) << 1; 742fcf5ef2aSThomas Huth } 743fcf5ef2aSThomas Huth } 744fcf5ef2aSThomas Huth 745fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 746fcf5ef2aSThomas Huth { 747fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 0); 748fcf5ef2aSThomas Huth } 749fcf5ef2aSThomas Huth 750fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 751fcf5ef2aSThomas Huth ppc_avr_t *b) 752fcf5ef2aSThomas Huth { 753fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 1); 754fcf5ef2aSThomas Huth } 755fcf5ef2aSThomas Huth 756fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element) \ 757fcf5ef2aSThomas Huth void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r, \ 758fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 759fcf5ef2aSThomas Huth { \ 760fcf5ef2aSThomas Huth int i; \ 761fcf5ef2aSThomas Huth int sat = 0; \ 762fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 763fcf5ef2aSThomas Huth \ 764fcf5ef2aSThomas Huth set_float_rounding_mode(float_round_to_zero, &s); \ 76505ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 76605ee3e8aSMark Cave-Ayland if (float32_is_any_nan(b->f32[i])) { \ 767fcf5ef2aSThomas Huth r->element[i] = 0; \ 768fcf5ef2aSThomas Huth } else { \ 76905ee3e8aSMark Cave-Ayland float64 t = float32_to_float64(b->f32[i], &s); \ 770fcf5ef2aSThomas Huth int64_t j; \ 771fcf5ef2aSThomas Huth \ 772fcf5ef2aSThomas Huth t = float64_scalbn(t, uim, &s); \ 773fcf5ef2aSThomas Huth j = float64_to_int64(t, &s); \ 774fcf5ef2aSThomas Huth r->element[i] = satcvt(j, &sat); \ 775fcf5ef2aSThomas Huth } \ 776fcf5ef2aSThomas Huth } \ 777fcf5ef2aSThomas Huth if (sat) { \ 7786175f5a0SRichard Henderson set_vscr_sat(env); \ 779fcf5ef2aSThomas Huth } \ 780fcf5ef2aSThomas Huth } 781fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32) 782fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32) 783fcf5ef2aSThomas Huth #undef VCT 784fcf5ef2aSThomas Huth 78534553153SLucas Mateus Castro (alqotel) typedef int64_t do_ger(uint32_t, uint32_t, uint32_t); 78634553153SLucas Mateus Castro (alqotel) 78734553153SLucas Mateus Castro (alqotel) static int64_t ger_rank8(uint32_t a, uint32_t b, uint32_t mask) 78834553153SLucas Mateus Castro (alqotel) { 78934553153SLucas Mateus Castro (alqotel) int64_t psum = 0; 79034553153SLucas Mateus Castro (alqotel) for (int i = 0; i < 8; i++, mask >>= 1) { 79134553153SLucas Mateus Castro (alqotel) if (mask & 1) { 79234553153SLucas Mateus Castro (alqotel) psum += sextract32(a, 4 * i, 4) * sextract32(b, 4 * i, 4); 79334553153SLucas Mateus Castro (alqotel) } 79434553153SLucas Mateus Castro (alqotel) } 79534553153SLucas Mateus Castro (alqotel) return psum; 79634553153SLucas Mateus Castro (alqotel) } 79734553153SLucas Mateus Castro (alqotel) 79834553153SLucas Mateus Castro (alqotel) static int64_t ger_rank4(uint32_t a, uint32_t b, uint32_t mask) 79934553153SLucas Mateus Castro (alqotel) { 80034553153SLucas Mateus Castro (alqotel) int64_t psum = 0; 80134553153SLucas Mateus Castro (alqotel) for (int i = 0; i < 4; i++, mask >>= 1) { 80234553153SLucas Mateus Castro (alqotel) if (mask & 1) { 80334553153SLucas Mateus Castro (alqotel) psum += sextract32(a, 8 * i, 8) * (int64_t)extract32(b, 8 * i, 8); 80434553153SLucas Mateus Castro (alqotel) } 80534553153SLucas Mateus Castro (alqotel) } 80634553153SLucas Mateus Castro (alqotel) return psum; 80734553153SLucas Mateus Castro (alqotel) } 80834553153SLucas Mateus Castro (alqotel) 80934553153SLucas Mateus Castro (alqotel) static int64_t ger_rank2(uint32_t a, uint32_t b, uint32_t mask) 81034553153SLucas Mateus Castro (alqotel) { 81134553153SLucas Mateus Castro (alqotel) int64_t psum = 0; 81234553153SLucas Mateus Castro (alqotel) for (int i = 0; i < 2; i++, mask >>= 1) { 81334553153SLucas Mateus Castro (alqotel) if (mask & 1) { 81434553153SLucas Mateus Castro (alqotel) psum += sextract32(a, 16 * i, 16) * sextract32(b, 16 * i, 16); 81534553153SLucas Mateus Castro (alqotel) } 81634553153SLucas Mateus Castro (alqotel) } 81734553153SLucas Mateus Castro (alqotel) return psum; 81834553153SLucas Mateus Castro (alqotel) } 81934553153SLucas Mateus Castro (alqotel) 82034553153SLucas Mateus Castro (alqotel) static void xviger(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, ppc_acc_t *at, 82134553153SLucas Mateus Castro (alqotel) uint32_t mask, bool sat, bool acc, do_ger ger) 82234553153SLucas Mateus Castro (alqotel) { 82334553153SLucas Mateus Castro (alqotel) uint8_t pmsk = FIELD_EX32(mask, GER_MSK, PMSK), 82434553153SLucas Mateus Castro (alqotel) xmsk = FIELD_EX32(mask, GER_MSK, XMSK), 82534553153SLucas Mateus Castro (alqotel) ymsk = FIELD_EX32(mask, GER_MSK, YMSK); 82634553153SLucas Mateus Castro (alqotel) uint8_t xmsk_bit, ymsk_bit; 82734553153SLucas Mateus Castro (alqotel) int64_t psum; 82834553153SLucas Mateus Castro (alqotel) int i, j; 82934553153SLucas Mateus Castro (alqotel) for (i = 0, xmsk_bit = 1 << 3; i < 4; i++, xmsk_bit >>= 1) { 83034553153SLucas Mateus Castro (alqotel) for (j = 0, ymsk_bit = 1 << 3; j < 4; j++, ymsk_bit >>= 1) { 83134553153SLucas Mateus Castro (alqotel) if ((xmsk_bit & xmsk) && (ymsk_bit & ymsk)) { 83234553153SLucas Mateus Castro (alqotel) psum = ger(a->VsrW(i), b->VsrW(j), pmsk); 83334553153SLucas Mateus Castro (alqotel) if (acc) { 83434553153SLucas Mateus Castro (alqotel) psum += at[i].VsrSW(j); 83534553153SLucas Mateus Castro (alqotel) } 83634553153SLucas Mateus Castro (alqotel) if (sat && psum > INT32_MAX) { 83734553153SLucas Mateus Castro (alqotel) set_vscr_sat(env); 83834553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = INT32_MAX; 83934553153SLucas Mateus Castro (alqotel) } else if (sat && psum < INT32_MIN) { 84034553153SLucas Mateus Castro (alqotel) set_vscr_sat(env); 84134553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = INT32_MIN; 84234553153SLucas Mateus Castro (alqotel) } else { 84334553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = (int32_t) psum; 84434553153SLucas Mateus Castro (alqotel) } 84534553153SLucas Mateus Castro (alqotel) } else { 84634553153SLucas Mateus Castro (alqotel) at[i].VsrSW(j) = 0; 84734553153SLucas Mateus Castro (alqotel) } 84834553153SLucas Mateus Castro (alqotel) } 84934553153SLucas Mateus Castro (alqotel) } 85034553153SLucas Mateus Castro (alqotel) } 85134553153SLucas Mateus Castro (alqotel) 85234553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 85334553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 85434553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 85534553153SLucas Mateus Castro (alqotel) { 85634553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, false, ger_rank8); 85734553153SLucas Mateus Castro (alqotel) } 85834553153SLucas Mateus Castro (alqotel) 85934553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 86034553153SLucas Mateus Castro (alqotel) void helper_XVI4GER8PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 86134553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 86234553153SLucas Mateus Castro (alqotel) { 86334553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, true, ger_rank8); 86434553153SLucas Mateus Castro (alqotel) } 86534553153SLucas Mateus Castro (alqotel) 86634553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 86734553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 86834553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 86934553153SLucas Mateus Castro (alqotel) { 87034553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, false, ger_rank4); 87134553153SLucas Mateus Castro (alqotel) } 87234553153SLucas Mateus Castro (alqotel) 87334553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 87434553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 87534553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 87634553153SLucas Mateus Castro (alqotel) { 87734553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, true, ger_rank4); 87834553153SLucas Mateus Castro (alqotel) } 87934553153SLucas Mateus Castro (alqotel) 88034553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 88134553153SLucas Mateus Castro (alqotel) void helper_XVI8GER4SPP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 88234553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 88334553153SLucas Mateus Castro (alqotel) { 88434553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, true, true, ger_rank4); 88534553153SLucas Mateus Castro (alqotel) } 88634553153SLucas Mateus Castro (alqotel) 88734553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 88834553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 88934553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 89034553153SLucas Mateus Castro (alqotel) { 89134553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, false, ger_rank2); 89234553153SLucas Mateus Castro (alqotel) } 89334553153SLucas Mateus Castro (alqotel) 89434553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 89534553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2S(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 89634553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 89734553153SLucas Mateus Castro (alqotel) { 89834553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, true, false, ger_rank2); 89934553153SLucas Mateus Castro (alqotel) } 90034553153SLucas Mateus Castro (alqotel) 90134553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 90234553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2PP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 90334553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 90434553153SLucas Mateus Castro (alqotel) { 90534553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, false, true, ger_rank2); 90634553153SLucas Mateus Castro (alqotel) } 90734553153SLucas Mateus Castro (alqotel) 90834553153SLucas Mateus Castro (alqotel) QEMU_FLATTEN 90934553153SLucas Mateus Castro (alqotel) void helper_XVI16GER2SPP(CPUPPCState *env, ppc_vsr_t *a, ppc_vsr_t *b, 91034553153SLucas Mateus Castro (alqotel) ppc_acc_t *at, uint32_t mask) 91134553153SLucas Mateus Castro (alqotel) { 91234553153SLucas Mateus Castro (alqotel) xviger(env, a, b, at, mask, true, true, ger_rank2); 91334553153SLucas Mateus Castro (alqotel) } 91434553153SLucas Mateus Castro (alqotel) 915fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r) 916fcf5ef2aSThomas Huth { 917fcf5ef2aSThomas Huth target_ulong count = 0; 918fcf5ef2aSThomas Huth int i; 91960594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 92060594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 921fcf5ef2aSThomas Huth break; 922fcf5ef2aSThomas Huth } 923fcf5ef2aSThomas Huth count++; 924fcf5ef2aSThomas Huth } 925fcf5ef2aSThomas Huth return count; 926fcf5ef2aSThomas Huth } 927fcf5ef2aSThomas Huth 928fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r) 929fcf5ef2aSThomas Huth { 930fcf5ef2aSThomas Huth target_ulong count = 0; 931fcf5ef2aSThomas Huth int i; 932fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 93360594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 934fcf5ef2aSThomas Huth break; 935fcf5ef2aSThomas Huth } 936fcf5ef2aSThomas Huth count++; 937fcf5ef2aSThomas Huth } 938fcf5ef2aSThomas Huth return count; 939fcf5ef2aSThomas Huth } 940fcf5ef2aSThomas Huth 941fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 942fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 943fcf5ef2aSThomas Huth { 944fcf5ef2aSThomas Huth int sat = 0; 945fcf5ef2aSThomas Huth int i; 946fcf5ef2aSThomas Huth 947fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 948fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 949fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 950fcf5ef2aSThomas Huth 951fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 952fcf5ef2aSThomas Huth } 953fcf5ef2aSThomas Huth 954fcf5ef2aSThomas Huth if (sat) { 9556175f5a0SRichard Henderson set_vscr_sat(env); 956fcf5ef2aSThomas Huth } 957fcf5ef2aSThomas Huth } 958fcf5ef2aSThomas Huth 959fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 960fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 961fcf5ef2aSThomas Huth { 962fcf5ef2aSThomas Huth int sat = 0; 963fcf5ef2aSThomas Huth int i; 964fcf5ef2aSThomas Huth 965fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 966fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i] + 0x00004000; 967fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 968fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 969fcf5ef2aSThomas Huth } 970fcf5ef2aSThomas Huth 971fcf5ef2aSThomas Huth if (sat) { 9726175f5a0SRichard Henderson set_vscr_sat(env); 973fcf5ef2aSThomas Huth } 974fcf5ef2aSThomas Huth } 975fcf5ef2aSThomas Huth 976fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 977fcf5ef2aSThomas Huth { 978fcf5ef2aSThomas Huth int i; 979fcf5ef2aSThomas Huth 980fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 981fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 982fcf5ef2aSThomas Huth r->s16[i] = (int16_t) (prod + c->s16[i]); 983fcf5ef2aSThomas Huth } 984fcf5ef2aSThomas Huth } 985fcf5ef2aSThomas Huth 986d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs) \ 987fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 988fcf5ef2aSThomas Huth { \ 989fcf5ef2aSThomas Huth ppc_avr_t result; \ 990d81c2040SMark Cave-Ayland int i, half = ARRAY_SIZE(r->element) / 2; \ 991fcf5ef2aSThomas Huth \ 992d81c2040SMark Cave-Ayland for (i = 0; i < half; i++) { \ 993d81c2040SMark Cave-Ayland result.access(i * 2 + 0) = a->access(i + ofs); \ 994d81c2040SMark Cave-Ayland result.access(i * 2 + 1) = b->access(i + ofs); \ 995fcf5ef2aSThomas Huth } \ 996fcf5ef2aSThomas Huth *r = result; \ 997fcf5ef2aSThomas Huth } 998d81c2040SMark Cave-Ayland 999d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access) \ 1000d81c2040SMark Cave-Ayland VMRG_DO(mrgl##suffix, element, access, half) \ 1001d81c2040SMark Cave-Ayland VMRG_DO(mrgh##suffix, element, access, 0) 1002d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB) 1003d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH) 1004d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW) 1005fcf5ef2aSThomas Huth #undef VMRG_DO 1006fcf5ef2aSThomas Huth #undef VMRG 1007fcf5ef2aSThomas Huth 1008b2dc03a5SMatheus Ferst void helper_VMSUMMBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1009fcf5ef2aSThomas Huth { 1010fcf5ef2aSThomas Huth int32_t prod[16]; 1011fcf5ef2aSThomas Huth int i; 1012fcf5ef2aSThomas Huth 1013fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s8); i++) { 1014fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s8[i] * b->u8[i]; 1015fcf5ef2aSThomas Huth } 1016fcf5ef2aSThomas Huth 1017fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1018fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] + 1019fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1020fcf5ef2aSThomas Huth } 1021fcf5ef2aSThomas Huth } 1022fcf5ef2aSThomas Huth 10236f52f731SMatheus Ferst void helper_VMSUMSHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1024fcf5ef2aSThomas Huth { 1025fcf5ef2aSThomas Huth int32_t prod[8]; 1026fcf5ef2aSThomas Huth int i; 1027fcf5ef2aSThomas Huth 1028fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1029fcf5ef2aSThomas Huth prod[i] = a->s16[i] * b->s16[i]; 1030fcf5ef2aSThomas Huth } 1031fcf5ef2aSThomas Huth 1032fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1033fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1034fcf5ef2aSThomas Huth } 1035fcf5ef2aSThomas Huth } 1036fcf5ef2aSThomas Huth 10376f52f731SMatheus Ferst void helper_VMSUMSHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1038fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1039fcf5ef2aSThomas Huth { 1040fcf5ef2aSThomas Huth int32_t prod[8]; 1041fcf5ef2aSThomas Huth int i; 1042fcf5ef2aSThomas Huth int sat = 0; 1043fcf5ef2aSThomas Huth 1044fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1045fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s16[i] * b->s16[i]; 1046fcf5ef2aSThomas Huth } 1047fcf5ef2aSThomas Huth 1048fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1049fcf5ef2aSThomas Huth int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1050fcf5ef2aSThomas Huth 1051fcf5ef2aSThomas Huth r->u32[i] = cvtsdsw(t, &sat); 1052fcf5ef2aSThomas Huth } 1053fcf5ef2aSThomas Huth 1054fcf5ef2aSThomas Huth if (sat) { 10556175f5a0SRichard Henderson set_vscr_sat(env); 1056fcf5ef2aSThomas Huth } 1057fcf5ef2aSThomas Huth } 1058fcf5ef2aSThomas Huth 1059b2dc03a5SMatheus Ferst void helper_VMSUMUBM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1060fcf5ef2aSThomas Huth { 1061fcf5ef2aSThomas Huth uint16_t prod[16]; 1062fcf5ef2aSThomas Huth int i; 1063fcf5ef2aSThomas Huth 1064fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1065fcf5ef2aSThomas Huth prod[i] = a->u8[i] * b->u8[i]; 1066fcf5ef2aSThomas Huth } 1067fcf5ef2aSThomas Huth 1068fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1069fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] + 1070fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1071fcf5ef2aSThomas Huth } 1072fcf5ef2aSThomas Huth } 1073fcf5ef2aSThomas Huth 107489a5a1aeSMatheus Ferst void helper_VMSUMUHM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1075fcf5ef2aSThomas Huth { 1076fcf5ef2aSThomas Huth uint32_t prod[8]; 1077fcf5ef2aSThomas Huth int i; 1078fcf5ef2aSThomas Huth 1079fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1080fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1081fcf5ef2aSThomas Huth } 1082fcf5ef2aSThomas Huth 1083fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1084fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1085fcf5ef2aSThomas Huth } 1086fcf5ef2aSThomas Huth } 1087fcf5ef2aSThomas Huth 108889a5a1aeSMatheus Ferst void helper_VMSUMUHS(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1089fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1090fcf5ef2aSThomas Huth { 1091fcf5ef2aSThomas Huth uint32_t prod[8]; 1092fcf5ef2aSThomas Huth int i; 1093fcf5ef2aSThomas Huth int sat = 0; 1094fcf5ef2aSThomas Huth 1095fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1096fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1097fcf5ef2aSThomas Huth } 1098fcf5ef2aSThomas Huth 1099fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1100fcf5ef2aSThomas Huth uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1101fcf5ef2aSThomas Huth 1102fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1103fcf5ef2aSThomas Huth } 1104fcf5ef2aSThomas Huth 1105fcf5ef2aSThomas Huth if (sat) { 11066175f5a0SRichard Henderson set_vscr_sat(env); 1107fcf5ef2aSThomas Huth } 1108fcf5ef2aSThomas Huth } 1109fcf5ef2aSThomas Huth 11104fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast) \ 111180eca687SLucas Mateus Castro (alqotel) void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1112fcf5ef2aSThomas Huth { \ 1113fcf5ef2aSThomas Huth int i; \ 1114fcf5ef2aSThomas Huth \ 11154fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 11164fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i) * \ 11174fbc89edSMark Cave-Ayland (cast)b->mul_access(i); \ 1118fcf5ef2aSThomas Huth } \ 1119fcf5ef2aSThomas Huth } 11204fbc89edSMark Cave-Ayland 11214fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast) \ 112280eca687SLucas Mateus Castro (alqotel) void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 11234fbc89edSMark Cave-Ayland { \ 11244fbc89edSMark Cave-Ayland int i; \ 11254fbc89edSMark Cave-Ayland \ 11264fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 11274fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) * \ 11284fbc89edSMark Cave-Ayland (cast)b->mul_access(i + 1); \ 11294fbc89edSMark Cave-Ayland } \ 11304fbc89edSMark Cave-Ayland } 11314fbc89edSMark Cave-Ayland 11324fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast) \ 113380eca687SLucas Mateus Castro (alqotel) VMUL_DO_EVN(MULE##suffix, mul_element, mul_access, prod_access, cast) \ 113480eca687SLucas Mateus Castro (alqotel) VMUL_DO_ODD(MULO##suffix, mul_element, mul_access, prod_access, cast) 113580eca687SLucas Mateus Castro (alqotel) VMUL(SB, s8, VsrSB, VsrSH, int16_t) 113680eca687SLucas Mateus Castro (alqotel) VMUL(SH, s16, VsrSH, VsrSW, int32_t) 113780eca687SLucas Mateus Castro (alqotel) VMUL(SW, s32, VsrSW, VsrSD, int64_t) 113880eca687SLucas Mateus Castro (alqotel) VMUL(UB, u8, VsrB, VsrH, uint16_t) 113980eca687SLucas Mateus Castro (alqotel) VMUL(UH, u16, VsrH, VsrW, uint32_t) 114080eca687SLucas Mateus Castro (alqotel) VMUL(UW, u32, VsrW, VsrD, uint64_t) 11414fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN 11424fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD 1143fcf5ef2aSThomas Huth #undef VMUL 1144fcf5ef2aSThomas Huth 114541c2877fSMatheus Ferst void helper_XXPERMX(ppc_vsr_t *t, ppc_vsr_t *s0, ppc_vsr_t *s1, ppc_vsr_t *pcv, 114641c2877fSMatheus Ferst target_ulong uim) 114741c2877fSMatheus Ferst { 114841c2877fSMatheus Ferst int i, idx; 114941c2877fSMatheus Ferst ppc_vsr_t tmp = { .u64 = {0, 0} }; 115041c2877fSMatheus Ferst 115141c2877fSMatheus Ferst for (i = 0; i < ARRAY_SIZE(t->u8); i++) { 115241c2877fSMatheus Ferst if ((pcv->VsrB(i) >> 5) == uim) { 115341c2877fSMatheus Ferst idx = pcv->VsrB(i) & 0x1f; 115441c2877fSMatheus Ferst if (idx < ARRAY_SIZE(t->u8)) { 115541c2877fSMatheus Ferst tmp.VsrB(i) = s0->VsrB(idx); 115641c2877fSMatheus Ferst } else { 115741c2877fSMatheus Ferst tmp.VsrB(i) = s1->VsrB(idx - ARRAY_SIZE(t->u8)); 115841c2877fSMatheus Ferst } 115941c2877fSMatheus Ferst } 116041c2877fSMatheus Ferst } 116141c2877fSMatheus Ferst 116241c2877fSMatheus Ferst *t = tmp; 116341c2877fSMatheus Ferst } 116441c2877fSMatheus Ferst 1165*1700f2bfSLucas Mateus Castro (alqotel) void helper_VDIVSQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1166*1700f2bfSLucas Mateus Castro (alqotel) { 1167*1700f2bfSLucas Mateus Castro (alqotel) Int128 neg1 = int128_makes64(-1); 1168*1700f2bfSLucas Mateus Castro (alqotel) Int128 int128_min = int128_make128(0, INT64_MIN); 1169*1700f2bfSLucas Mateus Castro (alqotel) if (likely(int128_nz(b->s128) && 1170*1700f2bfSLucas Mateus Castro (alqotel) (int128_ne(a->s128, int128_min) || int128_ne(b->s128, neg1)))) { 1171*1700f2bfSLucas Mateus Castro (alqotel) t->s128 = int128_divs(a->s128, b->s128); 1172*1700f2bfSLucas Mateus Castro (alqotel) } else { 1173*1700f2bfSLucas Mateus Castro (alqotel) t->s128 = a->s128; /* Undefined behavior */ 1174*1700f2bfSLucas Mateus Castro (alqotel) } 1175*1700f2bfSLucas Mateus Castro (alqotel) } 1176*1700f2bfSLucas Mateus Castro (alqotel) 1177*1700f2bfSLucas Mateus Castro (alqotel) void helper_VDIVUQ(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b) 1178*1700f2bfSLucas Mateus Castro (alqotel) { 1179*1700f2bfSLucas Mateus Castro (alqotel) if (int128_nz(b->s128)) { 1180*1700f2bfSLucas Mateus Castro (alqotel) t->s128 = int128_divu(a->s128, b->s128); 1181*1700f2bfSLucas Mateus Castro (alqotel) } else { 1182*1700f2bfSLucas Mateus Castro (alqotel) t->s128 = a->s128; /* Undefined behavior */ 1183*1700f2bfSLucas Mateus Castro (alqotel) } 1184*1700f2bfSLucas Mateus Castro (alqotel) } 1185*1700f2bfSLucas Mateus Castro (alqotel) 118628347fe2SMatheus Ferst void helper_VPERM(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1187fcf5ef2aSThomas Huth { 1188fcf5ef2aSThomas Huth ppc_avr_t result; 1189fcf5ef2aSThomas Huth int i; 1190fcf5ef2aSThomas Huth 119160594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 119260594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1193fcf5ef2aSThomas Huth int index = s & 0xf; 1194fcf5ef2aSThomas Huth 1195fcf5ef2aSThomas Huth if (s & 0x10) { 119660594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1197fcf5ef2aSThomas Huth } else { 119860594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1199fcf5ef2aSThomas Huth } 1200fcf5ef2aSThomas Huth } 1201fcf5ef2aSThomas Huth *r = result; 1202fcf5ef2aSThomas Huth } 1203fcf5ef2aSThomas Huth 120428347fe2SMatheus Ferst void helper_VPERMR(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1205fcf5ef2aSThomas Huth { 1206fcf5ef2aSThomas Huth ppc_avr_t result; 1207fcf5ef2aSThomas Huth int i; 1208fcf5ef2aSThomas Huth 120960594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 121060594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1211fcf5ef2aSThomas Huth int index = 15 - (s & 0xf); 1212fcf5ef2aSThomas Huth 1213fcf5ef2aSThomas Huth if (s & 0x10) { 121460594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1215fcf5ef2aSThomas Huth } else { 121660594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1217fcf5ef2aSThomas Huth } 1218fcf5ef2aSThomas Huth } 1219fcf5ef2aSThomas Huth *r = result; 1220fcf5ef2aSThomas Huth } 1221fcf5ef2aSThomas Huth 1222618574ddSMatheus Ferst #define XXGENPCV_BE_EXP(NAME, SZ) \ 1223b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _be_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \ 1224b090f4f1SMatheus Ferst { \ 1225b090f4f1SMatheus Ferst ppc_vsr_t tmp; \ 1226b090f4f1SMatheus Ferst \ 1227b090f4f1SMatheus Ferst /* Initialize tmp with the result of an all-zeros mask */ \ 1228b090f4f1SMatheus Ferst tmp.VsrD(0) = 0x1011121314151617; \ 1229b090f4f1SMatheus Ferst tmp.VsrD(1) = 0x18191A1B1C1D1E1F; \ 1230b090f4f1SMatheus Ferst \ 1231b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1232b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1233b090f4f1SMatheus Ferst if (b->VsrB(i) & 0x80) { \ 1234b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1235b090f4f1SMatheus Ferst for (int k = 0; k < SZ; k++) { \ 1236b090f4f1SMatheus Ferst tmp.VsrB(i + k) = j + k; \ 1237b090f4f1SMatheus Ferst } \ 1238b090f4f1SMatheus Ferst j += SZ; \ 1239b090f4f1SMatheus Ferst } \ 1240b090f4f1SMatheus Ferst } \ 1241b090f4f1SMatheus Ferst \ 1242b090f4f1SMatheus Ferst *t = tmp; \ 1243618574ddSMatheus Ferst } 1244618574ddSMatheus Ferst 1245618574ddSMatheus Ferst #define XXGENPCV_BE_COMP(NAME, SZ) \ 1246b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _be_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\ 1247b090f4f1SMatheus Ferst { \ 1248b090f4f1SMatheus Ferst ppc_vsr_t tmp = { .u64 = { 0, 0 } }; \ 1249b090f4f1SMatheus Ferst \ 1250b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1251b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1252b090f4f1SMatheus Ferst if (b->VsrB(i) & 0x80) { \ 1253b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1254b090f4f1SMatheus Ferst for (int k = 0; k < SZ; k++) { \ 1255b090f4f1SMatheus Ferst tmp.VsrB(j + k) = i + k; \ 1256b090f4f1SMatheus Ferst } \ 1257b090f4f1SMatheus Ferst j += SZ; \ 1258b090f4f1SMatheus Ferst } \ 1259b090f4f1SMatheus Ferst } \ 1260b090f4f1SMatheus Ferst \ 1261b090f4f1SMatheus Ferst *t = tmp; \ 1262618574ddSMatheus Ferst } 1263618574ddSMatheus Ferst 1264618574ddSMatheus Ferst #define XXGENPCV_LE_EXP(NAME, SZ) \ 1265b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _le_exp))(ppc_vsr_t *t, ppc_vsr_t *b) \ 1266b090f4f1SMatheus Ferst { \ 1267b090f4f1SMatheus Ferst ppc_vsr_t tmp; \ 1268b090f4f1SMatheus Ferst \ 1269b090f4f1SMatheus Ferst /* Initialize tmp with the result of an all-zeros mask */ \ 1270b090f4f1SMatheus Ferst tmp.VsrD(0) = 0x1F1E1D1C1B1A1918; \ 1271b090f4f1SMatheus Ferst tmp.VsrD(1) = 0x1716151413121110; \ 1272b090f4f1SMatheus Ferst \ 1273b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1274b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1275b090f4f1SMatheus Ferst /* Reverse indexing of "i" */ \ 1276b090f4f1SMatheus Ferst const int idx = ARRAY_SIZE(b->u8) - i - SZ; \ 1277b090f4f1SMatheus Ferst if (b->VsrB(idx) & 0x80) { \ 1278b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1279b090f4f1SMatheus Ferst for (int k = 0, rk = SZ - 1; k < SZ; k++, rk--) { \ 1280b090f4f1SMatheus Ferst tmp.VsrB(idx + rk) = j + k; \ 1281b090f4f1SMatheus Ferst } \ 1282b090f4f1SMatheus Ferst j += SZ; \ 1283b090f4f1SMatheus Ferst } \ 1284b090f4f1SMatheus Ferst } \ 1285b090f4f1SMatheus Ferst \ 1286b090f4f1SMatheus Ferst *t = tmp; \ 1287618574ddSMatheus Ferst } 1288618574ddSMatheus Ferst 1289618574ddSMatheus Ferst #define XXGENPCV_LE_COMP(NAME, SZ) \ 1290b090f4f1SMatheus Ferst void glue(helper_, glue(NAME, _le_comp))(ppc_vsr_t *t, ppc_vsr_t *b)\ 1291b090f4f1SMatheus Ferst { \ 1292b090f4f1SMatheus Ferst ppc_vsr_t tmp = { .u64 = { 0, 0 } }; \ 1293b090f4f1SMatheus Ferst \ 1294b090f4f1SMatheus Ferst /* Iterate over the most significant byte of each element */ \ 1295b090f4f1SMatheus Ferst for (int i = 0, j = 0; i < ARRAY_SIZE(b->u8); i += SZ) { \ 1296b090f4f1SMatheus Ferst if (b->VsrB(ARRAY_SIZE(b->u8) - i - SZ) & 0x80) { \ 1297b090f4f1SMatheus Ferst /* Update each byte of the element */ \ 1298b090f4f1SMatheus Ferst for (int k = 0, rk = SZ - 1; k < SZ; k++, rk--) { \ 1299b090f4f1SMatheus Ferst /* Reverse indexing of "j" */ \ 1300b090f4f1SMatheus Ferst const int idx = ARRAY_SIZE(b->u8) - j - SZ; \ 1301b090f4f1SMatheus Ferst tmp.VsrB(idx + rk) = i + k; \ 1302b090f4f1SMatheus Ferst } \ 1303b090f4f1SMatheus Ferst j += SZ; \ 1304b090f4f1SMatheus Ferst } \ 1305b090f4f1SMatheus Ferst } \ 1306b090f4f1SMatheus Ferst \ 1307b090f4f1SMatheus Ferst *t = tmp; \ 1308b090f4f1SMatheus Ferst } 1309b090f4f1SMatheus Ferst 1310618574ddSMatheus Ferst #define XXGENPCV(NAME, SZ) \ 1311618574ddSMatheus Ferst XXGENPCV_BE_EXP(NAME, SZ) \ 1312618574ddSMatheus Ferst XXGENPCV_BE_COMP(NAME, SZ) \ 1313618574ddSMatheus Ferst XXGENPCV_LE_EXP(NAME, SZ) \ 1314618574ddSMatheus Ferst XXGENPCV_LE_COMP(NAME, SZ) \ 1315618574ddSMatheus Ferst 1316b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVBM, 1) 1317b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVHM, 2) 1318b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVWM, 4) 1319b090f4f1SMatheus Ferst XXGENPCV(XXGENPCVDM, 8) 1320618574ddSMatheus Ferst 1321618574ddSMatheus Ferst #undef XXGENPCV_BE_EXP 1322618574ddSMatheus Ferst #undef XXGENPCV_BE_COMP 1323618574ddSMatheus Ferst #undef XXGENPCV_LE_EXP 1324618574ddSMatheus Ferst #undef XXGENPCV_LE_COMP 1325b090f4f1SMatheus Ferst #undef XXGENPCV 1326b090f4f1SMatheus Ferst 1327e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1328fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)]) 1329fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (i) 1330fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) != 0) 1331fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) (extract64((avr)->u64[i], index, 1)) 1332fcf5ef2aSThomas Huth #else 1333fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)]) 1334fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (1 - i) 1335fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) == 0) 1336fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) \ 1337fcf5ef2aSThomas Huth (extract64((avr)->u64[1 - i], 63 - index, 1)) 1338fcf5ef2aSThomas Huth #endif 1339fcf5ef2aSThomas Huth 1340fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1341fcf5ef2aSThomas Huth { 1342fcf5ef2aSThomas Huth int i, j; 1343fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 1344fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1345fcf5ef2aSThomas Huth for (j = 0; j < 8; j++) { 1346fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, (i * 8) + j); 1347fcf5ef2aSThomas Huth if (index < 64 && EXTRACT_BIT(a, i, index)) { 1348fcf5ef2aSThomas Huth result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j); 1349fcf5ef2aSThomas Huth } 1350fcf5ef2aSThomas Huth } 1351fcf5ef2aSThomas Huth } 1352fcf5ef2aSThomas Huth *r = result; 1353fcf5ef2aSThomas Huth } 1354fcf5ef2aSThomas Huth 1355fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1356fcf5ef2aSThomas Huth { 1357fcf5ef2aSThomas Huth int i; 1358fcf5ef2aSThomas Huth uint64_t perm = 0; 1359fcf5ef2aSThomas Huth 1360fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1361fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, i); 1362fcf5ef2aSThomas Huth 1363fcf5ef2aSThomas Huth if (index < 128) { 1364fcf5ef2aSThomas Huth uint64_t mask = (1ull << (63 - (index & 0x3F))); 1365fcf5ef2aSThomas Huth if (a->u64[VBPERMQ_DW(index)] & mask) { 1366fcf5ef2aSThomas Huth perm |= (0x8000 >> i); 1367fcf5ef2aSThomas Huth } 1368fcf5ef2aSThomas Huth } 1369fcf5ef2aSThomas Huth } 1370fcf5ef2aSThomas Huth 13713c385a93SMark Cave-Ayland r->VsrD(0) = perm; 13723c385a93SMark Cave-Ayland r->VsrD(1) = 0; 1373fcf5ef2aSThomas Huth } 1374fcf5ef2aSThomas Huth 1375fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX 1376fcf5ef2aSThomas Huth #undef VBPERMQ_DW 1377fcf5ef2aSThomas Huth 1378fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp) \ 1379fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1380fcf5ef2aSThomas Huth { \ 1381fcf5ef2aSThomas Huth int i, j; \ 1382fcf5ef2aSThomas Huth trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])]; \ 1383fcf5ef2aSThomas Huth \ 1384fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, srcfld) { \ 1385fcf5ef2aSThomas Huth prod[i] = 0; \ 1386fcf5ef2aSThomas Huth for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) { \ 1387fcf5ef2aSThomas Huth if (a->srcfld[i] & (1ull << j)) { \ 1388fcf5ef2aSThomas Huth prod[i] ^= ((trgtyp)b->srcfld[i] << j); \ 1389fcf5ef2aSThomas Huth } \ 1390fcf5ef2aSThomas Huth } \ 1391fcf5ef2aSThomas Huth } \ 1392fcf5ef2aSThomas Huth \ 1393fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, trgfld) { \ 1394fcf5ef2aSThomas Huth r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1]; \ 1395fcf5ef2aSThomas Huth } \ 1396fcf5ef2aSThomas Huth } 1397fcf5ef2aSThomas Huth 1398fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t) 1399fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t) 1400fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t) 1401fcf5ef2aSThomas Huth 1402fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1403fcf5ef2aSThomas Huth { 1404fcf5ef2aSThomas Huth 1405fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1406fcf5ef2aSThomas Huth int i, j; 1407fcf5ef2aSThomas Huth __uint128_t prod[2]; 1408fcf5ef2aSThomas Huth 1409fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1410fcf5ef2aSThomas Huth prod[i] = 0; 1411fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1412fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1413fcf5ef2aSThomas Huth prod[i] ^= (((__uint128_t)b->u64[i]) << j); 1414fcf5ef2aSThomas Huth } 1415fcf5ef2aSThomas Huth } 1416fcf5ef2aSThomas Huth } 1417fcf5ef2aSThomas Huth 1418fcf5ef2aSThomas Huth r->u128 = prod[0] ^ prod[1]; 1419fcf5ef2aSThomas Huth 1420fcf5ef2aSThomas Huth #else 1421fcf5ef2aSThomas Huth int i, j; 1422fcf5ef2aSThomas Huth ppc_avr_t prod[2]; 1423fcf5ef2aSThomas Huth 1424fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 14253c385a93SMark Cave-Ayland prod[i].VsrD(1) = prod[i].VsrD(0) = 0; 1426fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1427fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1428fcf5ef2aSThomas Huth ppc_avr_t bshift; 1429fcf5ef2aSThomas Huth if (j == 0) { 14303c385a93SMark Cave-Ayland bshift.VsrD(0) = 0; 14313c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i]; 1432fcf5ef2aSThomas Huth } else { 14333c385a93SMark Cave-Ayland bshift.VsrD(0) = b->u64[i] >> (64 - j); 14343c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i] << j; 1435fcf5ef2aSThomas Huth } 14363c385a93SMark Cave-Ayland prod[i].VsrD(1) ^= bshift.VsrD(1); 14373c385a93SMark Cave-Ayland prod[i].VsrD(0) ^= bshift.VsrD(0); 1438fcf5ef2aSThomas Huth } 1439fcf5ef2aSThomas Huth } 1440fcf5ef2aSThomas Huth } 1441fcf5ef2aSThomas Huth 14423c385a93SMark Cave-Ayland r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1); 14433c385a93SMark Cave-Ayland r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0); 1444fcf5ef2aSThomas Huth #endif 1445fcf5ef2aSThomas Huth } 1446fcf5ef2aSThomas Huth 1447fcf5ef2aSThomas Huth 1448e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1449fcf5ef2aSThomas Huth #define PKBIG 1 1450fcf5ef2aSThomas Huth #else 1451fcf5ef2aSThomas Huth #define PKBIG 0 1452fcf5ef2aSThomas Huth #endif 1453fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1454fcf5ef2aSThomas Huth { 1455fcf5ef2aSThomas Huth int i, j; 1456fcf5ef2aSThomas Huth ppc_avr_t result; 1457e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1458fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { a, b }; 1459fcf5ef2aSThomas Huth #else 1460fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { b, a }; 1461fcf5ef2aSThomas Huth #endif 1462fcf5ef2aSThomas Huth 1463fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1464fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(j, u32) { 1465fcf5ef2aSThomas Huth uint32_t e = x[i]->u32[j]; 1466fcf5ef2aSThomas Huth 1467fcf5ef2aSThomas Huth result.u16[4 * i + j] = (((e >> 9) & 0xfc00) | 1468fcf5ef2aSThomas Huth ((e >> 6) & 0x3e0) | 1469fcf5ef2aSThomas Huth ((e >> 3) & 0x1f)); 1470fcf5ef2aSThomas Huth } 1471fcf5ef2aSThomas Huth } 1472fcf5ef2aSThomas Huth *r = result; 1473fcf5ef2aSThomas Huth } 1474fcf5ef2aSThomas Huth 1475fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat) \ 1476fcf5ef2aSThomas Huth void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1477fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 1478fcf5ef2aSThomas Huth { \ 1479fcf5ef2aSThomas Huth int i; \ 1480fcf5ef2aSThomas Huth int sat = 0; \ 1481fcf5ef2aSThomas Huth ppc_avr_t result; \ 1482fcf5ef2aSThomas Huth ppc_avr_t *a0 = PKBIG ? a : b; \ 1483fcf5ef2aSThomas Huth ppc_avr_t *a1 = PKBIG ? b : a; \ 1484fcf5ef2aSThomas Huth \ 1485fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, from) { \ 1486fcf5ef2aSThomas Huth result.to[i] = cvt(a0->from[i], &sat); \ 1487fcf5ef2aSThomas Huth result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\ 1488fcf5ef2aSThomas Huth } \ 1489fcf5ef2aSThomas Huth *r = result; \ 1490fcf5ef2aSThomas Huth if (dosat && sat) { \ 14916175f5a0SRichard Henderson set_vscr_sat(env); \ 1492fcf5ef2aSThomas Huth } \ 1493fcf5ef2aSThomas Huth } 1494fcf5ef2aSThomas Huth #define I(x, y) (x) 1495fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1) 1496fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1) 1497fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1) 1498fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1) 1499fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1) 1500fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1) 1501fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1) 1502fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1) 1503fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1) 1504fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0) 1505fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0) 1506fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0) 1507fcf5ef2aSThomas Huth #undef I 1508fcf5ef2aSThomas Huth #undef VPK 1509fcf5ef2aSThomas Huth #undef PKBIG 1510fcf5ef2aSThomas Huth 1511fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1512fcf5ef2aSThomas Huth { 1513fcf5ef2aSThomas Huth int i; 1514fcf5ef2aSThomas Huth 151505ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 151605ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status); 1517fcf5ef2aSThomas Huth } 1518fcf5ef2aSThomas Huth } 1519fcf5ef2aSThomas Huth 1520fcf5ef2aSThomas Huth #define VRFI(suffix, rounding) \ 1521fcf5ef2aSThomas Huth void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1522fcf5ef2aSThomas Huth ppc_avr_t *b) \ 1523fcf5ef2aSThomas Huth { \ 1524fcf5ef2aSThomas Huth int i; \ 1525fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 1526fcf5ef2aSThomas Huth \ 1527fcf5ef2aSThomas Huth set_float_rounding_mode(rounding, &s); \ 152805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 152905ee3e8aSMark Cave-Ayland r->f32[i] = float32_round_to_int (b->f32[i], &s); \ 1530fcf5ef2aSThomas Huth } \ 1531fcf5ef2aSThomas Huth } 1532fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even) 1533fcf5ef2aSThomas Huth VRFI(m, float_round_down) 1534fcf5ef2aSThomas Huth VRFI(p, float_round_up) 1535fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero) 1536fcf5ef2aSThomas Huth #undef VRFI 1537fcf5ef2aSThomas Huth 1538fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1539fcf5ef2aSThomas Huth { 1540fcf5ef2aSThomas Huth int i; 1541fcf5ef2aSThomas Huth 154205ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 154305ee3e8aSMark Cave-Ayland float32 t = float32_sqrt(b->f32[i], &env->vec_status); 1544fcf5ef2aSThomas Huth 154505ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, t, &env->vec_status); 1546fcf5ef2aSThomas Huth } 1547fcf5ef2aSThomas Huth } 1548fcf5ef2aSThomas Huth 1549fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert) \ 155002c74f0eSMatheus Ferst void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \ 1551fcf5ef2aSThomas Huth { \ 1552fcf5ef2aSThomas Huth int i; \ 1553fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1554fcf5ef2aSThomas Huth uint##size##_t src1 = a->element[i]; \ 1555fcf5ef2aSThomas Huth uint##size##_t src2 = b->element[i]; \ 1556fcf5ef2aSThomas Huth uint##size##_t src3 = r->element[i]; \ 1557fcf5ef2aSThomas Huth uint##size##_t begin, end, shift, mask, rot_val; \ 1558fcf5ef2aSThomas Huth \ 1559fcf5ef2aSThomas Huth shift = extract##size(src2, 0, 6); \ 1560fcf5ef2aSThomas Huth end = extract##size(src2, 8, 6); \ 1561fcf5ef2aSThomas Huth begin = extract##size(src2, 16, 6); \ 1562fcf5ef2aSThomas Huth rot_val = rol##size(src1, shift); \ 1563fcf5ef2aSThomas Huth mask = mask_u##size(begin, end); \ 1564fcf5ef2aSThomas Huth if (insert) { \ 1565fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask) | (src3 & ~mask); \ 1566fcf5ef2aSThomas Huth } else { \ 1567fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask); \ 1568fcf5ef2aSThomas Huth } \ 1569fcf5ef2aSThomas Huth } \ 1570fcf5ef2aSThomas Huth } 1571fcf5ef2aSThomas Huth 157202c74f0eSMatheus Ferst VRLMI(VRLDMI, 64, u64, 1); 157302c74f0eSMatheus Ferst VRLMI(VRLWMI, 32, u32, 1); 157402c74f0eSMatheus Ferst VRLMI(VRLDNM, 64, u64, 0); 157502c74f0eSMatheus Ferst VRLMI(VRLWNM, 32, u32, 0); 1576fcf5ef2aSThomas Huth 1577fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1578fcf5ef2aSThomas Huth { 1579fcf5ef2aSThomas Huth int i; 1580fcf5ef2aSThomas Huth 158105ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 158205ee3e8aSMark Cave-Ayland r->f32[i] = float32_exp2(b->f32[i], &env->vec_status); 1583fcf5ef2aSThomas Huth } 1584fcf5ef2aSThomas Huth } 1585fcf5ef2aSThomas Huth 1586fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1587fcf5ef2aSThomas Huth { 1588fcf5ef2aSThomas Huth int i; 1589fcf5ef2aSThomas Huth 159005ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 159105ee3e8aSMark Cave-Ayland r->f32[i] = float32_log2(b->f32[i], &env->vec_status); 1592fcf5ef2aSThomas Huth } 1593fcf5ef2aSThomas Huth } 1594fcf5ef2aSThomas Huth 159560caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 159660caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 159760caf221SAvinesh Kumar { \ 1598f297c4c6SMatheus Ferst int index = (a & 0xf) * 8; \ 159960caf221SAvinesh Kumar if (left) { \ 1600f297c4c6SMatheus Ferst index = 128 - index - size; \ 160160caf221SAvinesh Kumar } \ 160260caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 160360caf221SAvinesh Kumar MAKE_64BIT_MASK(0, size); \ 160460caf221SAvinesh Kumar } 160560caf221SAvinesh Kumar VEXTU_X_DO(vextublx, 8, 1) 160660caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1) 160760caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1) 160860caf221SAvinesh Kumar VEXTU_X_DO(vextubrx, 8, 0) 160960caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0) 161060caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0) 161160caf221SAvinesh Kumar #undef VEXTU_X_DO 161260caf221SAvinesh Kumar 1613fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1614fcf5ef2aSThomas Huth { 1615fcf5ef2aSThomas Huth int i; 1616fcf5ef2aSThomas Huth unsigned int shift, bytes, size; 1617fcf5ef2aSThomas Huth 1618fcf5ef2aSThomas Huth size = ARRAY_SIZE(r->u8); 1619fcf5ef2aSThomas Huth for (i = 0; i < size; i++) { 162063be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 162163be02fcSAnton Blanchard bytes = (a->VsrB(i) << 8) + /* extract adjacent bytes */ 162263be02fcSAnton Blanchard (((i + 1) < size) ? a->VsrB(i + 1) : 0); 162363be02fcSAnton Blanchard r->VsrB(i) = (bytes << shift) >> 8; /* shift and store result */ 1624fcf5ef2aSThomas Huth } 1625fcf5ef2aSThomas Huth } 1626fcf5ef2aSThomas Huth 1627fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1628fcf5ef2aSThomas Huth { 1629fcf5ef2aSThomas Huth int i; 1630fcf5ef2aSThomas Huth unsigned int shift, bytes; 1631fcf5ef2aSThomas Huth 1632b6cb41b2SDavid Gibson /* 1633b6cb41b2SDavid Gibson * Use reverse order, as destination and source register can be 1634b6cb41b2SDavid Gibson * same. Its being modified in place saving temporary, reverse 1635b6cb41b2SDavid Gibson * order will guarantee that computed result is not fed back. 1636fcf5ef2aSThomas Huth */ 1637fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 163863be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 163963be02fcSAnton Blanchard bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i); 1640fcf5ef2aSThomas Huth /* extract adjacent bytes */ 164163be02fcSAnton Blanchard r->VsrB(i) = (bytes >> shift) & 0xFF; /* shift and store result */ 1642fcf5ef2aSThomas Huth } 1643fcf5ef2aSThomas Huth } 1644fcf5ef2aSThomas Huth 1645fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift) 1646fcf5ef2aSThomas Huth { 1647fcf5ef2aSThomas Huth int sh = shift & 0xf; 1648fcf5ef2aSThomas Huth int i; 1649fcf5ef2aSThomas Huth ppc_avr_t result; 1650fcf5ef2aSThomas Huth 1651fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1652fcf5ef2aSThomas Huth int index = sh + i; 1653fcf5ef2aSThomas Huth if (index > 0xf) { 165460594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index - 0x10); 1655fcf5ef2aSThomas Huth } else { 165660594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1657fcf5ef2aSThomas Huth } 1658fcf5ef2aSThomas Huth } 1659fcf5ef2aSThomas Huth *r = result; 1660fcf5ef2aSThomas Huth } 1661fcf5ef2aSThomas Huth 1662fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1663fcf5ef2aSThomas Huth { 16643c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1665fcf5ef2aSThomas Huth 1666e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1667fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1668fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1669fcf5ef2aSThomas Huth #else 1670fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1671fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1672fcf5ef2aSThomas Huth #endif 1673fcf5ef2aSThomas Huth } 1674fcf5ef2aSThomas Huth 1675e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 16762cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[IDX]) 16772cc12af3SMatheus Ferst #else 16782cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[15 - (IDX)] - (SIZE) + 1) 16792cc12af3SMatheus Ferst #endif 16802cc12af3SMatheus Ferst 16812cc12af3SMatheus Ferst #define VINSX(SUFFIX, TYPE) \ 16822cc12af3SMatheus Ferst void glue(glue(helper_VINS, SUFFIX), LX)(CPUPPCState *env, ppc_avr_t *t, \ 16832cc12af3SMatheus Ferst uint64_t val, target_ulong index) \ 16842cc12af3SMatheus Ferst { \ 16852cc12af3SMatheus Ferst const int maxidx = ARRAY_SIZE(t->u8) - sizeof(TYPE); \ 16862cc12af3SMatheus Ferst target_long idx = index; \ 16872cc12af3SMatheus Ferst \ 16882cc12af3SMatheus Ferst if (idx < 0 || idx > maxidx) { \ 16892cc12af3SMatheus Ferst idx = idx < 0 ? sizeof(TYPE) - idx : idx; \ 16902cc12af3SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, \ 16912cc12af3SMatheus Ferst "Invalid index for Vector Insert Element after 0x" TARGET_FMT_lx \ 16922cc12af3SMatheus Ferst ", RA = " TARGET_FMT_ld " > %d\n", env->nip, idx, maxidx); \ 16932cc12af3SMatheus Ferst } else { \ 16942cc12af3SMatheus Ferst TYPE src = val; \ 16952cc12af3SMatheus Ferst memcpy(ELEM_ADDR(t, idx, sizeof(TYPE)), &src, sizeof(TYPE)); \ 16962cc12af3SMatheus Ferst } \ 16972cc12af3SMatheus Ferst } 16982cc12af3SMatheus Ferst VINSX(B, uint8_t) 16992cc12af3SMatheus Ferst VINSX(H, uint16_t) 17002cc12af3SMatheus Ferst VINSX(W, uint32_t) 17012cc12af3SMatheus Ferst VINSX(D, uint64_t) 17022cc12af3SMatheus Ferst #undef ELEM_ADDR 17032cc12af3SMatheus Ferst #undef VINSX 1704e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 170528110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \ 170628110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 170728110b72SMatheus Ferst target_ulong index) \ 170828110b72SMatheus Ferst { \ 170928110b72SMatheus Ferst const target_long idx = index; \ 171028110b72SMatheus Ferst ppc_avr_t tmp[2] = { *a, *b }; \ 171128110b72SMatheus Ferst memset(t, 0, sizeof(*t)); \ 171228110b72SMatheus Ferst if (idx >= 0 && idx + SIZE <= sizeof(tmp)) { \ 171328110b72SMatheus Ferst memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2 - SIZE], (void *)tmp + idx, SIZE); \ 171428110b72SMatheus Ferst } else { \ 171528110b72SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x" \ 171628110b72SMatheus Ferst TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n", \ 171728110b72SMatheus Ferst env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE); \ 171828110b72SMatheus Ferst } \ 171928110b72SMatheus Ferst } 172028110b72SMatheus Ferst #else 172128110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \ 172228110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 172328110b72SMatheus Ferst target_ulong index) \ 172428110b72SMatheus Ferst { \ 172528110b72SMatheus Ferst const target_long idx = index; \ 172628110b72SMatheus Ferst ppc_avr_t tmp[2] = { *b, *a }; \ 172728110b72SMatheus Ferst memset(t, 0, sizeof(*t)); \ 172828110b72SMatheus Ferst if (idx >= 0 && idx + SIZE <= sizeof(tmp)) { \ 172928110b72SMatheus Ferst memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2], \ 173028110b72SMatheus Ferst (void *)tmp + sizeof(tmp) - SIZE - idx, SIZE); \ 173128110b72SMatheus Ferst } else { \ 173228110b72SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x" \ 173328110b72SMatheus Ferst TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n", \ 173428110b72SMatheus Ferst env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE); \ 173528110b72SMatheus Ferst } \ 173628110b72SMatheus Ferst } 173728110b72SMatheus Ferst #endif 173828110b72SMatheus Ferst VEXTDVLX(VEXTDUBVLX, 1) 173928110b72SMatheus Ferst VEXTDVLX(VEXTDUHVLX, 2) 174028110b72SMatheus Ferst VEXTDVLX(VEXTDUWVLX, 4) 174128110b72SMatheus Ferst VEXTDVLX(VEXTDDVLX, 8) 174228110b72SMatheus Ferst #undef VEXTDVLX 1743e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1744fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1745fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1746fcf5ef2aSThomas Huth { \ 1747fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1748fcf5ef2aSThomas Huth memmove(&r->u8[8 - es], &b->u8[index], es); \ 1749fcf5ef2aSThomas Huth memset(&r->u8[8], 0, 8); \ 1750fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8 - es); \ 1751fcf5ef2aSThomas Huth } 1752fcf5ef2aSThomas Huth #else 1753fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1754fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1755fcf5ef2aSThomas Huth { \ 1756fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1757fcf5ef2aSThomas Huth uint32_t s = (16 - index) - es; \ 1758fcf5ef2aSThomas Huth memmove(&r->u8[8], &b->u8[s], es); \ 1759fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8); \ 1760fcf5ef2aSThomas Huth memset(&r->u8[8 + es], 0, 8 - es); \ 1761fcf5ef2aSThomas Huth } 1762fcf5ef2aSThomas Huth #endif 1763fcf5ef2aSThomas Huth VEXTRACT(ub, u8) 1764fcf5ef2aSThomas Huth VEXTRACT(uh, u16) 1765fcf5ef2aSThomas Huth VEXTRACT(uw, u32) 1766fcf5ef2aSThomas Huth VEXTRACT(d, u64) 1767fcf5ef2aSThomas Huth #undef VEXTRACT 1768fcf5ef2aSThomas Huth 1769fb5303ccSMatheus Ferst #define VSTRI(NAME, ELEM, NUM_ELEMS, LEFT) \ 1770fb5303ccSMatheus Ferst uint32_t helper_##NAME(ppc_avr_t *t, ppc_avr_t *b) \ 1771fb5303ccSMatheus Ferst { \ 1772fb5303ccSMatheus Ferst int i, idx, crf = 0; \ 1773fb5303ccSMatheus Ferst \ 1774fb5303ccSMatheus Ferst for (i = 0; i < NUM_ELEMS; i++) { \ 1775fb5303ccSMatheus Ferst idx = LEFT ? i : NUM_ELEMS - i - 1; \ 1776fb5303ccSMatheus Ferst if (b->Vsr##ELEM(idx)) { \ 1777fb5303ccSMatheus Ferst t->Vsr##ELEM(idx) = b->Vsr##ELEM(idx); \ 1778fb5303ccSMatheus Ferst } else { \ 1779fb5303ccSMatheus Ferst crf = 0b0010; \ 1780fb5303ccSMatheus Ferst break; \ 1781fb5303ccSMatheus Ferst } \ 1782fb5303ccSMatheus Ferst } \ 1783fb5303ccSMatheus Ferst \ 1784fb5303ccSMatheus Ferst for (; i < NUM_ELEMS; i++) { \ 1785fb5303ccSMatheus Ferst idx = LEFT ? i : NUM_ELEMS - i - 1; \ 1786fb5303ccSMatheus Ferst t->Vsr##ELEM(idx) = 0; \ 1787fb5303ccSMatheus Ferst } \ 1788fb5303ccSMatheus Ferst \ 1789fb5303ccSMatheus Ferst return crf; \ 1790fb5303ccSMatheus Ferst } 1791fb5303ccSMatheus Ferst VSTRI(VSTRIBL, B, 16, true) 1792fb5303ccSMatheus Ferst VSTRI(VSTRIBR, B, 16, false) 1793fb5303ccSMatheus Ferst VSTRI(VSTRIHL, H, 8, true) 1794fb5303ccSMatheus Ferst VSTRI(VSTRIHR, H, 8, false) 1795fb5303ccSMatheus Ferst #undef VSTRI 1796fb5303ccSMatheus Ferst 17978f5eeee3SMatheus Ferst void helper_XXEXTRACTUW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index) 17988ad901e5SNikunj A Dadhania { 179903b32c09SMark Cave-Ayland ppc_vsr_t t = { }; 18008ad901e5SNikunj A Dadhania size_t es = sizeof(uint32_t); 18018ad901e5SNikunj A Dadhania uint32_t ext_index; 18028ad901e5SNikunj A Dadhania int i; 18038ad901e5SNikunj A Dadhania 18048ad901e5SNikunj A Dadhania ext_index = index; 18058ad901e5SNikunj A Dadhania for (i = 0; i < es; i++, ext_index++) { 180603b32c09SMark Cave-Ayland t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16); 18078ad901e5SNikunj A Dadhania } 18088ad901e5SNikunj A Dadhania 180903b32c09SMark Cave-Ayland *xt = t; 18108ad901e5SNikunj A Dadhania } 18118ad901e5SNikunj A Dadhania 18128f5eeee3SMatheus Ferst void helper_XXINSERTW(ppc_vsr_t *xt, ppc_vsr_t *xb, uint32_t index) 18133398b742SNikunj A Dadhania { 181403b32c09SMark Cave-Ayland ppc_vsr_t t = *xt; 18153398b742SNikunj A Dadhania size_t es = sizeof(uint32_t); 18163398b742SNikunj A Dadhania int ins_index, i = 0; 18173398b742SNikunj A Dadhania 18183398b742SNikunj A Dadhania ins_index = index; 18193398b742SNikunj A Dadhania for (i = 0; i < es && ins_index < 16; i++, ins_index++) { 182003b32c09SMark Cave-Ayland t.VsrB(ins_index) = xb->VsrB(8 - es + i); 18213398b742SNikunj A Dadhania } 18223398b742SNikunj A Dadhania 182303b32c09SMark Cave-Ayland *xt = t; 18243398b742SNikunj A Dadhania } 18253398b742SNikunj A Dadhania 18261015fcabSMatheus Ferst void helper_XXEVAL(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c, 18271015fcabSMatheus Ferst uint32_t desc) 18281015fcabSMatheus Ferst { 18291015fcabSMatheus Ferst /* 18301015fcabSMatheus Ferst * Instead of processing imm bit-by-bit, we'll skip the computation of 18311015fcabSMatheus Ferst * conjunctions whose corresponding bit is unset. 18321015fcabSMatheus Ferst */ 18331015fcabSMatheus Ferst int bit, imm = simd_data(desc); 18341015fcabSMatheus Ferst Int128 conj, disj = int128_zero(); 18351015fcabSMatheus Ferst 18361015fcabSMatheus Ferst /* Iterate over set bits from the least to the most significant bit */ 18371015fcabSMatheus Ferst while (imm) { 18381015fcabSMatheus Ferst /* 18391015fcabSMatheus Ferst * Get the next bit to be processed with ctz64. Invert the result of 18401015fcabSMatheus Ferst * ctz64 to match the indexing used by PowerISA. 18411015fcabSMatheus Ferst */ 18421015fcabSMatheus Ferst bit = 7 - ctzl(imm); 18431015fcabSMatheus Ferst if (bit & 0x4) { 18441015fcabSMatheus Ferst conj = a->s128; 18451015fcabSMatheus Ferst } else { 18461015fcabSMatheus Ferst conj = int128_not(a->s128); 18471015fcabSMatheus Ferst } 18481015fcabSMatheus Ferst if (bit & 0x2) { 18491015fcabSMatheus Ferst conj = int128_and(conj, b->s128); 18501015fcabSMatheus Ferst } else { 18511015fcabSMatheus Ferst conj = int128_and(conj, int128_not(b->s128)); 18521015fcabSMatheus Ferst } 18531015fcabSMatheus Ferst if (bit & 0x1) { 18541015fcabSMatheus Ferst conj = int128_and(conj, c->s128); 18551015fcabSMatheus Ferst } else { 18561015fcabSMatheus Ferst conj = int128_and(conj, int128_not(c->s128)); 18571015fcabSMatheus Ferst } 18581015fcabSMatheus Ferst disj = int128_or(disj, conj); 18591015fcabSMatheus Ferst 18601015fcabSMatheus Ferst /* Unset the least significant bit that is set */ 18611015fcabSMatheus Ferst imm &= imm - 1; 18621015fcabSMatheus Ferst } 18631015fcabSMatheus Ferst 18641015fcabSMatheus Ferst t->s128 = disj; 18651015fcabSMatheus Ferst } 18661015fcabSMatheus Ferst 1867788c6399SMatheus Ferst #define XXBLEND(name, sz) \ 1868788c6399SMatheus Ferst void glue(helper_XXBLENDV, name)(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 1869788c6399SMatheus Ferst ppc_avr_t *c, uint32_t desc) \ 1870788c6399SMatheus Ferst { \ 1871788c6399SMatheus Ferst for (int i = 0; i < ARRAY_SIZE(t->glue(u, sz)); i++) { \ 1872788c6399SMatheus Ferst t->glue(u, sz)[i] = (c->glue(s, sz)[i] >> (sz - 1)) ? \ 1873788c6399SMatheus Ferst b->glue(u, sz)[i] : a->glue(u, sz)[i]; \ 1874788c6399SMatheus Ferst } \ 1875788c6399SMatheus Ferst } 1876788c6399SMatheus Ferst XXBLEND(B, 8) 1877788c6399SMatheus Ferst XXBLEND(H, 16) 1878788c6399SMatheus Ferst XXBLEND(W, 32) 1879788c6399SMatheus Ferst XXBLEND(D, 64) 1880788c6399SMatheus Ferst #undef XXBLEND 1881788c6399SMatheus Ferst 1882fcf5ef2aSThomas Huth #define VNEG(name, element) \ 1883fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 1884fcf5ef2aSThomas Huth { \ 1885fcf5ef2aSThomas Huth int i; \ 188660594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1887fcf5ef2aSThomas Huth r->element[i] = -b->element[i]; \ 1888fcf5ef2aSThomas Huth } \ 1889fcf5ef2aSThomas Huth } 1890fcf5ef2aSThomas Huth VNEG(vnegw, s32) 1891fcf5ef2aSThomas Huth VNEG(vnegd, s64) 1892fcf5ef2aSThomas Huth #undef VNEG 1893fcf5ef2aSThomas Huth 1894fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1895fcf5ef2aSThomas Huth { 18963c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1897fcf5ef2aSThomas Huth 1898e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 1899fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1900fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1901fcf5ef2aSThomas Huth #else 1902fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1903fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1904fcf5ef2aSThomas Huth #endif 1905fcf5ef2aSThomas Huth } 1906fcf5ef2aSThomas Huth 1907fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1908fcf5ef2aSThomas Huth { 1909fcf5ef2aSThomas Huth int i; 1910fcf5ef2aSThomas Huth 1911fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 1912fcf5ef2aSThomas Huth r->u32[i] = a->u32[i] >= b->u32[i]; 1913fcf5ef2aSThomas Huth } 1914fcf5ef2aSThomas Huth } 1915fcf5ef2aSThomas Huth 1916fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1917fcf5ef2aSThomas Huth { 1918fcf5ef2aSThomas Huth int64_t t; 1919fcf5ef2aSThomas Huth int i, upper; 1920fcf5ef2aSThomas Huth ppc_avr_t result; 1921fcf5ef2aSThomas Huth int sat = 0; 1922fcf5ef2aSThomas Huth 1923fcf5ef2aSThomas Huth upper = ARRAY_SIZE(r->s32) - 1; 192460594feaSMark Cave-Ayland t = (int64_t)b->VsrSW(upper); 1925fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 192660594feaSMark Cave-Ayland t += a->VsrSW(i); 192760594feaSMark Cave-Ayland result.VsrSW(i) = 0; 1928fcf5ef2aSThomas Huth } 192960594feaSMark Cave-Ayland result.VsrSW(upper) = cvtsdsw(t, &sat); 1930fcf5ef2aSThomas Huth *r = result; 1931fcf5ef2aSThomas Huth 1932fcf5ef2aSThomas Huth if (sat) { 19336175f5a0SRichard Henderson set_vscr_sat(env); 1934fcf5ef2aSThomas Huth } 1935fcf5ef2aSThomas Huth } 1936fcf5ef2aSThomas Huth 1937fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1938fcf5ef2aSThomas Huth { 1939fcf5ef2aSThomas Huth int i, j, upper; 1940fcf5ef2aSThomas Huth ppc_avr_t result; 1941fcf5ef2aSThomas Huth int sat = 0; 1942fcf5ef2aSThomas Huth 1943fcf5ef2aSThomas Huth upper = 1; 1944fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 194560594feaSMark Cave-Ayland int64_t t = (int64_t)b->VsrSW(upper + i * 2); 1946fcf5ef2aSThomas Huth 19477fa0ddc1SAnton Blanchard result.VsrD(i) = 0; 1948fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u64); j++) { 194960594feaSMark Cave-Ayland t += a->VsrSW(2 * i + j); 1950fcf5ef2aSThomas Huth } 195160594feaSMark Cave-Ayland result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat); 1952fcf5ef2aSThomas Huth } 1953fcf5ef2aSThomas Huth 1954fcf5ef2aSThomas Huth *r = result; 1955fcf5ef2aSThomas Huth if (sat) { 19566175f5a0SRichard Henderson set_vscr_sat(env); 1957fcf5ef2aSThomas Huth } 1958fcf5ef2aSThomas Huth } 1959fcf5ef2aSThomas Huth 1960fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1961fcf5ef2aSThomas Huth { 1962fcf5ef2aSThomas Huth int i, j; 1963fcf5ef2aSThomas Huth int sat = 0; 1964fcf5ef2aSThomas Huth 1965fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1966fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1967fcf5ef2aSThomas Huth 1968fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->s32); j++) { 1969fcf5ef2aSThomas Huth t += a->s8[4 * i + j]; 1970fcf5ef2aSThomas Huth } 1971fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1972fcf5ef2aSThomas Huth } 1973fcf5ef2aSThomas Huth 1974fcf5ef2aSThomas Huth if (sat) { 19756175f5a0SRichard Henderson set_vscr_sat(env); 1976fcf5ef2aSThomas Huth } 1977fcf5ef2aSThomas Huth } 1978fcf5ef2aSThomas Huth 1979fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1980fcf5ef2aSThomas Huth { 1981fcf5ef2aSThomas Huth int sat = 0; 1982fcf5ef2aSThomas Huth int i; 1983fcf5ef2aSThomas Huth 1984fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1985fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1986fcf5ef2aSThomas Huth 1987fcf5ef2aSThomas Huth t += a->s16[2 * i] + a->s16[2 * i + 1]; 1988fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1989fcf5ef2aSThomas Huth } 1990fcf5ef2aSThomas Huth 1991fcf5ef2aSThomas Huth if (sat) { 19926175f5a0SRichard Henderson set_vscr_sat(env); 1993fcf5ef2aSThomas Huth } 1994fcf5ef2aSThomas Huth } 1995fcf5ef2aSThomas Huth 1996fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1997fcf5ef2aSThomas Huth { 1998fcf5ef2aSThomas Huth int i, j; 1999fcf5ef2aSThomas Huth int sat = 0; 2000fcf5ef2aSThomas Huth 2001fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 2002fcf5ef2aSThomas Huth uint64_t t = (uint64_t)b->u32[i]; 2003fcf5ef2aSThomas Huth 2004fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u32); j++) { 2005fcf5ef2aSThomas Huth t += a->u8[4 * i + j]; 2006fcf5ef2aSThomas Huth } 2007fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 2008fcf5ef2aSThomas Huth } 2009fcf5ef2aSThomas Huth 2010fcf5ef2aSThomas Huth if (sat) { 20116175f5a0SRichard Henderson set_vscr_sat(env); 2012fcf5ef2aSThomas Huth } 2013fcf5ef2aSThomas Huth } 2014fcf5ef2aSThomas Huth 2015e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 2016fcf5ef2aSThomas Huth #define UPKHI 1 2017fcf5ef2aSThomas Huth #define UPKLO 0 2018fcf5ef2aSThomas Huth #else 2019fcf5ef2aSThomas Huth #define UPKHI 0 2020fcf5ef2aSThomas Huth #define UPKLO 1 2021fcf5ef2aSThomas Huth #endif 2022fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi) \ 2023fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 2024fcf5ef2aSThomas Huth { \ 2025fcf5ef2aSThomas Huth int i; \ 2026fcf5ef2aSThomas Huth ppc_avr_t result; \ 2027fcf5ef2aSThomas Huth \ 2028fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { \ 2029fcf5ef2aSThomas Huth uint16_t e = b->u16[hi ? i : i + 4]; \ 2030fcf5ef2aSThomas Huth uint8_t a = (e >> 15) ? 0xff : 0; \ 2031fcf5ef2aSThomas Huth uint8_t r = (e >> 10) & 0x1f; \ 2032fcf5ef2aSThomas Huth uint8_t g = (e >> 5) & 0x1f; \ 2033fcf5ef2aSThomas Huth uint8_t b = e & 0x1f; \ 2034fcf5ef2aSThomas Huth \ 2035fcf5ef2aSThomas Huth result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b; \ 2036fcf5ef2aSThomas Huth } \ 2037fcf5ef2aSThomas Huth *r = result; \ 2038fcf5ef2aSThomas Huth } 2039fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO) 2040fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI) 2041fcf5ef2aSThomas Huth #undef VUPKPX 2042fcf5ef2aSThomas Huth 2043fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi) \ 2044fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 2045fcf5ef2aSThomas Huth { \ 2046fcf5ef2aSThomas Huth int i; \ 2047fcf5ef2aSThomas Huth ppc_avr_t result; \ 2048fcf5ef2aSThomas Huth \ 2049fcf5ef2aSThomas Huth if (hi) { \ 2050fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) { \ 2051fcf5ef2aSThomas Huth result.unpacked[i] = b->packee[i]; \ 2052fcf5ef2aSThomas Huth } \ 2053fcf5ef2aSThomas Huth } else { \ 2054fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \ 2055fcf5ef2aSThomas Huth i++) { \ 2056fcf5ef2aSThomas Huth result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \ 2057fcf5ef2aSThomas Huth } \ 2058fcf5ef2aSThomas Huth } \ 2059fcf5ef2aSThomas Huth *r = result; \ 2060fcf5ef2aSThomas Huth } 2061fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI) 2062fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI) 2063fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI) 2064fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO) 2065fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO) 2066fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO) 2067fcf5ef2aSThomas Huth #undef VUPK 2068fcf5ef2aSThomas Huth #undef UPKHI 2069fcf5ef2aSThomas Huth #undef UPKLO 2070fcf5ef2aSThomas Huth 2071fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element) \ 2072fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *b) \ 2073fcf5ef2aSThomas Huth { \ 2074fcf5ef2aSThomas Huth int i; \ 2075fcf5ef2aSThomas Huth \ 207660594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 2077fcf5ef2aSThomas Huth r->element[i] = name(b->element[i]); \ 2078fcf5ef2aSThomas Huth } \ 2079fcf5ef2aSThomas Huth } 2080fcf5ef2aSThomas Huth 2081fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8) 2082fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16) 2083fcf5ef2aSThomas Huth 2084fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8) 2085fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16) 2086fcf5ef2aSThomas Huth 2087fcf5ef2aSThomas Huth #undef clzb 2088fcf5ef2aSThomas Huth #undef clzh 2089fcf5ef2aSThomas Huth 2090fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8) 2091fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16) 2092fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v)) 2093fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v)) 2094fcf5ef2aSThomas Huth 2095fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8) 2096fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16) 2097fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32) 2098fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64) 2099fcf5ef2aSThomas Huth 2100fcf5ef2aSThomas Huth #undef ctzb 2101fcf5ef2aSThomas Huth #undef ctzh 2102fcf5ef2aSThomas Huth #undef ctzw 2103fcf5ef2aSThomas Huth #undef ctzd 2104fcf5ef2aSThomas Huth 2105fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v) 2106fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v) 2107fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v) 2108fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v) 2109fcf5ef2aSThomas Huth 2110fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8) 2111fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16) 2112fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32) 2113fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64) 2114fcf5ef2aSThomas Huth 2115fcf5ef2aSThomas Huth #undef popcntb 2116fcf5ef2aSThomas Huth #undef popcnth 2117fcf5ef2aSThomas Huth #undef popcntw 2118fcf5ef2aSThomas Huth #undef popcntd 2119fcf5ef2aSThomas Huth 2120fcf5ef2aSThomas Huth #undef VGENERIC_DO 2121fcf5ef2aSThomas Huth 2122e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 2123fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 0, 1 } } 2124fcf5ef2aSThomas Huth #else 2125fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 1, 0 } } 2126fcf5ef2aSThomas Huth #endif 2127fcf5ef2aSThomas Huth 2128fcf5ef2aSThomas Huth #ifndef CONFIG_INT128 2129fcf5ef2aSThomas Huth 2130fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a) 2131fcf5ef2aSThomas Huth { 2132fcf5ef2aSThomas Huth t->u64[0] = ~a.u64[0]; 2133fcf5ef2aSThomas Huth t->u64[1] = ~a.u64[1]; 2134fcf5ef2aSThomas Huth } 2135fcf5ef2aSThomas Huth 2136fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b) 2137fcf5ef2aSThomas Huth { 21383c385a93SMark Cave-Ayland if (a.VsrD(0) < b.VsrD(0)) { 2139fcf5ef2aSThomas Huth return -1; 21403c385a93SMark Cave-Ayland } else if (a.VsrD(0) > b.VsrD(0)) { 2141fcf5ef2aSThomas Huth return 1; 21423c385a93SMark Cave-Ayland } else if (a.VsrD(1) < b.VsrD(1)) { 2143fcf5ef2aSThomas Huth return -1; 21443c385a93SMark Cave-Ayland } else if (a.VsrD(1) > b.VsrD(1)) { 2145fcf5ef2aSThomas Huth return 1; 2146fcf5ef2aSThomas Huth } else { 2147fcf5ef2aSThomas Huth return 0; 2148fcf5ef2aSThomas Huth } 2149fcf5ef2aSThomas Huth } 2150fcf5ef2aSThomas Huth 2151fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 2152fcf5ef2aSThomas Huth { 21533c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 21543c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 21553c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 2156fcf5ef2aSThomas Huth } 2157fcf5ef2aSThomas Huth 2158fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 2159fcf5ef2aSThomas Huth { 2160fcf5ef2aSThomas Huth ppc_avr_t not_a; 21613c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 21623c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 21633c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 2164fcf5ef2aSThomas Huth avr_qw_not(¬_a, a); 2165fcf5ef2aSThomas Huth return avr_qw_cmpu(not_a, b) < 0; 2166fcf5ef2aSThomas Huth } 2167fcf5ef2aSThomas Huth 2168fcf5ef2aSThomas Huth #endif 2169fcf5ef2aSThomas Huth 2170fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2171fcf5ef2aSThomas Huth { 2172fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2173fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128; 2174fcf5ef2aSThomas Huth #else 2175fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 2176fcf5ef2aSThomas Huth #endif 2177fcf5ef2aSThomas Huth } 2178fcf5ef2aSThomas Huth 2179fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2180fcf5ef2aSThomas Huth { 2181fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2182fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128 + (c->u128 & 1); 2183fcf5ef2aSThomas Huth #else 2184fcf5ef2aSThomas Huth 21853c385a93SMark Cave-Ayland if (c->VsrD(1) & 1) { 2186fcf5ef2aSThomas Huth ppc_avr_t tmp; 2187fcf5ef2aSThomas Huth 21883c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 21893c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 2190fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 2191fcf5ef2aSThomas Huth avr_qw_add(r, tmp, *b); 2192fcf5ef2aSThomas Huth } else { 2193fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 2194fcf5ef2aSThomas Huth } 2195fcf5ef2aSThomas Huth #endif 2196fcf5ef2aSThomas Huth } 2197fcf5ef2aSThomas Huth 2198fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2199fcf5ef2aSThomas Huth { 2200fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2201fcf5ef2aSThomas Huth r->u128 = (~a->u128 < b->u128); 2202fcf5ef2aSThomas Huth #else 2203fcf5ef2aSThomas Huth ppc_avr_t not_a; 2204fcf5ef2aSThomas Huth 2205fcf5ef2aSThomas Huth avr_qw_not(¬_a, *a); 2206fcf5ef2aSThomas Huth 22073c385a93SMark Cave-Ayland r->VsrD(0) = 0; 22083c385a93SMark Cave-Ayland r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0); 2209fcf5ef2aSThomas Huth #endif 2210fcf5ef2aSThomas Huth } 2211fcf5ef2aSThomas Huth 2212fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2213fcf5ef2aSThomas Huth { 2214fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2215fcf5ef2aSThomas Huth int carry_out = (~a->u128 < b->u128); 2216fcf5ef2aSThomas Huth if (!carry_out && (c->u128 & 1)) { 2217fcf5ef2aSThomas Huth carry_out = ((a->u128 + b->u128 + 1) == 0) && 2218fcf5ef2aSThomas Huth ((a->u128 != 0) || (b->u128 != 0)); 2219fcf5ef2aSThomas Huth } 2220fcf5ef2aSThomas Huth r->u128 = carry_out; 2221fcf5ef2aSThomas Huth #else 2222fcf5ef2aSThomas Huth 22233c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 2224fcf5ef2aSThomas Huth int carry_out = 0; 2225fcf5ef2aSThomas Huth ppc_avr_t tmp; 2226fcf5ef2aSThomas Huth 2227fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, *a, *b); 2228fcf5ef2aSThomas Huth 2229fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2230fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 2231fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, tmp, one); 2232fcf5ef2aSThomas Huth } 22333c385a93SMark Cave-Ayland r->VsrD(0) = 0; 22343c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2235fcf5ef2aSThomas Huth #endif 2236fcf5ef2aSThomas Huth } 2237fcf5ef2aSThomas Huth 2238fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2239fcf5ef2aSThomas Huth { 2240fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2241fcf5ef2aSThomas Huth r->u128 = a->u128 - b->u128; 2242fcf5ef2aSThomas Huth #else 2243fcf5ef2aSThomas Huth ppc_avr_t tmp; 2244fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 2245fcf5ef2aSThomas Huth 2246fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2247fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 2248fcf5ef2aSThomas Huth avr_qw_add(r, tmp, one); 2249fcf5ef2aSThomas Huth #endif 2250fcf5ef2aSThomas Huth } 2251fcf5ef2aSThomas Huth 2252fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2253fcf5ef2aSThomas Huth { 2254fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2255fcf5ef2aSThomas Huth r->u128 = a->u128 + ~b->u128 + (c->u128 & 1); 2256fcf5ef2aSThomas Huth #else 2257fcf5ef2aSThomas Huth ppc_avr_t tmp, sum; 2258fcf5ef2aSThomas Huth 2259fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2260fcf5ef2aSThomas Huth avr_qw_add(&sum, *a, tmp); 2261fcf5ef2aSThomas Huth 22623c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 22633c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 2264fcf5ef2aSThomas Huth avr_qw_add(r, sum, tmp); 2265fcf5ef2aSThomas Huth #endif 2266fcf5ef2aSThomas Huth } 2267fcf5ef2aSThomas Huth 2268fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2269fcf5ef2aSThomas Huth { 2270fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2271fcf5ef2aSThomas Huth r->u128 = (~a->u128 < ~b->u128) || 2272fcf5ef2aSThomas Huth (a->u128 + ~b->u128 == (__uint128_t)-1); 2273fcf5ef2aSThomas Huth #else 2274fcf5ef2aSThomas Huth int carry = (avr_qw_cmpu(*a, *b) > 0); 2275fcf5ef2aSThomas Huth if (!carry) { 2276fcf5ef2aSThomas Huth ppc_avr_t tmp; 2277fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2278fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 22793c385a93SMark Cave-Ayland carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull)); 2280fcf5ef2aSThomas Huth } 22813c385a93SMark Cave-Ayland r->VsrD(0) = 0; 22823c385a93SMark Cave-Ayland r->VsrD(1) = carry; 2283fcf5ef2aSThomas Huth #endif 2284fcf5ef2aSThomas Huth } 2285fcf5ef2aSThomas Huth 2286fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2287fcf5ef2aSThomas Huth { 2288fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2289fcf5ef2aSThomas Huth r->u128 = 2290fcf5ef2aSThomas Huth (~a->u128 < ~b->u128) || 2291fcf5ef2aSThomas Huth ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1)); 2292fcf5ef2aSThomas Huth #else 22933c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 2294fcf5ef2aSThomas Huth int carry_out = (avr_qw_cmpu(*a, *b) > 0); 2295fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2296fcf5ef2aSThomas Huth ppc_avr_t tmp; 2297fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2298fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 22993c385a93SMark Cave-Ayland carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull)); 2300fcf5ef2aSThomas Huth } 2301fcf5ef2aSThomas Huth 23023c385a93SMark Cave-Ayland r->VsrD(0) = 0; 23033c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2304fcf5ef2aSThomas Huth #endif 2305fcf5ef2aSThomas Huth } 2306fcf5ef2aSThomas Huth 2307fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_1 0xC 2308fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_2 0xF 2309fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_1 0xA 2310fcf5ef2aSThomas Huth #define BCD_NEG_PREF 0xD 2311fcf5ef2aSThomas Huth #define BCD_NEG_ALT 0xB 2312fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_2 0xE 2313fcf5ef2aSThomas Huth #define NATIONAL_PLUS 0x2B 2314fcf5ef2aSThomas Huth #define NATIONAL_NEG 0x2D 2315fcf5ef2aSThomas Huth 2316365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) (15 - ((n) / 2)) 2317fcf5ef2aSThomas Huth 2318fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd) 2319fcf5ef2aSThomas Huth { 2320428115c3SMark Cave-Ayland switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) { 2321fcf5ef2aSThomas Huth case BCD_PLUS_PREF_1: 2322fcf5ef2aSThomas Huth case BCD_PLUS_PREF_2: 2323fcf5ef2aSThomas Huth case BCD_PLUS_ALT_1: 2324fcf5ef2aSThomas Huth case BCD_PLUS_ALT_2: 2325fcf5ef2aSThomas Huth { 2326fcf5ef2aSThomas Huth return 1; 2327fcf5ef2aSThomas Huth } 2328fcf5ef2aSThomas Huth 2329fcf5ef2aSThomas Huth case BCD_NEG_PREF: 2330fcf5ef2aSThomas Huth case BCD_NEG_ALT: 2331fcf5ef2aSThomas Huth { 2332fcf5ef2aSThomas Huth return -1; 2333fcf5ef2aSThomas Huth } 2334fcf5ef2aSThomas Huth 2335fcf5ef2aSThomas Huth default: 2336fcf5ef2aSThomas Huth { 2337fcf5ef2aSThomas Huth return 0; 2338fcf5ef2aSThomas Huth } 2339fcf5ef2aSThomas Huth } 2340fcf5ef2aSThomas Huth } 2341fcf5ef2aSThomas Huth 2342fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps) 2343fcf5ef2aSThomas Huth { 2344fcf5ef2aSThomas Huth if (sgn >= 0) { 2345fcf5ef2aSThomas Huth return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2; 2346fcf5ef2aSThomas Huth } else { 2347fcf5ef2aSThomas Huth return BCD_NEG_PREF; 2348fcf5ef2aSThomas Huth } 2349fcf5ef2aSThomas Huth } 2350fcf5ef2aSThomas Huth 2351fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid) 2352fcf5ef2aSThomas Huth { 2353fcf5ef2aSThomas Huth uint8_t result; 2354fcf5ef2aSThomas Huth if (n & 1) { 2355428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4; 2356fcf5ef2aSThomas Huth } else { 2357428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF; 2358fcf5ef2aSThomas Huth } 2359fcf5ef2aSThomas Huth 2360fcf5ef2aSThomas Huth if (unlikely(result > 9)) { 2361fcf5ef2aSThomas Huth *invalid = true; 2362fcf5ef2aSThomas Huth } 2363fcf5ef2aSThomas Huth return result; 2364fcf5ef2aSThomas Huth } 2365fcf5ef2aSThomas Huth 2366fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n) 2367fcf5ef2aSThomas Huth { 2368fcf5ef2aSThomas Huth if (n & 1) { 2369428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F; 2370428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4); 2371fcf5ef2aSThomas Huth } else { 2372428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0; 2373428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= digit; 2374fcf5ef2aSThomas Huth } 2375fcf5ef2aSThomas Huth } 2376fcf5ef2aSThomas Huth 2377071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd) 2378071663dfSJose Ricardo Ziviani { 2379071663dfSJose Ricardo Ziviani int i; 2380071663dfSJose Ricardo Ziviani int invalid = 0; 2381071663dfSJose Ricardo Ziviani 2382071663dfSJose Ricardo Ziviani if (bcd_get_sgn(bcd) == 0) { 2383071663dfSJose Ricardo Ziviani return false; 2384071663dfSJose Ricardo Ziviani } 2385071663dfSJose Ricardo Ziviani 2386071663dfSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2387071663dfSJose Ricardo Ziviani bcd_get_digit(bcd, i, &invalid); 2388071663dfSJose Ricardo Ziviani if (unlikely(invalid)) { 2389071663dfSJose Ricardo Ziviani return false; 2390071663dfSJose Ricardo Ziviani } 2391071663dfSJose Ricardo Ziviani } 2392071663dfSJose Ricardo Ziviani return true; 2393071663dfSJose Ricardo Ziviani } 2394071663dfSJose Ricardo Ziviani 2395fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd) 2396fcf5ef2aSThomas Huth { 23973c385a93SMark Cave-Ayland if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) { 2398efa73196SNikunj A Dadhania return CRF_EQ; 2399fcf5ef2aSThomas Huth } else { 2400efa73196SNikunj A Dadhania return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT; 2401fcf5ef2aSThomas Huth } 2402fcf5ef2aSThomas Huth } 2403fcf5ef2aSThomas Huth 2404fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n) 2405fcf5ef2aSThomas Huth { 240660594feaSMark Cave-Ayland return reg->VsrH(7 - n); 2407fcf5ef2aSThomas Huth } 2408fcf5ef2aSThomas Huth 2409fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n) 2410fcf5ef2aSThomas Huth { 241160594feaSMark Cave-Ayland reg->VsrH(7 - n) = val; 2412fcf5ef2aSThomas Huth } 2413fcf5ef2aSThomas Huth 2414fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b) 2415fcf5ef2aSThomas Huth { 2416fcf5ef2aSThomas Huth int i; 2417fcf5ef2aSThomas Huth int invalid = 0; 2418fcf5ef2aSThomas Huth for (i = 31; i > 0; i--) { 2419fcf5ef2aSThomas Huth uint8_t dig_a = bcd_get_digit(a, i, &invalid); 2420fcf5ef2aSThomas Huth uint8_t dig_b = bcd_get_digit(b, i, &invalid); 2421fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2422fcf5ef2aSThomas Huth return 0; /* doesn't matter */ 2423fcf5ef2aSThomas Huth } else if (dig_a > dig_b) { 2424fcf5ef2aSThomas Huth return 1; 2425fcf5ef2aSThomas Huth } else if (dig_a < dig_b) { 2426fcf5ef2aSThomas Huth return -1; 2427fcf5ef2aSThomas Huth } 2428fcf5ef2aSThomas Huth } 2429fcf5ef2aSThomas Huth 2430fcf5ef2aSThomas Huth return 0; 2431fcf5ef2aSThomas Huth } 2432fcf5ef2aSThomas Huth 2433936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2434fcf5ef2aSThomas Huth int *overflow) 2435fcf5ef2aSThomas Huth { 2436fcf5ef2aSThomas Huth int carry = 0; 2437fcf5ef2aSThomas Huth int i; 2438936fda4dSFabiano Rosas int is_zero = 1; 2439936fda4dSFabiano Rosas 2440fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2441fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) + 2442fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2443936fda4dSFabiano Rosas is_zero &= (digit == 0); 2444fcf5ef2aSThomas Huth if (digit > 9) { 2445fcf5ef2aSThomas Huth carry = 1; 2446fcf5ef2aSThomas Huth digit -= 10; 2447fcf5ef2aSThomas Huth } else { 2448fcf5ef2aSThomas Huth carry = 0; 2449fcf5ef2aSThomas Huth } 2450fcf5ef2aSThomas Huth 2451fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2452fcf5ef2aSThomas Huth } 2453fcf5ef2aSThomas Huth 2454fcf5ef2aSThomas Huth *overflow = carry; 2455936fda4dSFabiano Rosas return is_zero; 2456fcf5ef2aSThomas Huth } 2457fcf5ef2aSThomas Huth 2458d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2459fcf5ef2aSThomas Huth int *overflow) 2460fcf5ef2aSThomas Huth { 2461fcf5ef2aSThomas Huth int carry = 0; 2462fcf5ef2aSThomas Huth int i; 2463d03b174aSYasmin Beatriz 2464fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2465fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) - 2466fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2467fcf5ef2aSThomas Huth if (digit & 0x80) { 2468fcf5ef2aSThomas Huth carry = -1; 2469fcf5ef2aSThomas Huth digit += 10; 2470fcf5ef2aSThomas Huth } else { 2471fcf5ef2aSThomas Huth carry = 0; 2472fcf5ef2aSThomas Huth } 2473fcf5ef2aSThomas Huth 2474fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2475fcf5ef2aSThomas Huth } 2476fcf5ef2aSThomas Huth 2477fcf5ef2aSThomas Huth *overflow = carry; 2478fcf5ef2aSThomas Huth } 2479fcf5ef2aSThomas Huth 2480fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2481fcf5ef2aSThomas Huth { 2482fcf5ef2aSThomas Huth 2483fcf5ef2aSThomas Huth int sgna = bcd_get_sgn(a); 2484fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2485fcf5ef2aSThomas Huth int invalid = (sgna == 0) || (sgnb == 0); 2486fcf5ef2aSThomas Huth int overflow = 0; 2487936fda4dSFabiano Rosas int zero = 0; 2488fcf5ef2aSThomas Huth uint32_t cr = 0; 2489fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 2490fcf5ef2aSThomas Huth 2491fcf5ef2aSThomas Huth if (!invalid) { 2492fcf5ef2aSThomas Huth if (sgna == sgnb) { 2493428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2494936fda4dSFabiano Rosas zero = bcd_add_mag(&result, a, b, &invalid, &overflow); 2495936fda4dSFabiano Rosas cr = (sgna > 0) ? CRF_GT : CRF_LT; 2496fcf5ef2aSThomas Huth } else { 2497d03b174aSYasmin Beatriz int magnitude = bcd_cmp_mag(a, b); 2498d03b174aSYasmin Beatriz if (magnitude > 0) { 2499428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2500d03b174aSYasmin Beatriz bcd_sub_mag(&result, a, b, &invalid, &overflow); 2501d03b174aSYasmin Beatriz cr = (sgna > 0) ? CRF_GT : CRF_LT; 2502d03b174aSYasmin Beatriz } else if (magnitude < 0) { 2503428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps); 2504d03b174aSYasmin Beatriz bcd_sub_mag(&result, b, a, &invalid, &overflow); 2505efa73196SNikunj A Dadhania cr = (sgnb > 0) ? CRF_GT : CRF_LT; 2506d03b174aSYasmin Beatriz } else { 2507428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps); 2508d03b174aSYasmin Beatriz cr = CRF_EQ; 2509d03b174aSYasmin Beatriz } 2510fcf5ef2aSThomas Huth } 2511fcf5ef2aSThomas Huth } 2512fcf5ef2aSThomas Huth 2513fcf5ef2aSThomas Huth if (unlikely(invalid)) { 25143c385a93SMark Cave-Ayland result.VsrD(0) = result.VsrD(1) = -1; 2515efa73196SNikunj A Dadhania cr = CRF_SO; 2516fcf5ef2aSThomas Huth } else if (overflow) { 2517efa73196SNikunj A Dadhania cr |= CRF_SO; 2518936fda4dSFabiano Rosas } else if (zero) { 2519936fda4dSFabiano Rosas cr |= CRF_EQ; 2520fcf5ef2aSThomas Huth } 2521fcf5ef2aSThomas Huth 2522fcf5ef2aSThomas Huth *r = result; 2523fcf5ef2aSThomas Huth 2524fcf5ef2aSThomas Huth return cr; 2525fcf5ef2aSThomas Huth } 2526fcf5ef2aSThomas Huth 2527fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2528fcf5ef2aSThomas Huth { 2529fcf5ef2aSThomas Huth ppc_avr_t bcopy = *b; 2530fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2531fcf5ef2aSThomas Huth if (sgnb < 0) { 2532fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0); 2533fcf5ef2aSThomas Huth } else if (sgnb > 0) { 2534fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_NEG_PREF, 0); 2535fcf5ef2aSThomas Huth } 2536fcf5ef2aSThomas Huth /* else invalid ... defer to bcdadd code for proper handling */ 2537fcf5ef2aSThomas Huth 2538fcf5ef2aSThomas Huth return helper_bcdadd(r, a, &bcopy, ps); 2539fcf5ef2aSThomas Huth } 2540fcf5ef2aSThomas Huth 2541fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2542fcf5ef2aSThomas Huth { 2543fcf5ef2aSThomas Huth int i; 2544fcf5ef2aSThomas Huth int cr = 0; 2545fcf5ef2aSThomas Huth uint16_t national = 0; 2546fcf5ef2aSThomas Huth uint16_t sgnb = get_national_digit(b, 0); 2547fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2548fcf5ef2aSThomas Huth int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG); 2549fcf5ef2aSThomas Huth 2550fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2551fcf5ef2aSThomas Huth national = get_national_digit(b, i); 2552fcf5ef2aSThomas Huth if (unlikely(national < 0x30 || national > 0x39)) { 2553fcf5ef2aSThomas Huth invalid = 1; 2554fcf5ef2aSThomas Huth break; 2555fcf5ef2aSThomas Huth } 2556fcf5ef2aSThomas Huth 2557fcf5ef2aSThomas Huth bcd_put_digit(&ret, national & 0xf, i); 2558fcf5ef2aSThomas Huth } 2559fcf5ef2aSThomas Huth 2560fcf5ef2aSThomas Huth if (sgnb == NATIONAL_PLUS) { 2561fcf5ef2aSThomas Huth bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0); 2562fcf5ef2aSThomas Huth } else { 2563fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2564fcf5ef2aSThomas Huth } 2565fcf5ef2aSThomas Huth 2566fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2567fcf5ef2aSThomas Huth 2568fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2569efa73196SNikunj A Dadhania cr = CRF_SO; 2570fcf5ef2aSThomas Huth } 2571fcf5ef2aSThomas Huth 2572fcf5ef2aSThomas Huth *r = ret; 2573fcf5ef2aSThomas Huth 2574fcf5ef2aSThomas Huth return cr; 2575fcf5ef2aSThomas Huth } 2576fcf5ef2aSThomas Huth 2577fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2578fcf5ef2aSThomas Huth { 2579fcf5ef2aSThomas Huth int i; 2580fcf5ef2aSThomas Huth int cr = 0; 2581fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2582fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2583fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2584fcf5ef2aSThomas Huth 25853c385a93SMark Cave-Ayland int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0); 2586fcf5ef2aSThomas Huth 2587fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2588fcf5ef2aSThomas Huth set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i); 2589fcf5ef2aSThomas Huth 2590fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2591fcf5ef2aSThomas Huth break; 2592fcf5ef2aSThomas Huth } 2593fcf5ef2aSThomas Huth } 2594fcf5ef2aSThomas Huth set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0); 2595fcf5ef2aSThomas Huth 2596fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2597fcf5ef2aSThomas Huth 2598fcf5ef2aSThomas Huth if (ox_flag) { 2599efa73196SNikunj A Dadhania cr |= CRF_SO; 2600fcf5ef2aSThomas Huth } 2601fcf5ef2aSThomas Huth 2602fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2603efa73196SNikunj A Dadhania cr = CRF_SO; 2604fcf5ef2aSThomas Huth } 2605fcf5ef2aSThomas Huth 2606fcf5ef2aSThomas Huth *r = ret; 2607fcf5ef2aSThomas Huth 2608fcf5ef2aSThomas Huth return cr; 2609fcf5ef2aSThomas Huth } 2610fcf5ef2aSThomas Huth 2611fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2612fcf5ef2aSThomas Huth { 2613fcf5ef2aSThomas Huth int i; 2614fcf5ef2aSThomas Huth int cr = 0; 2615fcf5ef2aSThomas Huth int invalid = 0; 2616fcf5ef2aSThomas Huth int zone_digit = 0; 2617fcf5ef2aSThomas Huth int zone_lead = ps ? 0xF : 0x3; 2618fcf5ef2aSThomas Huth int digit = 0; 2619fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2620428115c3SMark Cave-Ayland int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4; 2621fcf5ef2aSThomas Huth 2622fcf5ef2aSThomas Huth if (unlikely((sgnb < 0xA) && ps)) { 2623fcf5ef2aSThomas Huth invalid = 1; 2624fcf5ef2aSThomas Huth } 2625fcf5ef2aSThomas Huth 2626fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2627428115c3SMark Cave-Ayland zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead; 2628428115c3SMark Cave-Ayland digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF; 2629fcf5ef2aSThomas Huth if (unlikely(zone_digit != zone_lead || digit > 0x9)) { 2630fcf5ef2aSThomas Huth invalid = 1; 2631fcf5ef2aSThomas Huth break; 2632fcf5ef2aSThomas Huth } 2633fcf5ef2aSThomas Huth 2634fcf5ef2aSThomas Huth bcd_put_digit(&ret, digit, i + 1); 2635fcf5ef2aSThomas Huth } 2636fcf5ef2aSThomas Huth 2637fcf5ef2aSThomas Huth if ((ps && (sgnb == 0xB || sgnb == 0xD)) || 2638fcf5ef2aSThomas Huth (!ps && (sgnb & 0x4))) { 2639fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2640fcf5ef2aSThomas Huth } else { 2641fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0); 2642fcf5ef2aSThomas Huth } 2643fcf5ef2aSThomas Huth 2644fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2645fcf5ef2aSThomas Huth 2646fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2647efa73196SNikunj A Dadhania cr = CRF_SO; 2648fcf5ef2aSThomas Huth } 2649fcf5ef2aSThomas Huth 2650fcf5ef2aSThomas Huth *r = ret; 2651fcf5ef2aSThomas Huth 2652fcf5ef2aSThomas Huth return cr; 2653fcf5ef2aSThomas Huth } 2654fcf5ef2aSThomas Huth 2655fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2656fcf5ef2aSThomas Huth { 2657fcf5ef2aSThomas Huth int i; 2658fcf5ef2aSThomas Huth int cr = 0; 2659fcf5ef2aSThomas Huth uint8_t digit = 0; 2660fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2661fcf5ef2aSThomas Huth int zone_lead = (ps) ? 0xF0 : 0x30; 2662fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2663fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2664fcf5ef2aSThomas Huth 26653c385a93SMark Cave-Ayland int ox_flag = ((b->VsrD(0) >> 4) != 0); 2666fcf5ef2aSThomas Huth 2667fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2668fcf5ef2aSThomas Huth digit = bcd_get_digit(b, i + 1, &invalid); 2669fcf5ef2aSThomas Huth 2670fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2671fcf5ef2aSThomas Huth break; 2672fcf5ef2aSThomas Huth } 2673fcf5ef2aSThomas Huth 2674428115c3SMark Cave-Ayland ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit; 2675fcf5ef2aSThomas Huth } 2676fcf5ef2aSThomas Huth 2677fcf5ef2aSThomas Huth if (ps) { 2678fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1); 2679fcf5ef2aSThomas Huth } else { 2680fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1); 2681fcf5ef2aSThomas Huth } 2682fcf5ef2aSThomas Huth 2683fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2684fcf5ef2aSThomas Huth 2685fcf5ef2aSThomas Huth if (ox_flag) { 2686efa73196SNikunj A Dadhania cr |= CRF_SO; 2687fcf5ef2aSThomas Huth } 2688fcf5ef2aSThomas Huth 2689fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2690efa73196SNikunj A Dadhania cr = CRF_SO; 2691fcf5ef2aSThomas Huth } 2692fcf5ef2aSThomas Huth 2693fcf5ef2aSThomas Huth *r = ret; 2694fcf5ef2aSThomas Huth 2695fcf5ef2aSThomas Huth return cr; 2696fcf5ef2aSThomas Huth } 2697fcf5ef2aSThomas Huth 2698a3d67f3eSLuis Pires /** 2699a3d67f3eSLuis Pires * Compare 2 128-bit unsigned integers, passed in as unsigned 64-bit pairs 2700a3d67f3eSLuis Pires * 2701a3d67f3eSLuis Pires * Returns: 2702a3d67f3eSLuis Pires * > 0 if ahi|alo > bhi|blo, 2703a3d67f3eSLuis Pires * 0 if ahi|alo == bhi|blo, 2704a3d67f3eSLuis Pires * < 0 if ahi|alo < bhi|blo 2705a3d67f3eSLuis Pires */ 2706a3d67f3eSLuis Pires static inline int ucmp128(uint64_t alo, uint64_t ahi, 2707a3d67f3eSLuis Pires uint64_t blo, uint64_t bhi) 2708a3d67f3eSLuis Pires { 2709a3d67f3eSLuis Pires return (ahi == bhi) ? 2710a3d67f3eSLuis Pires (alo > blo ? 1 : (alo == blo ? 0 : -1)) : 2711a3d67f3eSLuis Pires (ahi > bhi ? 1 : -1); 2712a3d67f3eSLuis Pires } 2713a3d67f3eSLuis Pires 2714a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2715a406c058SJose Ricardo Ziviani { 2716a406c058SJose Ricardo Ziviani int i; 2717a3d67f3eSLuis Pires int cr; 2718a406c058SJose Ricardo Ziviani uint64_t lo_value; 2719a406c058SJose Ricardo Ziviani uint64_t hi_value; 272040f3e79aSLuis Pires uint64_t rem; 2721a406c058SJose Ricardo Ziviani ppc_avr_t ret = { .u64 = { 0, 0 } }; 2722a406c058SJose Ricardo Ziviani 27233c385a93SMark Cave-Ayland if (b->VsrSD(0) < 0) { 27243c385a93SMark Cave-Ayland lo_value = -b->VsrSD(1); 27253c385a93SMark Cave-Ayland hi_value = ~b->VsrD(0) + !lo_value; 2726a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, 0xD, 0); 2727a3d67f3eSLuis Pires 2728a3d67f3eSLuis Pires cr = CRF_LT; 2729a406c058SJose Ricardo Ziviani } else { 27303c385a93SMark Cave-Ayland lo_value = b->VsrD(1); 27313c385a93SMark Cave-Ayland hi_value = b->VsrD(0); 2732a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0); 2733a3d67f3eSLuis Pires 2734a3d67f3eSLuis Pires if (hi_value == 0 && lo_value == 0) { 2735a3d67f3eSLuis Pires cr = CRF_EQ; 2736a3d67f3eSLuis Pires } else { 2737a3d67f3eSLuis Pires cr = CRF_GT; 2738a3d67f3eSLuis Pires } 2739a406c058SJose Ricardo Ziviani } 2740a406c058SJose Ricardo Ziviani 2741a3d67f3eSLuis Pires /* 2742a3d67f3eSLuis Pires * Check src limits: abs(src) <= 10^31 - 1 2743a3d67f3eSLuis Pires * 2744a3d67f3eSLuis Pires * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff 2745a3d67f3eSLuis Pires */ 2746a3d67f3eSLuis Pires if (ucmp128(lo_value, hi_value, 2747a3d67f3eSLuis Pires 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) { 2748a3d67f3eSLuis Pires cr |= CRF_SO; 2749a3d67f3eSLuis Pires 2750a3d67f3eSLuis Pires /* 2751a3d67f3eSLuis Pires * According to the ISA, if src wouldn't fit in the destination 2752a3d67f3eSLuis Pires * register, the result is undefined. 2753a3d67f3eSLuis Pires * In that case, we leave r unchanged. 2754a3d67f3eSLuis Pires */ 2755a3d67f3eSLuis Pires } else { 275640f3e79aSLuis Pires rem = divu128(&lo_value, &hi_value, 1000000000000000ULL); 2757a406c058SJose Ricardo Ziviani 275840f3e79aSLuis Pires for (i = 1; i < 16; rem /= 10, i++) { 275940f3e79aSLuis Pires bcd_put_digit(&ret, rem % 10, i); 2760a406c058SJose Ricardo Ziviani } 2761a406c058SJose Ricardo Ziviani 2762a406c058SJose Ricardo Ziviani for (; i < 32; lo_value /= 10, i++) { 2763a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, lo_value % 10, i); 2764a406c058SJose Ricardo Ziviani } 2765a406c058SJose Ricardo Ziviani 2766a406c058SJose Ricardo Ziviani *r = ret; 2767a3d67f3eSLuis Pires } 2768a406c058SJose Ricardo Ziviani 2769a406c058SJose Ricardo Ziviani return cr; 2770a406c058SJose Ricardo Ziviani } 2771a406c058SJose Ricardo Ziviani 2772c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2773c85bc7ddSJose Ricardo Ziviani { 2774c85bc7ddSJose Ricardo Ziviani uint8_t i; 2775c85bc7ddSJose Ricardo Ziviani int cr; 2776c85bc7ddSJose Ricardo Ziviani uint64_t carry; 2777c85bc7ddSJose Ricardo Ziviani uint64_t unused; 2778c85bc7ddSJose Ricardo Ziviani uint64_t lo_value; 2779c85bc7ddSJose Ricardo Ziviani uint64_t hi_value = 0; 2780c85bc7ddSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2781c85bc7ddSJose Ricardo Ziviani int invalid = (sgnb == 0); 2782c85bc7ddSJose Ricardo Ziviani 2783c85bc7ddSJose Ricardo Ziviani lo_value = bcd_get_digit(b, 31, &invalid); 2784c85bc7ddSJose Ricardo Ziviani for (i = 30; i > 0; i--) { 2785c85bc7ddSJose Ricardo Ziviani mulu64(&lo_value, &carry, lo_value, 10ULL); 2786c85bc7ddSJose Ricardo Ziviani mulu64(&hi_value, &unused, hi_value, 10ULL); 2787c85bc7ddSJose Ricardo Ziviani lo_value += bcd_get_digit(b, i, &invalid); 2788c85bc7ddSJose Ricardo Ziviani hi_value += carry; 2789c85bc7ddSJose Ricardo Ziviani 2790c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2791c85bc7ddSJose Ricardo Ziviani break; 2792c85bc7ddSJose Ricardo Ziviani } 2793c85bc7ddSJose Ricardo Ziviani } 2794c85bc7ddSJose Ricardo Ziviani 2795c85bc7ddSJose Ricardo Ziviani if (sgnb == -1) { 27963c385a93SMark Cave-Ayland r->VsrSD(1) = -lo_value; 27973c385a93SMark Cave-Ayland r->VsrSD(0) = ~hi_value + !r->VsrSD(1); 2798c85bc7ddSJose Ricardo Ziviani } else { 27993c385a93SMark Cave-Ayland r->VsrSD(1) = lo_value; 28003c385a93SMark Cave-Ayland r->VsrSD(0) = hi_value; 2801c85bc7ddSJose Ricardo Ziviani } 2802c85bc7ddSJose Ricardo Ziviani 2803c85bc7ddSJose Ricardo Ziviani cr = bcd_cmp_zero(b); 2804c85bc7ddSJose Ricardo Ziviani 2805c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2806c85bc7ddSJose Ricardo Ziviani cr = CRF_SO; 2807c85bc7ddSJose Ricardo Ziviani } 2808c85bc7ddSJose Ricardo Ziviani 2809c85bc7ddSJose Ricardo Ziviani return cr; 2810c85bc7ddSJose Ricardo Ziviani } 2811c85bc7ddSJose Ricardo Ziviani 2812c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2813c3025c3bSJose Ricardo Ziviani { 2814c3025c3bSJose Ricardo Ziviani int i; 2815c3025c3bSJose Ricardo Ziviani int invalid = 0; 2816c3025c3bSJose Ricardo Ziviani 2817c3025c3bSJose Ricardo Ziviani if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) { 2818c3025c3bSJose Ricardo Ziviani return CRF_SO; 2819c3025c3bSJose Ricardo Ziviani } 2820c3025c3bSJose Ricardo Ziviani 2821c3025c3bSJose Ricardo Ziviani *r = *a; 2822428115c3SMark Cave-Ayland bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0); 2823c3025c3bSJose Ricardo Ziviani 2824c3025c3bSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2825c3025c3bSJose Ricardo Ziviani bcd_get_digit(a, i, &invalid); 2826c3025c3bSJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2827c3025c3bSJose Ricardo Ziviani if (unlikely(invalid)) { 2828c3025c3bSJose Ricardo Ziviani return CRF_SO; 2829c3025c3bSJose Ricardo Ziviani } 2830c3025c3bSJose Ricardo Ziviani } 2831c3025c3bSJose Ricardo Ziviani 2832c3025c3bSJose Ricardo Ziviani return bcd_cmp_zero(r); 2833c3025c3bSJose Ricardo Ziviani } 2834c3025c3bSJose Ricardo Ziviani 2835466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2836466a3f9cSJose Ricardo Ziviani { 2837466a3f9cSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2838466a3f9cSJose Ricardo Ziviani 2839466a3f9cSJose Ricardo Ziviani *r = *b; 2840466a3f9cSJose Ricardo Ziviani bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0); 2841466a3f9cSJose Ricardo Ziviani 2842071663dfSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2843466a3f9cSJose Ricardo Ziviani return CRF_SO; 2844466a3f9cSJose Ricardo Ziviani } 2845466a3f9cSJose Ricardo Ziviani 2846466a3f9cSJose Ricardo Ziviani return bcd_cmp_zero(r); 2847466a3f9cSJose Ricardo Ziviani } 2848466a3f9cSJose Ricardo Ziviani 2849e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2850e04797f7SJose Ricardo Ziviani { 2851e04797f7SJose Ricardo Ziviani int cr; 2852428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2853e04797f7SJose Ricardo Ziviani bool ox_flag = false; 2854e04797f7SJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2855e04797f7SJose Ricardo Ziviani ppc_avr_t ret = *b; 28563c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2857e04797f7SJose Ricardo Ziviani 2858e04797f7SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2859e04797f7SJose Ricardo Ziviani return CRF_SO; 2860e04797f7SJose Ricardo Ziviani } 2861e04797f7SJose Ricardo Ziviani 2862e04797f7SJose Ricardo Ziviani if (unlikely(i > 31)) { 2863e04797f7SJose Ricardo Ziviani i = 31; 2864e04797f7SJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2865e04797f7SJose Ricardo Ziviani i = -31; 2866e04797f7SJose Ricardo Ziviani } 2867e04797f7SJose Ricardo Ziviani 2868e04797f7SJose Ricardo Ziviani if (i > 0) { 28693c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2870e04797f7SJose Ricardo Ziviani } else { 28713c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2872e04797f7SJose Ricardo Ziviani } 2873e04797f7SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2874e04797f7SJose Ricardo Ziviani 2875e04797f7SJose Ricardo Ziviani *r = ret; 2876e04797f7SJose Ricardo Ziviani 2877e04797f7SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2878e04797f7SJose Ricardo Ziviani if (ox_flag) { 2879e04797f7SJose Ricardo Ziviani cr |= CRF_SO; 2880e04797f7SJose Ricardo Ziviani } 2881e04797f7SJose Ricardo Ziviani 2882e04797f7SJose Ricardo Ziviani return cr; 2883e04797f7SJose Ricardo Ziviani } 2884e04797f7SJose Ricardo Ziviani 2885a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2886a49a95e9SJose Ricardo Ziviani { 2887a49a95e9SJose Ricardo Ziviani int cr; 2888a49a95e9SJose Ricardo Ziviani int i; 2889a49a95e9SJose Ricardo Ziviani int invalid = 0; 2890a49a95e9SJose Ricardo Ziviani bool ox_flag = false; 2891a49a95e9SJose Ricardo Ziviani ppc_avr_t ret = *b; 2892a49a95e9SJose Ricardo Ziviani 2893a49a95e9SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 2894a49a95e9SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2895a49a95e9SJose Ricardo Ziviani 2896a49a95e9SJose Ricardo Ziviani if (unlikely(invalid)) { 2897a49a95e9SJose Ricardo Ziviani return CRF_SO; 2898a49a95e9SJose Ricardo Ziviani } 2899a49a95e9SJose Ricardo Ziviani } 2900a49a95e9SJose Ricardo Ziviani 2901428115c3SMark Cave-Ayland i = a->VsrSB(7); 2902a49a95e9SJose Ricardo Ziviani if (i >= 32) { 2903a49a95e9SJose Ricardo Ziviani ox_flag = true; 29043c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2905a49a95e9SJose Ricardo Ziviani } else if (i <= -32) { 29063c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2907a49a95e9SJose Ricardo Ziviani } else if (i > 0) { 29083c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2909a49a95e9SJose Ricardo Ziviani } else { 29103c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2911a49a95e9SJose Ricardo Ziviani } 2912a49a95e9SJose Ricardo Ziviani *r = ret; 2913a49a95e9SJose Ricardo Ziviani 2914a49a95e9SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2915a49a95e9SJose Ricardo Ziviani if (ox_flag) { 2916a49a95e9SJose Ricardo Ziviani cr |= CRF_SO; 2917a49a95e9SJose Ricardo Ziviani } 2918a49a95e9SJose Ricardo Ziviani 2919a49a95e9SJose Ricardo Ziviani return cr; 2920a49a95e9SJose Ricardo Ziviani } 2921a49a95e9SJose Ricardo Ziviani 2922a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2923a54238adSJose Ricardo Ziviani { 2924a54238adSJose Ricardo Ziviani int cr; 2925a54238adSJose Ricardo Ziviani int unused = 0; 2926a54238adSJose Ricardo Ziviani int invalid = 0; 2927a54238adSJose Ricardo Ziviani bool ox_flag = false; 2928a54238adSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2929a54238adSJose Ricardo Ziviani ppc_avr_t ret = *b; 29303c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2931a54238adSJose Ricardo Ziviani 2932428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2933428115c3SMark Cave-Ayland ppc_avr_t bcd_one; 2934428115c3SMark Cave-Ayland 2935428115c3SMark Cave-Ayland bcd_one.VsrD(0) = 0; 2936428115c3SMark Cave-Ayland bcd_one.VsrD(1) = 0x10; 2937a54238adSJose Ricardo Ziviani 2938a54238adSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2939a54238adSJose Ricardo Ziviani return CRF_SO; 2940a54238adSJose Ricardo Ziviani } 2941a54238adSJose Ricardo Ziviani 2942a54238adSJose Ricardo Ziviani if (unlikely(i > 31)) { 2943a54238adSJose Ricardo Ziviani i = 31; 2944a54238adSJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2945a54238adSJose Ricardo Ziviani i = -31; 2946a54238adSJose Ricardo Ziviani } 2947a54238adSJose Ricardo Ziviani 2948a54238adSJose Ricardo Ziviani if (i > 0) { 29493c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2950a54238adSJose Ricardo Ziviani } else { 29513c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2952a54238adSJose Ricardo Ziviani 2953a54238adSJose Ricardo Ziviani if (bcd_get_digit(&ret, 0, &invalid) >= 5) { 2954a54238adSJose Ricardo Ziviani bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused); 2955a54238adSJose Ricardo Ziviani } 2956a54238adSJose Ricardo Ziviani } 2957a54238adSJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2958a54238adSJose Ricardo Ziviani 2959a54238adSJose Ricardo Ziviani cr = bcd_cmp_zero(&ret); 2960a54238adSJose Ricardo Ziviani if (ox_flag) { 2961a54238adSJose Ricardo Ziviani cr |= CRF_SO; 2962a54238adSJose Ricardo Ziviani } 2963a54238adSJose Ricardo Ziviani *r = ret; 2964a54238adSJose Ricardo Ziviani 2965a54238adSJose Ricardo Ziviani return cr; 2966a54238adSJose Ricardo Ziviani } 2967a54238adSJose Ricardo Ziviani 296831bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 296931bc4d11SJose Ricardo Ziviani { 297031bc4d11SJose Ricardo Ziviani uint64_t mask; 297131bc4d11SJose Ricardo Ziviani uint32_t ox_flag = 0; 2972428115c3SMark Cave-Ayland int i = a->VsrSH(3) + 1; 297331bc4d11SJose Ricardo Ziviani ppc_avr_t ret = *b; 297431bc4d11SJose Ricardo Ziviani 297531bc4d11SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 297631bc4d11SJose Ricardo Ziviani return CRF_SO; 297731bc4d11SJose Ricardo Ziviani } 297831bc4d11SJose Ricardo Ziviani 297931bc4d11SJose Ricardo Ziviani if (i > 16 && i < 32) { 298031bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 29813c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 298231bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 298331bc4d11SJose Ricardo Ziviani } 298431bc4d11SJose Ricardo Ziviani 29853c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 298631bc4d11SJose Ricardo Ziviani } else if (i >= 0 && i <= 16) { 298731bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 29883c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 298931bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 299031bc4d11SJose Ricardo Ziviani } 299131bc4d11SJose Ricardo Ziviani 29923c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 29933c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 299431bc4d11SJose Ricardo Ziviani } 299531bc4d11SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0); 299631bc4d11SJose Ricardo Ziviani *r = ret; 299731bc4d11SJose Ricardo Ziviani 299831bc4d11SJose Ricardo Ziviani return bcd_cmp_zero(&ret) | ox_flag; 299931bc4d11SJose Ricardo Ziviani } 300031bc4d11SJose Ricardo Ziviani 30015c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 30025c32e2e4SJose Ricardo Ziviani { 30035c32e2e4SJose Ricardo Ziviani int i; 30045c32e2e4SJose Ricardo Ziviani uint64_t mask; 30055c32e2e4SJose Ricardo Ziviani uint32_t ox_flag = 0; 30065c32e2e4SJose Ricardo Ziviani int invalid = 0; 30075c32e2e4SJose Ricardo Ziviani ppc_avr_t ret = *b; 30085c32e2e4SJose Ricardo Ziviani 30095c32e2e4SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 30105c32e2e4SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 30115c32e2e4SJose Ricardo Ziviani 30125c32e2e4SJose Ricardo Ziviani if (unlikely(invalid)) { 30135c32e2e4SJose Ricardo Ziviani return CRF_SO; 30145c32e2e4SJose Ricardo Ziviani } 30155c32e2e4SJose Ricardo Ziviani } 30165c32e2e4SJose Ricardo Ziviani 3017428115c3SMark Cave-Ayland i = a->VsrSH(3); 30185c32e2e4SJose Ricardo Ziviani if (i > 16 && i < 33) { 30195c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 30203c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 30215c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 30225c32e2e4SJose Ricardo Ziviani } 30235c32e2e4SJose Ricardo Ziviani 30243c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 30255c32e2e4SJose Ricardo Ziviani } else if (i > 0 && i <= 16) { 30265c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 30273c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 30285c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 30295c32e2e4SJose Ricardo Ziviani } 30305c32e2e4SJose Ricardo Ziviani 30313c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 30323c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 30335c32e2e4SJose Ricardo Ziviani } else if (i == 0) { 30343c385a93SMark Cave-Ayland if (ret.VsrD(0) || ret.VsrD(1)) { 30355c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 30365c32e2e4SJose Ricardo Ziviani } 30373c385a93SMark Cave-Ayland ret.VsrD(0) = ret.VsrD(1) = 0; 30385c32e2e4SJose Ricardo Ziviani } 30395c32e2e4SJose Ricardo Ziviani 30405c32e2e4SJose Ricardo Ziviani *r = ret; 30413c385a93SMark Cave-Ayland if (r->VsrD(0) == 0 && r->VsrD(1) == 0) { 30425c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_EQ; 30435c32e2e4SJose Ricardo Ziviani } 30445c32e2e4SJose Ricardo Ziviani 30455c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_GT; 30465c32e2e4SJose Ricardo Ziviani } 30475c32e2e4SJose Ricardo Ziviani 3048fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a) 3049fcf5ef2aSThomas Huth { 3050fcf5ef2aSThomas Huth int i; 3051fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 3052fcf5ef2aSThomas Huth r->u8[i] = AES_sbox[a->u8[i]]; 3053fcf5ef2aSThomas Huth } 3054fcf5ef2aSThomas Huth } 3055fcf5ef2aSThomas Huth 3056fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 3057fcf5ef2aSThomas Huth { 3058fcf5ef2aSThomas Huth ppc_avr_t result; 3059fcf5ef2aSThomas Huth int i; 3060fcf5ef2aSThomas Huth 3061fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 30622dea57dbSMark Cave-Ayland result.VsrW(i) = b->VsrW(i) ^ 30632dea57dbSMark Cave-Ayland (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^ 30642dea57dbSMark Cave-Ayland AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^ 30652dea57dbSMark Cave-Ayland AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^ 30662dea57dbSMark Cave-Ayland AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]); 3067fcf5ef2aSThomas Huth } 3068fcf5ef2aSThomas Huth *r = result; 3069fcf5ef2aSThomas Huth } 3070fcf5ef2aSThomas Huth 3071fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 3072fcf5ef2aSThomas Huth { 3073fcf5ef2aSThomas Huth ppc_avr_t result; 3074fcf5ef2aSThomas Huth int i; 3075fcf5ef2aSThomas Huth 3076fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 30772dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]); 3078fcf5ef2aSThomas Huth } 3079fcf5ef2aSThomas Huth *r = result; 3080fcf5ef2aSThomas Huth } 3081fcf5ef2aSThomas Huth 3082fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 3083fcf5ef2aSThomas Huth { 3084fcf5ef2aSThomas Huth /* This differs from what is written in ISA V2.07. The RTL is */ 3085fcf5ef2aSThomas Huth /* incorrect and will be fixed in V2.07B. */ 3086fcf5ef2aSThomas Huth int i; 3087fcf5ef2aSThomas Huth ppc_avr_t tmp; 3088fcf5ef2aSThomas Huth 3089fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 30902dea57dbSMark Cave-Ayland tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])]; 3091fcf5ef2aSThomas Huth } 3092fcf5ef2aSThomas Huth 3093fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 30942dea57dbSMark Cave-Ayland r->VsrW(i) = 30952dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 0)][0] ^ 30962dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 1)][1] ^ 30972dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 2)][2] ^ 30982dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 3)][3]; 3099fcf5ef2aSThomas Huth } 3100fcf5ef2aSThomas Huth } 3101fcf5ef2aSThomas Huth 3102fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 3103fcf5ef2aSThomas Huth { 3104fcf5ef2aSThomas Huth ppc_avr_t result; 3105fcf5ef2aSThomas Huth int i; 3106fcf5ef2aSThomas Huth 3107fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 31082dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]); 3109fcf5ef2aSThomas Huth } 3110fcf5ef2aSThomas Huth *r = result; 3111fcf5ef2aSThomas Huth } 3112fcf5ef2aSThomas Huth 3113fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 3114fcf5ef2aSThomas Huth { 3115fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 3116fcf5ef2aSThomas Huth int six = st_six & 0xF; 3117fcf5ef2aSThomas Huth int i; 3118fcf5ef2aSThomas Huth 3119730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 3120fcf5ef2aSThomas Huth if (st == 0) { 3121fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 31220ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 7) ^ 31230ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 18) ^ 3124730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 3); 3125fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 31260ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 17) ^ 31270ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 19) ^ 3128730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 10); 3129fcf5ef2aSThomas Huth } 3130fcf5ef2aSThomas Huth } else { /* st == 1 */ 3131fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 31320ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 2) ^ 31330ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 13) ^ 31340ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 22); 3135fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 31360ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 6) ^ 31370ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 11) ^ 31380ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 25); 3139fcf5ef2aSThomas Huth } 3140fcf5ef2aSThomas Huth } 3141fcf5ef2aSThomas Huth } 3142fcf5ef2aSThomas Huth } 3143fcf5ef2aSThomas Huth 3144fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 3145fcf5ef2aSThomas Huth { 3146fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 3147fcf5ef2aSThomas Huth int six = st_six & 0xF; 3148fcf5ef2aSThomas Huth int i; 3149fcf5ef2aSThomas Huth 3150730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 3151fcf5ef2aSThomas Huth if (st == 0) { 3152fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 31530ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 1) ^ 31540ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 8) ^ 3155730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 7); 3156fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 31570ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 19) ^ 31580ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 61) ^ 3159730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 6); 3160fcf5ef2aSThomas Huth } 3161fcf5ef2aSThomas Huth } else { /* st == 1 */ 3162fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 31630ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 28) ^ 31640ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 34) ^ 31650ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 39); 3166fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 31670ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 14) ^ 31680ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 18) ^ 31690ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 41); 3170fcf5ef2aSThomas Huth } 3171fcf5ef2aSThomas Huth } 3172fcf5ef2aSThomas Huth } 3173fcf5ef2aSThomas Huth } 3174fcf5ef2aSThomas Huth 3175fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 3176fcf5ef2aSThomas Huth { 3177fcf5ef2aSThomas Huth ppc_avr_t result; 3178fcf5ef2aSThomas Huth int i; 3179fcf5ef2aSThomas Huth 318060594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 318160594feaSMark Cave-Ayland int indexA = c->VsrB(i) >> 4; 318260594feaSMark Cave-Ayland int indexB = c->VsrB(i) & 0xF; 318360594feaSMark Cave-Ayland 318460594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB); 3185fcf5ef2aSThomas Huth } 3186fcf5ef2aSThomas Huth *r = result; 3187fcf5ef2aSThomas Huth } 3188fcf5ef2aSThomas Huth 3189fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I 3190fcf5ef2aSThomas Huth 3191fcf5ef2aSThomas Huth /*****************************************************************************/ 3192fcf5ef2aSThomas Huth /* SPE extension helpers */ 3193fcf5ef2aSThomas Huth /* Use a table to make this quicker */ 3194fcf5ef2aSThomas Huth static const uint8_t hbrev[16] = { 3195fcf5ef2aSThomas Huth 0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE, 3196fcf5ef2aSThomas Huth 0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF, 3197fcf5ef2aSThomas Huth }; 3198fcf5ef2aSThomas Huth 3199fcf5ef2aSThomas Huth static inline uint8_t byte_reverse(uint8_t val) 3200fcf5ef2aSThomas Huth { 3201fcf5ef2aSThomas Huth return hbrev[val >> 4] | (hbrev[val & 0xF] << 4); 3202fcf5ef2aSThomas Huth } 3203fcf5ef2aSThomas Huth 3204fcf5ef2aSThomas Huth static inline uint32_t word_reverse(uint32_t val) 3205fcf5ef2aSThomas Huth { 3206fcf5ef2aSThomas Huth return byte_reverse(val >> 24) | (byte_reverse(val >> 16) << 8) | 3207fcf5ef2aSThomas Huth (byte_reverse(val >> 8) << 16) | (byte_reverse(val) << 24); 3208fcf5ef2aSThomas Huth } 3209fcf5ef2aSThomas Huth 3210fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */ 3211fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2) 3212fcf5ef2aSThomas Huth { 3213fcf5ef2aSThomas Huth uint32_t a, b, d, mask; 3214fcf5ef2aSThomas Huth 3215fcf5ef2aSThomas Huth mask = UINT32_MAX >> (32 - MASKBITS); 3216fcf5ef2aSThomas Huth a = arg1 & mask; 3217fcf5ef2aSThomas Huth b = arg2 & mask; 3218fcf5ef2aSThomas Huth d = word_reverse(1 + word_reverse(a | ~b)); 3219fcf5ef2aSThomas Huth return (arg1 & ~mask) | (d & b); 3220fcf5ef2aSThomas Huth } 3221fcf5ef2aSThomas Huth 3222fcf5ef2aSThomas Huth uint32_t helper_cntlsw32(uint32_t val) 3223fcf5ef2aSThomas Huth { 3224fcf5ef2aSThomas Huth if (val & 0x80000000) { 3225fcf5ef2aSThomas Huth return clz32(~val); 3226fcf5ef2aSThomas Huth } else { 3227fcf5ef2aSThomas Huth return clz32(val); 3228fcf5ef2aSThomas Huth } 3229fcf5ef2aSThomas Huth } 3230fcf5ef2aSThomas Huth 3231fcf5ef2aSThomas Huth uint32_t helper_cntlzw32(uint32_t val) 3232fcf5ef2aSThomas Huth { 3233fcf5ef2aSThomas Huth return clz32(val); 3234fcf5ef2aSThomas Huth } 3235fcf5ef2aSThomas Huth 3236fcf5ef2aSThomas Huth /* 440 specific */ 3237fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high, 3238fcf5ef2aSThomas Huth target_ulong low, uint32_t update_Rc) 3239fcf5ef2aSThomas Huth { 3240fcf5ef2aSThomas Huth target_ulong mask; 3241fcf5ef2aSThomas Huth int i; 3242fcf5ef2aSThomas Huth 3243fcf5ef2aSThomas Huth i = 1; 3244fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3245fcf5ef2aSThomas Huth if ((high & mask) == 0) { 3246fcf5ef2aSThomas Huth if (update_Rc) { 3247fcf5ef2aSThomas Huth env->crf[0] = 0x4; 3248fcf5ef2aSThomas Huth } 3249fcf5ef2aSThomas Huth goto done; 3250fcf5ef2aSThomas Huth } 3251fcf5ef2aSThomas Huth i++; 3252fcf5ef2aSThomas Huth } 3253fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3254fcf5ef2aSThomas Huth if ((low & mask) == 0) { 3255fcf5ef2aSThomas Huth if (update_Rc) { 3256fcf5ef2aSThomas Huth env->crf[0] = 0x8; 3257fcf5ef2aSThomas Huth } 3258fcf5ef2aSThomas Huth goto done; 3259fcf5ef2aSThomas Huth } 3260fcf5ef2aSThomas Huth i++; 3261fcf5ef2aSThomas Huth } 3262fcf5ef2aSThomas Huth i = 8; 3263fcf5ef2aSThomas Huth if (update_Rc) { 3264fcf5ef2aSThomas Huth env->crf[0] = 0x2; 3265fcf5ef2aSThomas Huth } 3266fcf5ef2aSThomas Huth done: 3267fcf5ef2aSThomas Huth env->xer = (env->xer & ~0x7F) | i; 3268fcf5ef2aSThomas Huth if (update_Rc) { 3269fcf5ef2aSThomas Huth env->crf[0] |= xer_so; 3270fcf5ef2aSThomas Huth } 3271fcf5ef2aSThomas Huth return i; 3272fcf5ef2aSThomas Huth } 3273