1fcf5ef2aSThomas Huth /* 2fcf5ef2aSThomas Huth * PowerPC integer and vector emulation helpers for QEMU. 3fcf5ef2aSThomas Huth * 4fcf5ef2aSThomas Huth * Copyright (c) 2003-2007 Jocelyn Mayer 5fcf5ef2aSThomas Huth * 6fcf5ef2aSThomas Huth * This library is free software; you can redistribute it and/or 7fcf5ef2aSThomas Huth * modify it under the terms of the GNU Lesser General Public 8fcf5ef2aSThomas Huth * License as published by the Free Software Foundation; either 96bd039cdSChetan Pant * version 2.1 of the License, or (at your option) any later version. 10fcf5ef2aSThomas Huth * 11fcf5ef2aSThomas Huth * This library is distributed in the hope that it will be useful, 12fcf5ef2aSThomas Huth * but WITHOUT ANY WARRANTY; without even the implied warranty of 13fcf5ef2aSThomas Huth * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14fcf5ef2aSThomas Huth * Lesser General Public License for more details. 15fcf5ef2aSThomas Huth * 16fcf5ef2aSThomas Huth * You should have received a copy of the GNU Lesser General Public 17fcf5ef2aSThomas Huth * License along with this library; if not, see <http://www.gnu.org/licenses/>. 18fcf5ef2aSThomas Huth */ 19db725815SMarkus Armbruster 20fcf5ef2aSThomas Huth #include "qemu/osdep.h" 21fcf5ef2aSThomas Huth #include "cpu.h" 22fcf5ef2aSThomas Huth #include "internal.h" 23fcf5ef2aSThomas Huth #include "qemu/host-utils.h" 24db725815SMarkus Armbruster #include "qemu/main-loop.h" 258a05fd9aSRichard Henderson #include "qemu/log.h" 26fcf5ef2aSThomas Huth #include "exec/helper-proto.h" 27fcf5ef2aSThomas Huth #include "crypto/aes.h" 2824f91e81SAlex Bennée #include "fpu/softfloat.h" 293f74b632SRichard Henderson #include "qapi/error.h" 303f74b632SRichard Henderson #include "qemu/guest-random.h" 31fcf5ef2aSThomas Huth 32fcf5ef2aSThomas Huth #include "helper_regs.h" 33fcf5ef2aSThomas Huth /*****************************************************************************/ 34fcf5ef2aSThomas Huth /* Fixed point operations helpers */ 35fcf5ef2aSThomas Huth 36f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov) 37f32899deSNikunj A Dadhania { 38f32899deSNikunj A Dadhania if (unlikely(ov)) { 39f32899deSNikunj A Dadhania env->so = env->ov = 1; 40f32899deSNikunj A Dadhania } else { 41f32899deSNikunj A Dadhania env->ov = 0; 42f32899deSNikunj A Dadhania } 43f32899deSNikunj A Dadhania } 44f32899deSNikunj A Dadhania 45fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb, 46fcf5ef2aSThomas Huth uint32_t oe) 47fcf5ef2aSThomas Huth { 48fcf5ef2aSThomas Huth uint64_t rt = 0; 49fcf5ef2aSThomas Huth int overflow = 0; 50fcf5ef2aSThomas Huth 51fcf5ef2aSThomas Huth uint64_t dividend = (uint64_t)ra << 32; 52fcf5ef2aSThomas Huth uint64_t divisor = (uint32_t)rb; 53fcf5ef2aSThomas Huth 54fcf5ef2aSThomas Huth if (unlikely(divisor == 0)) { 55fcf5ef2aSThomas Huth overflow = 1; 56fcf5ef2aSThomas Huth } else { 57fcf5ef2aSThomas Huth rt = dividend / divisor; 58fcf5ef2aSThomas Huth overflow = rt > UINT32_MAX; 59fcf5ef2aSThomas Huth } 60fcf5ef2aSThomas Huth 61fcf5ef2aSThomas Huth if (unlikely(overflow)) { 62fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 63fcf5ef2aSThomas Huth } 64fcf5ef2aSThomas Huth 65fcf5ef2aSThomas Huth if (oe) { 66f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 67fcf5ef2aSThomas Huth } 68fcf5ef2aSThomas Huth 69fcf5ef2aSThomas Huth return (target_ulong)rt; 70fcf5ef2aSThomas Huth } 71fcf5ef2aSThomas Huth 72fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb, 73fcf5ef2aSThomas Huth uint32_t oe) 74fcf5ef2aSThomas Huth { 75fcf5ef2aSThomas Huth int64_t rt = 0; 76fcf5ef2aSThomas Huth int overflow = 0; 77fcf5ef2aSThomas Huth 78fcf5ef2aSThomas Huth int64_t dividend = (int64_t)ra << 32; 79fcf5ef2aSThomas Huth int64_t divisor = (int64_t)((int32_t)rb); 80fcf5ef2aSThomas Huth 81fcf5ef2aSThomas Huth if (unlikely((divisor == 0) || 82fcf5ef2aSThomas Huth ((divisor == -1ull) && (dividend == INT64_MIN)))) { 83fcf5ef2aSThomas Huth overflow = 1; 84fcf5ef2aSThomas Huth } else { 85fcf5ef2aSThomas Huth rt = dividend / divisor; 86fcf5ef2aSThomas Huth overflow = rt != (int32_t)rt; 87fcf5ef2aSThomas Huth } 88fcf5ef2aSThomas Huth 89fcf5ef2aSThomas Huth if (unlikely(overflow)) { 90fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 91fcf5ef2aSThomas Huth } 92fcf5ef2aSThomas Huth 93fcf5ef2aSThomas Huth if (oe) { 94f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 95fcf5ef2aSThomas Huth } 96fcf5ef2aSThomas Huth 97fcf5ef2aSThomas Huth return (target_ulong)rt; 98fcf5ef2aSThomas Huth } 99fcf5ef2aSThomas Huth 100fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 101fcf5ef2aSThomas Huth 102fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe) 103fcf5ef2aSThomas Huth { 104fcf5ef2aSThomas Huth uint64_t rt = 0; 105fcf5ef2aSThomas Huth int overflow = 0; 106fcf5ef2aSThomas Huth 1079276a31cSLuis Pires if (unlikely(rb == 0 || ra >= rb)) { 1089276a31cSLuis Pires overflow = 1; 109fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 1109276a31cSLuis Pires } else { 1119276a31cSLuis Pires divu128(&rt, &ra, rb); 112fcf5ef2aSThomas Huth } 113fcf5ef2aSThomas Huth 114fcf5ef2aSThomas Huth if (oe) { 115f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 116fcf5ef2aSThomas Huth } 117fcf5ef2aSThomas Huth 118fcf5ef2aSThomas Huth return rt; 119fcf5ef2aSThomas Huth } 120fcf5ef2aSThomas Huth 121fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe) 122fcf5ef2aSThomas Huth { 12340f3e79aSLuis Pires uint64_t rt = 0; 124fcf5ef2aSThomas Huth int64_t ra = (int64_t)rau; 125fcf5ef2aSThomas Huth int64_t rb = (int64_t)rbu; 1269276a31cSLuis Pires int overflow = 0; 127fcf5ef2aSThomas Huth 1289276a31cSLuis Pires if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) { 1299276a31cSLuis Pires overflow = 1; 130fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 1319276a31cSLuis Pires } else { 1329276a31cSLuis Pires divs128(&rt, &ra, rb); 133fcf5ef2aSThomas Huth } 134fcf5ef2aSThomas Huth 135fcf5ef2aSThomas Huth if (oe) { 136f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 137fcf5ef2aSThomas Huth } 138fcf5ef2aSThomas Huth 139fcf5ef2aSThomas Huth return rt; 140fcf5ef2aSThomas Huth } 141fcf5ef2aSThomas Huth 142fcf5ef2aSThomas Huth #endif 143fcf5ef2aSThomas Huth 144fcf5ef2aSThomas Huth 145fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 146fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */ 147fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff)) 148fcf5ef2aSThomas Huth 149b6cb41b2SDavid Gibson /* 150b6cb41b2SDavid Gibson * subtract 1 from each byte, and with inverse, check if MSB is set at each 151fcf5ef2aSThomas Huth * byte. 152fcf5ef2aSThomas Huth * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80 153fcf5ef2aSThomas Huth * (0xFF & 0xFF) & 0x80 = 0x80 (zero found) 154fcf5ef2aSThomas Huth */ 155fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80)) 156fcf5ef2aSThomas Huth 157fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */ 158fcf5ef2aSThomas Huth #define hasvalue(x, n) (haszero((x) ^ pattern(n))) 159fcf5ef2aSThomas Huth 160fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb) 161fcf5ef2aSThomas Huth { 162efa73196SNikunj A Dadhania return hasvalue(rb, ra) ? CRF_GT : 0; 163fcf5ef2aSThomas Huth } 164fcf5ef2aSThomas Huth 165fcf5ef2aSThomas Huth #undef pattern 166fcf5ef2aSThomas Huth #undef haszero 167fcf5ef2aSThomas Huth #undef hasvalue 168fcf5ef2aSThomas Huth 169b6cb41b2SDavid Gibson /* 1703f74b632SRichard Henderson * Return a random number. 171fcf5ef2aSThomas Huth */ 1723f74b632SRichard Henderson uint64_t helper_darn32(void) 173fcf5ef2aSThomas Huth { 1743f74b632SRichard Henderson Error *err = NULL; 1753f74b632SRichard Henderson uint32_t ret; 1763f74b632SRichard Henderson 1773f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1783f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1793f74b632SRichard Henderson error_get_pretty(err)); 1803f74b632SRichard Henderson error_free(err); 181fcf5ef2aSThomas Huth return -1; 182fcf5ef2aSThomas Huth } 183fcf5ef2aSThomas Huth 1843f74b632SRichard Henderson return ret; 1853f74b632SRichard Henderson } 1863f74b632SRichard Henderson 1873f74b632SRichard Henderson uint64_t helper_darn64(void) 188fcf5ef2aSThomas Huth { 1893f74b632SRichard Henderson Error *err = NULL; 1903f74b632SRichard Henderson uint64_t ret; 1913f74b632SRichard Henderson 1923f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1933f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1943f74b632SRichard Henderson error_get_pretty(err)); 1953f74b632SRichard Henderson error_free(err); 196fcf5ef2aSThomas Huth return -1; 197fcf5ef2aSThomas Huth } 198fcf5ef2aSThomas Huth 1993f74b632SRichard Henderson return ret; 2003f74b632SRichard Henderson } 201fcf5ef2aSThomas Huth 202fcf5ef2aSThomas Huth uint64_t helper_bpermd(uint64_t rs, uint64_t rb) 203fcf5ef2aSThomas Huth { 204fcf5ef2aSThomas Huth int i; 205fcf5ef2aSThomas Huth uint64_t ra = 0; 206fcf5ef2aSThomas Huth 207fcf5ef2aSThomas Huth for (i = 0; i < 8; i++) { 208fcf5ef2aSThomas Huth int index = (rs >> (i * 8)) & 0xFF; 209fcf5ef2aSThomas Huth if (index < 64) { 210a6a444a8SCédric Le Goater if (rb & PPC_BIT(index)) { 211fcf5ef2aSThomas Huth ra |= 1 << i; 212fcf5ef2aSThomas Huth } 213fcf5ef2aSThomas Huth } 214fcf5ef2aSThomas Huth } 215fcf5ef2aSThomas Huth return ra; 216fcf5ef2aSThomas Huth } 217fcf5ef2aSThomas Huth 218fcf5ef2aSThomas Huth #endif 219fcf5ef2aSThomas Huth 220fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb) 221fcf5ef2aSThomas Huth { 222fcf5ef2aSThomas Huth target_ulong mask = 0xff; 223fcf5ef2aSThomas Huth target_ulong ra = 0; 224fcf5ef2aSThomas Huth int i; 225fcf5ef2aSThomas Huth 226fcf5ef2aSThomas Huth for (i = 0; i < sizeof(target_ulong); i++) { 227fcf5ef2aSThomas Huth if ((rs & mask) == (rb & mask)) { 228fcf5ef2aSThomas Huth ra |= mask; 229fcf5ef2aSThomas Huth } 230fcf5ef2aSThomas Huth mask <<= 8; 231fcf5ef2aSThomas Huth } 232fcf5ef2aSThomas Huth return ra; 233fcf5ef2aSThomas Huth } 234fcf5ef2aSThomas Huth 235fcf5ef2aSThomas Huth /* shift right arithmetic helper */ 236fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value, 237fcf5ef2aSThomas Huth target_ulong shift) 238fcf5ef2aSThomas Huth { 239fcf5ef2aSThomas Huth int32_t ret; 240fcf5ef2aSThomas Huth 241fcf5ef2aSThomas Huth if (likely(!(shift & 0x20))) { 242fcf5ef2aSThomas Huth if (likely((uint32_t)shift != 0)) { 243fcf5ef2aSThomas Huth shift &= 0x1f; 244fcf5ef2aSThomas Huth ret = (int32_t)value >> shift; 245fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) { 246af1c259fSSandipan Das env->ca32 = env->ca = 0; 247fcf5ef2aSThomas Huth } else { 248af1c259fSSandipan Das env->ca32 = env->ca = 1; 249fcf5ef2aSThomas Huth } 250fcf5ef2aSThomas Huth } else { 251fcf5ef2aSThomas Huth ret = (int32_t)value; 252af1c259fSSandipan Das env->ca32 = env->ca = 0; 253fcf5ef2aSThomas Huth } 254fcf5ef2aSThomas Huth } else { 255fcf5ef2aSThomas Huth ret = (int32_t)value >> 31; 256af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 257fcf5ef2aSThomas Huth } 258fcf5ef2aSThomas Huth return (target_long)ret; 259fcf5ef2aSThomas Huth } 260fcf5ef2aSThomas Huth 261fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 262fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value, 263fcf5ef2aSThomas Huth target_ulong shift) 264fcf5ef2aSThomas Huth { 265fcf5ef2aSThomas Huth int64_t ret; 266fcf5ef2aSThomas Huth 267fcf5ef2aSThomas Huth if (likely(!(shift & 0x40))) { 268fcf5ef2aSThomas Huth if (likely((uint64_t)shift != 0)) { 269fcf5ef2aSThomas Huth shift &= 0x3f; 270fcf5ef2aSThomas Huth ret = (int64_t)value >> shift; 271fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) { 272af1c259fSSandipan Das env->ca32 = env->ca = 0; 273fcf5ef2aSThomas Huth } else { 274af1c259fSSandipan Das env->ca32 = env->ca = 1; 275fcf5ef2aSThomas Huth } 276fcf5ef2aSThomas Huth } else { 277fcf5ef2aSThomas Huth ret = (int64_t)value; 278af1c259fSSandipan Das env->ca32 = env->ca = 0; 279fcf5ef2aSThomas Huth } 280fcf5ef2aSThomas Huth } else { 281fcf5ef2aSThomas Huth ret = (int64_t)value >> 63; 282af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 283fcf5ef2aSThomas Huth } 284fcf5ef2aSThomas Huth return ret; 285fcf5ef2aSThomas Huth } 286fcf5ef2aSThomas Huth #endif 287fcf5ef2aSThomas Huth 288fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 289fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 290fcf5ef2aSThomas Huth { 29179770002SRichard Henderson /* Note that we don't fold past bytes */ 292fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 293fcf5ef2aSThomas Huth 0x5555555555555555ULL); 294fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 295fcf5ef2aSThomas Huth 0x3333333333333333ULL); 296fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 297fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 298fcf5ef2aSThomas Huth return val; 299fcf5ef2aSThomas Huth } 300fcf5ef2aSThomas Huth 301fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val) 302fcf5ef2aSThomas Huth { 30379770002SRichard Henderson /* Note that we don't fold past words. */ 304fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 305fcf5ef2aSThomas Huth 0x5555555555555555ULL); 306fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 307fcf5ef2aSThomas Huth 0x3333333333333333ULL); 308fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 309fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 310fcf5ef2aSThomas Huth val = (val & 0x00ff00ff00ff00ffULL) + ((val >> 8) & 311fcf5ef2aSThomas Huth 0x00ff00ff00ff00ffULL); 312fcf5ef2aSThomas Huth val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) & 313fcf5ef2aSThomas Huth 0x0000ffff0000ffffULL); 314fcf5ef2aSThomas Huth return val; 315fcf5ef2aSThomas Huth } 316fcf5ef2aSThomas Huth #else 317fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 318fcf5ef2aSThomas Huth { 31979770002SRichard Henderson /* Note that we don't fold past bytes */ 320fcf5ef2aSThomas Huth val = (val & 0x55555555) + ((val >> 1) & 0x55555555); 321fcf5ef2aSThomas Huth val = (val & 0x33333333) + ((val >> 2) & 0x33333333); 322fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f) + ((val >> 4) & 0x0f0f0f0f); 323fcf5ef2aSThomas Huth return val; 324fcf5ef2aSThomas Huth } 325fcf5ef2aSThomas Huth #endif 326fcf5ef2aSThomas Huth 3276e0bbc40SMatheus Ferst uint64_t helper_CFUGED(uint64_t src, uint64_t mask) 32889ccd7dcSMatheus Ferst { 32989ccd7dcSMatheus Ferst /* 33089ccd7dcSMatheus Ferst * Instead of processing the mask bit-by-bit from the most significant to 33189ccd7dcSMatheus Ferst * the least significant bit, as described in PowerISA, we'll handle it in 33289ccd7dcSMatheus Ferst * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use 33389ccd7dcSMatheus Ferst * ctz or cto, we negate the mask at the end of the loop. 33489ccd7dcSMatheus Ferst */ 33589ccd7dcSMatheus Ferst target_ulong m, left = 0, right = 0; 33689ccd7dcSMatheus Ferst unsigned int n, i = 64; 33789ccd7dcSMatheus Ferst bool bit = false; /* tracks if we are processing zeros or ones */ 33889ccd7dcSMatheus Ferst 33989ccd7dcSMatheus Ferst if (mask == 0 || mask == -1) { 34089ccd7dcSMatheus Ferst return src; 34189ccd7dcSMatheus Ferst } 34289ccd7dcSMatheus Ferst 34389ccd7dcSMatheus Ferst /* Processes the mask in blocks, from LSB to MSB */ 34489ccd7dcSMatheus Ferst while (i) { 34589ccd7dcSMatheus Ferst /* Find how many bits we should take */ 34689ccd7dcSMatheus Ferst n = ctz64(mask); 34789ccd7dcSMatheus Ferst if (n > i) { 34889ccd7dcSMatheus Ferst n = i; 34989ccd7dcSMatheus Ferst } 35089ccd7dcSMatheus Ferst 35189ccd7dcSMatheus Ferst /* 35289ccd7dcSMatheus Ferst * Extracts 'n' trailing bits of src and put them on the leading 'n' 35389ccd7dcSMatheus Ferst * bits of 'right' or 'left', pushing down the previously extracted 35489ccd7dcSMatheus Ferst * values. 35589ccd7dcSMatheus Ferst */ 35689ccd7dcSMatheus Ferst m = (1ll << n) - 1; 35789ccd7dcSMatheus Ferst if (bit) { 35889ccd7dcSMatheus Ferst right = ror64(right | (src & m), n); 35989ccd7dcSMatheus Ferst } else { 36089ccd7dcSMatheus Ferst left = ror64(left | (src & m), n); 36189ccd7dcSMatheus Ferst } 36289ccd7dcSMatheus Ferst 36389ccd7dcSMatheus Ferst /* 36489ccd7dcSMatheus Ferst * Discards the processed bits from 'src' and 'mask'. Note that we are 36589ccd7dcSMatheus Ferst * removing 'n' trailing zeros from 'mask', but the logical shift will 36689ccd7dcSMatheus Ferst * add 'n' leading zeros back, so the population count of 'mask' is kept 36789ccd7dcSMatheus Ferst * the same. 36889ccd7dcSMatheus Ferst */ 36989ccd7dcSMatheus Ferst src >>= n; 37089ccd7dcSMatheus Ferst mask >>= n; 37189ccd7dcSMatheus Ferst i -= n; 37289ccd7dcSMatheus Ferst bit = !bit; 37389ccd7dcSMatheus Ferst mask = ~mask; 37489ccd7dcSMatheus Ferst } 37589ccd7dcSMatheus Ferst 37689ccd7dcSMatheus Ferst /* 37789ccd7dcSMatheus Ferst * At the end, right was ror'ed ctpop(mask) times. To put it back in place, 37889ccd7dcSMatheus Ferst * we'll shift it more 64-ctpop(mask) times. 37989ccd7dcSMatheus Ferst */ 38089ccd7dcSMatheus Ferst if (bit) { 38189ccd7dcSMatheus Ferst n = ctpop64(mask); 38289ccd7dcSMatheus Ferst } else { 38389ccd7dcSMatheus Ferst n = 64 - ctpop64(mask); 38489ccd7dcSMatheus Ferst } 38589ccd7dcSMatheus Ferst 38689ccd7dcSMatheus Ferst return left | (right >> n); 38789ccd7dcSMatheus Ferst } 38889ccd7dcSMatheus Ferst 38921ba6e58SMatheus Ferst uint64_t helper_PDEPD(uint64_t src, uint64_t mask) 39021ba6e58SMatheus Ferst { 39121ba6e58SMatheus Ferst int i, o; 39221ba6e58SMatheus Ferst uint64_t result = 0; 39321ba6e58SMatheus Ferst 39421ba6e58SMatheus Ferst if (mask == -1) { 39521ba6e58SMatheus Ferst return src; 39621ba6e58SMatheus Ferst } 39721ba6e58SMatheus Ferst 39821ba6e58SMatheus Ferst for (i = 0; mask != 0; i++) { 39921ba6e58SMatheus Ferst o = ctz64(mask); 40021ba6e58SMatheus Ferst mask &= mask - 1; 40121ba6e58SMatheus Ferst result |= ((src >> i) & 1) << o; 40221ba6e58SMatheus Ferst } 40321ba6e58SMatheus Ferst 40421ba6e58SMatheus Ferst return result; 40521ba6e58SMatheus Ferst } 4068bdb7606SMatheus Ferst 4078bdb7606SMatheus Ferst uint64_t helper_PEXTD(uint64_t src, uint64_t mask) 4088bdb7606SMatheus Ferst { 4098bdb7606SMatheus Ferst int i, o; 4108bdb7606SMatheus Ferst uint64_t result = 0; 4118bdb7606SMatheus Ferst 4128bdb7606SMatheus Ferst if (mask == -1) { 4138bdb7606SMatheus Ferst return src; 4148bdb7606SMatheus Ferst } 4158bdb7606SMatheus Ferst 4168bdb7606SMatheus Ferst for (o = 0; mask != 0; o++) { 4178bdb7606SMatheus Ferst i = ctz64(mask); 4188bdb7606SMatheus Ferst mask &= mask - 1; 4198bdb7606SMatheus Ferst result |= ((src >> i) & 1) << o; 4208bdb7606SMatheus Ferst } 4218bdb7606SMatheus Ferst 4228bdb7606SMatheus Ferst return result; 4238bdb7606SMatheus Ferst } 42421ba6e58SMatheus Ferst 425fcf5ef2aSThomas Huth /*****************************************************************************/ 426fcf5ef2aSThomas Huth /* Altivec extension helpers */ 427fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 428fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 429fcf5ef2aSThomas Huth for (index = 0; index < ARRAY_SIZE(r->element); index++) 430fcf5ef2aSThomas Huth #else 431fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 432fcf5ef2aSThomas Huth for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--) 433fcf5ef2aSThomas Huth #endif 434fcf5ef2aSThomas Huth 435fcf5ef2aSThomas Huth /* Saturating arithmetic helpers. */ 436fcf5ef2aSThomas Huth #define SATCVT(from, to, from_type, to_type, min, max) \ 437fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 438fcf5ef2aSThomas Huth { \ 439fcf5ef2aSThomas Huth to_type r; \ 440fcf5ef2aSThomas Huth \ 441fcf5ef2aSThomas Huth if (x < (from_type)min) { \ 442fcf5ef2aSThomas Huth r = min; \ 443fcf5ef2aSThomas Huth *sat = 1; \ 444fcf5ef2aSThomas Huth } else if (x > (from_type)max) { \ 445fcf5ef2aSThomas Huth r = max; \ 446fcf5ef2aSThomas Huth *sat = 1; \ 447fcf5ef2aSThomas Huth } else { \ 448fcf5ef2aSThomas Huth r = x; \ 449fcf5ef2aSThomas Huth } \ 450fcf5ef2aSThomas Huth return r; \ 451fcf5ef2aSThomas Huth } 452fcf5ef2aSThomas Huth #define SATCVTU(from, to, from_type, to_type, min, max) \ 453fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 454fcf5ef2aSThomas Huth { \ 455fcf5ef2aSThomas Huth to_type r; \ 456fcf5ef2aSThomas Huth \ 457fcf5ef2aSThomas Huth if (x > (from_type)max) { \ 458fcf5ef2aSThomas Huth r = max; \ 459fcf5ef2aSThomas Huth *sat = 1; \ 460fcf5ef2aSThomas Huth } else { \ 461fcf5ef2aSThomas Huth r = x; \ 462fcf5ef2aSThomas Huth } \ 463fcf5ef2aSThomas Huth return r; \ 464fcf5ef2aSThomas Huth } 465fcf5ef2aSThomas Huth SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX) 466fcf5ef2aSThomas Huth SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX) 467fcf5ef2aSThomas Huth SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX) 468fcf5ef2aSThomas Huth 469fcf5ef2aSThomas Huth SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX) 470fcf5ef2aSThomas Huth SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX) 471fcf5ef2aSThomas Huth SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX) 472fcf5ef2aSThomas Huth SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX) 473fcf5ef2aSThomas Huth SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX) 474fcf5ef2aSThomas Huth SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX) 475fcf5ef2aSThomas Huth #undef SATCVT 476fcf5ef2aSThomas Huth #undef SATCVTU 477fcf5ef2aSThomas Huth 478dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr) 479fcf5ef2aSThomas Huth { 480c19940dbSBruno Larsen (billionai) ppc_store_vscr(env, vscr); 481fcf5ef2aSThomas Huth } 482fcf5ef2aSThomas Huth 483cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env) 484cc2b90d7SRichard Henderson { 485c19940dbSBruno Larsen (billionai) return ppc_get_vscr(env); 486cc2b90d7SRichard Henderson } 487cc2b90d7SRichard Henderson 4886175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env) 4896175f5a0SRichard Henderson { 4909b5b74daSRichard Henderson /* The choice of non-zero value is arbitrary. */ 4919b5b74daSRichard Henderson env->vscr_sat.u32[0] = 1; 4926175f5a0SRichard Henderson } 4936175f5a0SRichard Henderson 494fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 495fcf5ef2aSThomas Huth { 496fcf5ef2aSThomas Huth int i; 497fcf5ef2aSThomas Huth 498fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 499fcf5ef2aSThomas Huth r->u32[i] = ~a->u32[i] < b->u32[i]; 500fcf5ef2aSThomas Huth } 501fcf5ef2aSThomas Huth } 502fcf5ef2aSThomas Huth 503fcf5ef2aSThomas Huth /* vprtybw */ 504fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b) 505fcf5ef2aSThomas Huth { 506fcf5ef2aSThomas Huth int i; 507fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 508fcf5ef2aSThomas Huth uint64_t res = b->u32[i] ^ (b->u32[i] >> 16); 509fcf5ef2aSThomas Huth res ^= res >> 8; 510fcf5ef2aSThomas Huth r->u32[i] = res & 1; 511fcf5ef2aSThomas Huth } 512fcf5ef2aSThomas Huth } 513fcf5ef2aSThomas Huth 514fcf5ef2aSThomas Huth /* vprtybd */ 515fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b) 516fcf5ef2aSThomas Huth { 517fcf5ef2aSThomas Huth int i; 518fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 519fcf5ef2aSThomas Huth uint64_t res = b->u64[i] ^ (b->u64[i] >> 32); 520fcf5ef2aSThomas Huth res ^= res >> 16; 521fcf5ef2aSThomas Huth res ^= res >> 8; 522fcf5ef2aSThomas Huth r->u64[i] = res & 1; 523fcf5ef2aSThomas Huth } 524fcf5ef2aSThomas Huth } 525fcf5ef2aSThomas Huth 526fcf5ef2aSThomas Huth /* vprtybq */ 527fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b) 528fcf5ef2aSThomas Huth { 529fcf5ef2aSThomas Huth uint64_t res = b->u64[0] ^ b->u64[1]; 530fcf5ef2aSThomas Huth res ^= res >> 32; 531fcf5ef2aSThomas Huth res ^= res >> 16; 532fcf5ef2aSThomas Huth res ^= res >> 8; 5333c385a93SMark Cave-Ayland r->VsrD(1) = res & 1; 5343c385a93SMark Cave-Ayland r->VsrD(0) = 0; 535fcf5ef2aSThomas Huth } 536fcf5ef2aSThomas Huth 537fcf5ef2aSThomas Huth #define VARITHFP(suffix, func) \ 538fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 539fcf5ef2aSThomas Huth ppc_avr_t *b) \ 540fcf5ef2aSThomas Huth { \ 541fcf5ef2aSThomas Huth int i; \ 542fcf5ef2aSThomas Huth \ 54305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 54405ee3e8aSMark Cave-Ayland r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status); \ 545fcf5ef2aSThomas Huth } \ 546fcf5ef2aSThomas Huth } 547fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add) 548fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub) 549fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min) 550fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max) 551fcf5ef2aSThomas Huth #undef VARITHFP 552fcf5ef2aSThomas Huth 553fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type) \ 554fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 555fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) \ 556fcf5ef2aSThomas Huth { \ 557fcf5ef2aSThomas Huth int i; \ 55805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 55905ee3e8aSMark Cave-Ayland r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \ 560fcf5ef2aSThomas Huth type, &env->vec_status); \ 561fcf5ef2aSThomas Huth } \ 562fcf5ef2aSThomas Huth } 563fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0); 564fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c); 565fcf5ef2aSThomas Huth #undef VARITHFPFMA 566fcf5ef2aSThomas Huth 567fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element) \ 568fcf5ef2aSThomas Huth { \ 569fcf5ef2aSThomas Huth type result = (type)a->element[i] op (type)b->element[i]; \ 570fcf5ef2aSThomas Huth r->element[i] = cvt(result, &sat); \ 571fcf5ef2aSThomas Huth } 572fcf5ef2aSThomas Huth 573fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element) \ 574fb11ae7dSRichard Henderson void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat, \ 575fb11ae7dSRichard Henderson ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \ 576fcf5ef2aSThomas Huth { \ 577fcf5ef2aSThomas Huth int sat = 0; \ 578fcf5ef2aSThomas Huth int i; \ 579fcf5ef2aSThomas Huth \ 580fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 581fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 582fcf5ef2aSThomas Huth } \ 583fcf5ef2aSThomas Huth if (sat) { \ 584fb11ae7dSRichard Henderson vscr_sat->u32[0] = 1; \ 585fcf5ef2aSThomas Huth } \ 586fcf5ef2aSThomas Huth } 587fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt) \ 588fcf5ef2aSThomas Huth VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element) \ 589fcf5ef2aSThomas Huth VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element) 590fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt) \ 591fcf5ef2aSThomas Huth VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element) \ 592fcf5ef2aSThomas Huth VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element) 593fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb) 594fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh) 595fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw) 596fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub) 597fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh) 598fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw) 599fcf5ef2aSThomas Huth #undef VARITHSAT_CASE 600fcf5ef2aSThomas Huth #undef VARITHSAT_DO 601fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED 602fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED 603fcf5ef2aSThomas Huth 604fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype) \ 605fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 606fcf5ef2aSThomas Huth { \ 607fcf5ef2aSThomas Huth int i; \ 608fcf5ef2aSThomas Huth \ 609fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 610fcf5ef2aSThomas Huth etype x = (etype)a->element[i] + (etype)b->element[i] + 1; \ 611fcf5ef2aSThomas Huth r->element[i] = x >> 1; \ 612fcf5ef2aSThomas Huth } \ 613fcf5ef2aSThomas Huth } 614fcf5ef2aSThomas Huth 615fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element, \ 616fcf5ef2aSThomas Huth unsigned_type) \ 617fcf5ef2aSThomas Huth VAVG_DO(avgs##type, signed_element, signed_type) \ 618fcf5ef2aSThomas Huth VAVG_DO(avgu##type, unsigned_element, unsigned_type) 619fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t) 620fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t) 621fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t) 622fcf5ef2aSThomas Huth #undef VAVG_DO 623fcf5ef2aSThomas Huth #undef VAVG 624fcf5ef2aSThomas Huth 625fcf5ef2aSThomas Huth #define VABSDU_DO(name, element) \ 626fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 627fcf5ef2aSThomas Huth { \ 628fcf5ef2aSThomas Huth int i; \ 629fcf5ef2aSThomas Huth \ 630fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 631fcf5ef2aSThomas Huth r->element[i] = (a->element[i] > b->element[i]) ? \ 632fcf5ef2aSThomas Huth (a->element[i] - b->element[i]) : \ 633fcf5ef2aSThomas Huth (b->element[i] - a->element[i]); \ 634fcf5ef2aSThomas Huth } \ 635fcf5ef2aSThomas Huth } 636fcf5ef2aSThomas Huth 637b6cb41b2SDavid Gibson /* 638b6cb41b2SDavid Gibson * VABSDU - Vector absolute difference unsigned 639fcf5ef2aSThomas Huth * name - instruction mnemonic suffix (b: byte, h: halfword, w: word) 640fcf5ef2aSThomas Huth * element - element type to access from vector 641fcf5ef2aSThomas Huth */ 642fcf5ef2aSThomas Huth #define VABSDU(type, element) \ 643fcf5ef2aSThomas Huth VABSDU_DO(absdu##type, element) 644fcf5ef2aSThomas Huth VABSDU(b, u8) 645fcf5ef2aSThomas Huth VABSDU(h, u16) 646fcf5ef2aSThomas Huth VABSDU(w, u32) 647fcf5ef2aSThomas Huth #undef VABSDU_DO 648fcf5ef2aSThomas Huth #undef VABSDU 649fcf5ef2aSThomas Huth 650fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element) \ 651fcf5ef2aSThomas Huth void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r, \ 652fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 653fcf5ef2aSThomas Huth { \ 654fcf5ef2aSThomas Huth int i; \ 655fcf5ef2aSThomas Huth \ 65605ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 657fcf5ef2aSThomas Huth float32 t = cvt(b->element[i], &env->vec_status); \ 65805ee3e8aSMark Cave-Ayland r->f32[i] = float32_scalbn(t, -uim, &env->vec_status); \ 659fcf5ef2aSThomas Huth } \ 660fcf5ef2aSThomas Huth } 661fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32) 662fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32) 663fcf5ef2aSThomas Huth #undef VCF 664fcf5ef2aSThomas Huth 665eb936dc0SMatheus Ferst #define VCMPNEZ(NAME, ELEM) \ 666eb936dc0SMatheus Ferst void helper_##NAME(ppc_vsr_t *t, ppc_vsr_t *a, ppc_vsr_t *b, uint32_t desc) \ 667fcf5ef2aSThomas Huth { \ 668eb936dc0SMatheus Ferst for (int i = 0; i < ARRAY_SIZE(t->ELEM); i++) { \ 669eb936dc0SMatheus Ferst t->ELEM[i] = ((a->ELEM[i] == 0) || (b->ELEM[i] == 0) || \ 670eb936dc0SMatheus Ferst (a->ELEM[i] != b->ELEM[i])) ? -1 : 0; \ 671fcf5ef2aSThomas Huth } \ 672fcf5ef2aSThomas Huth } 673eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZB, u8) 674eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZH, u16) 675eb936dc0SMatheus Ferst VCMPNEZ(VCMPNEZW, u32) 676eb936dc0SMatheus Ferst #undef VCMPNEZ 677fcf5ef2aSThomas Huth 678fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record) \ 679fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 680fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 681fcf5ef2aSThomas Huth { \ 682fcf5ef2aSThomas Huth uint32_t ones = (uint32_t)-1; \ 683fcf5ef2aSThomas Huth uint32_t all = ones; \ 684fcf5ef2aSThomas Huth uint32_t none = 0; \ 685fcf5ef2aSThomas Huth int i; \ 686fcf5ef2aSThomas Huth \ 68705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 688fcf5ef2aSThomas Huth uint32_t result; \ 68971bfd65cSRichard Henderson FloatRelation rel = \ 69071bfd65cSRichard Henderson float32_compare_quiet(a->f32[i], b->f32[i], \ 691fcf5ef2aSThomas Huth &env->vec_status); \ 692fcf5ef2aSThomas Huth if (rel == float_relation_unordered) { \ 693fcf5ef2aSThomas Huth result = 0; \ 694fcf5ef2aSThomas Huth } else if (rel compare order) { \ 695fcf5ef2aSThomas Huth result = ones; \ 696fcf5ef2aSThomas Huth } else { \ 697fcf5ef2aSThomas Huth result = 0; \ 698fcf5ef2aSThomas Huth } \ 699fcf5ef2aSThomas Huth r->u32[i] = result; \ 700fcf5ef2aSThomas Huth all &= result; \ 701fcf5ef2aSThomas Huth none |= result; \ 702fcf5ef2aSThomas Huth } \ 703fcf5ef2aSThomas Huth if (record) { \ 704fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 705fcf5ef2aSThomas Huth } \ 706fcf5ef2aSThomas Huth } 707fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order) \ 708fcf5ef2aSThomas Huth VCMPFP_DO(suffix, compare, order, 0) \ 709fcf5ef2aSThomas Huth VCMPFP_DO(suffix##_dot, compare, order, 1) 710fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal) 711fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less) 712fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater) 713fcf5ef2aSThomas Huth #undef VCMPFP_DO 714fcf5ef2aSThomas Huth #undef VCMPFP 715fcf5ef2aSThomas Huth 716fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r, 717fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b, int record) 718fcf5ef2aSThomas Huth { 719fcf5ef2aSThomas Huth int i; 720fcf5ef2aSThomas Huth int all_in = 0; 721fcf5ef2aSThomas Huth 72205ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 72371bfd65cSRichard Henderson FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i], 72405ee3e8aSMark Cave-Ayland &env->vec_status); 725fcf5ef2aSThomas Huth if (le_rel == float_relation_unordered) { 726fcf5ef2aSThomas Huth r->u32[i] = 0xc0000000; 727fcf5ef2aSThomas Huth all_in = 1; 728fcf5ef2aSThomas Huth } else { 72905ee3e8aSMark Cave-Ayland float32 bneg = float32_chs(b->f32[i]); 73071bfd65cSRichard Henderson FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg, 73105ee3e8aSMark Cave-Ayland &env->vec_status); 732fcf5ef2aSThomas Huth int le = le_rel != float_relation_greater; 733fcf5ef2aSThomas Huth int ge = ge_rel != float_relation_less; 734fcf5ef2aSThomas Huth 735fcf5ef2aSThomas Huth r->u32[i] = ((!le) << 31) | ((!ge) << 30); 736fcf5ef2aSThomas Huth all_in |= (!le | !ge); 737fcf5ef2aSThomas Huth } 738fcf5ef2aSThomas Huth } 739fcf5ef2aSThomas Huth if (record) { 740fcf5ef2aSThomas Huth env->crf[6] = (all_in == 0) << 1; 741fcf5ef2aSThomas Huth } 742fcf5ef2aSThomas Huth } 743fcf5ef2aSThomas Huth 744fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 745fcf5ef2aSThomas Huth { 746fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 0); 747fcf5ef2aSThomas Huth } 748fcf5ef2aSThomas Huth 749fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 750fcf5ef2aSThomas Huth ppc_avr_t *b) 751fcf5ef2aSThomas Huth { 752fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 1); 753fcf5ef2aSThomas Huth } 754fcf5ef2aSThomas Huth 755fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element) \ 756fcf5ef2aSThomas Huth void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r, \ 757fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 758fcf5ef2aSThomas Huth { \ 759fcf5ef2aSThomas Huth int i; \ 760fcf5ef2aSThomas Huth int sat = 0; \ 761fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 762fcf5ef2aSThomas Huth \ 763fcf5ef2aSThomas Huth set_float_rounding_mode(float_round_to_zero, &s); \ 76405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 76505ee3e8aSMark Cave-Ayland if (float32_is_any_nan(b->f32[i])) { \ 766fcf5ef2aSThomas Huth r->element[i] = 0; \ 767fcf5ef2aSThomas Huth } else { \ 76805ee3e8aSMark Cave-Ayland float64 t = float32_to_float64(b->f32[i], &s); \ 769fcf5ef2aSThomas Huth int64_t j; \ 770fcf5ef2aSThomas Huth \ 771fcf5ef2aSThomas Huth t = float64_scalbn(t, uim, &s); \ 772fcf5ef2aSThomas Huth j = float64_to_int64(t, &s); \ 773fcf5ef2aSThomas Huth r->element[i] = satcvt(j, &sat); \ 774fcf5ef2aSThomas Huth } \ 775fcf5ef2aSThomas Huth } \ 776fcf5ef2aSThomas Huth if (sat) { \ 7776175f5a0SRichard Henderson set_vscr_sat(env); \ 778fcf5ef2aSThomas Huth } \ 779fcf5ef2aSThomas Huth } 780fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32) 781fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32) 782fcf5ef2aSThomas Huth #undef VCT 783fcf5ef2aSThomas Huth 784fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r) 785fcf5ef2aSThomas Huth { 786fcf5ef2aSThomas Huth target_ulong count = 0; 787fcf5ef2aSThomas Huth int i; 78860594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 78960594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 790fcf5ef2aSThomas Huth break; 791fcf5ef2aSThomas Huth } 792fcf5ef2aSThomas Huth count++; 793fcf5ef2aSThomas Huth } 794fcf5ef2aSThomas Huth return count; 795fcf5ef2aSThomas Huth } 796fcf5ef2aSThomas Huth 797fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r) 798fcf5ef2aSThomas Huth { 799fcf5ef2aSThomas Huth target_ulong count = 0; 800fcf5ef2aSThomas Huth int i; 801fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 80260594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 803fcf5ef2aSThomas Huth break; 804fcf5ef2aSThomas Huth } 805fcf5ef2aSThomas Huth count++; 806fcf5ef2aSThomas Huth } 807fcf5ef2aSThomas Huth return count; 808fcf5ef2aSThomas Huth } 809fcf5ef2aSThomas Huth 810fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 811fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 812fcf5ef2aSThomas Huth { 813fcf5ef2aSThomas Huth int sat = 0; 814fcf5ef2aSThomas Huth int i; 815fcf5ef2aSThomas Huth 816fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 817fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 818fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 819fcf5ef2aSThomas Huth 820fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 821fcf5ef2aSThomas Huth } 822fcf5ef2aSThomas Huth 823fcf5ef2aSThomas Huth if (sat) { 8246175f5a0SRichard Henderson set_vscr_sat(env); 825fcf5ef2aSThomas Huth } 826fcf5ef2aSThomas Huth } 827fcf5ef2aSThomas Huth 828fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 829fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 830fcf5ef2aSThomas Huth { 831fcf5ef2aSThomas Huth int sat = 0; 832fcf5ef2aSThomas Huth int i; 833fcf5ef2aSThomas Huth 834fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 835fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i] + 0x00004000; 836fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 837fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 838fcf5ef2aSThomas Huth } 839fcf5ef2aSThomas Huth 840fcf5ef2aSThomas Huth if (sat) { 8416175f5a0SRichard Henderson set_vscr_sat(env); 842fcf5ef2aSThomas Huth } 843fcf5ef2aSThomas Huth } 844fcf5ef2aSThomas Huth 845fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 846fcf5ef2aSThomas Huth { 847fcf5ef2aSThomas Huth int i; 848fcf5ef2aSThomas Huth 849fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 850fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 851fcf5ef2aSThomas Huth r->s16[i] = (int16_t) (prod + c->s16[i]); 852fcf5ef2aSThomas Huth } 853fcf5ef2aSThomas Huth } 854fcf5ef2aSThomas Huth 855d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs) \ 856fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 857fcf5ef2aSThomas Huth { \ 858fcf5ef2aSThomas Huth ppc_avr_t result; \ 859d81c2040SMark Cave-Ayland int i, half = ARRAY_SIZE(r->element) / 2; \ 860fcf5ef2aSThomas Huth \ 861d81c2040SMark Cave-Ayland for (i = 0; i < half; i++) { \ 862d81c2040SMark Cave-Ayland result.access(i * 2 + 0) = a->access(i + ofs); \ 863d81c2040SMark Cave-Ayland result.access(i * 2 + 1) = b->access(i + ofs); \ 864fcf5ef2aSThomas Huth } \ 865fcf5ef2aSThomas Huth *r = result; \ 866fcf5ef2aSThomas Huth } 867d81c2040SMark Cave-Ayland 868d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access) \ 869d81c2040SMark Cave-Ayland VMRG_DO(mrgl##suffix, element, access, half) \ 870d81c2040SMark Cave-Ayland VMRG_DO(mrgh##suffix, element, access, 0) 871d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB) 872d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH) 873d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW) 874fcf5ef2aSThomas Huth #undef VMRG_DO 875fcf5ef2aSThomas Huth #undef VMRG 876fcf5ef2aSThomas Huth 877fcf5ef2aSThomas Huth void helper_vmsummbm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 878fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 879fcf5ef2aSThomas Huth { 880fcf5ef2aSThomas Huth int32_t prod[16]; 881fcf5ef2aSThomas Huth int i; 882fcf5ef2aSThomas Huth 883fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s8); i++) { 884fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s8[i] * b->u8[i]; 885fcf5ef2aSThomas Huth } 886fcf5ef2aSThomas Huth 887fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 888fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] + 889fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 890fcf5ef2aSThomas Huth } 891fcf5ef2aSThomas Huth } 892fcf5ef2aSThomas Huth 893fcf5ef2aSThomas Huth void helper_vmsumshm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 894fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 895fcf5ef2aSThomas Huth { 896fcf5ef2aSThomas Huth int32_t prod[8]; 897fcf5ef2aSThomas Huth int i; 898fcf5ef2aSThomas Huth 899fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 900fcf5ef2aSThomas Huth prod[i] = a->s16[i] * b->s16[i]; 901fcf5ef2aSThomas Huth } 902fcf5ef2aSThomas Huth 903fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 904fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 905fcf5ef2aSThomas Huth } 906fcf5ef2aSThomas Huth } 907fcf5ef2aSThomas Huth 908fcf5ef2aSThomas Huth void helper_vmsumshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 909fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 910fcf5ef2aSThomas Huth { 911fcf5ef2aSThomas Huth int32_t prod[8]; 912fcf5ef2aSThomas Huth int i; 913fcf5ef2aSThomas Huth int sat = 0; 914fcf5ef2aSThomas Huth 915fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 916fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s16[i] * b->s16[i]; 917fcf5ef2aSThomas Huth } 918fcf5ef2aSThomas Huth 919fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 920fcf5ef2aSThomas Huth int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 921fcf5ef2aSThomas Huth 922fcf5ef2aSThomas Huth r->u32[i] = cvtsdsw(t, &sat); 923fcf5ef2aSThomas Huth } 924fcf5ef2aSThomas Huth 925fcf5ef2aSThomas Huth if (sat) { 9266175f5a0SRichard Henderson set_vscr_sat(env); 927fcf5ef2aSThomas Huth } 928fcf5ef2aSThomas Huth } 929fcf5ef2aSThomas Huth 930fcf5ef2aSThomas Huth void helper_vmsumubm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 931fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 932fcf5ef2aSThomas Huth { 933fcf5ef2aSThomas Huth uint16_t prod[16]; 934fcf5ef2aSThomas Huth int i; 935fcf5ef2aSThomas Huth 936fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 937fcf5ef2aSThomas Huth prod[i] = a->u8[i] * b->u8[i]; 938fcf5ef2aSThomas Huth } 939fcf5ef2aSThomas Huth 940fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 941fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] + 942fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 943fcf5ef2aSThomas Huth } 944fcf5ef2aSThomas Huth } 945fcf5ef2aSThomas Huth 946fcf5ef2aSThomas Huth void helper_vmsumuhm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 947fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 948fcf5ef2aSThomas Huth { 949fcf5ef2aSThomas Huth uint32_t prod[8]; 950fcf5ef2aSThomas Huth int i; 951fcf5ef2aSThomas Huth 952fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 953fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 954fcf5ef2aSThomas Huth } 955fcf5ef2aSThomas Huth 956fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 957fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 958fcf5ef2aSThomas Huth } 959fcf5ef2aSThomas Huth } 960fcf5ef2aSThomas Huth 961fcf5ef2aSThomas Huth void helper_vmsumuhs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 962fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 963fcf5ef2aSThomas Huth { 964fcf5ef2aSThomas Huth uint32_t prod[8]; 965fcf5ef2aSThomas Huth int i; 966fcf5ef2aSThomas Huth int sat = 0; 967fcf5ef2aSThomas Huth 968fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 969fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 970fcf5ef2aSThomas Huth } 971fcf5ef2aSThomas Huth 972fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 973fcf5ef2aSThomas Huth uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 974fcf5ef2aSThomas Huth 975fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 976fcf5ef2aSThomas Huth } 977fcf5ef2aSThomas Huth 978fcf5ef2aSThomas Huth if (sat) { 9796175f5a0SRichard Henderson set_vscr_sat(env); 980fcf5ef2aSThomas Huth } 981fcf5ef2aSThomas Huth } 982fcf5ef2aSThomas Huth 9834fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast) \ 98480eca687SLucas Mateus Castro (alqotel) void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 985fcf5ef2aSThomas Huth { \ 986fcf5ef2aSThomas Huth int i; \ 987fcf5ef2aSThomas Huth \ 9884fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 9894fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i) * \ 9904fbc89edSMark Cave-Ayland (cast)b->mul_access(i); \ 991fcf5ef2aSThomas Huth } \ 992fcf5ef2aSThomas Huth } 9934fbc89edSMark Cave-Ayland 9944fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast) \ 99580eca687SLucas Mateus Castro (alqotel) void helper_V##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 9964fbc89edSMark Cave-Ayland { \ 9974fbc89edSMark Cave-Ayland int i; \ 9984fbc89edSMark Cave-Ayland \ 9994fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 10004fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) * \ 10014fbc89edSMark Cave-Ayland (cast)b->mul_access(i + 1); \ 10024fbc89edSMark Cave-Ayland } \ 10034fbc89edSMark Cave-Ayland } 10044fbc89edSMark Cave-Ayland 10054fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast) \ 100680eca687SLucas Mateus Castro (alqotel) VMUL_DO_EVN(MULE##suffix, mul_element, mul_access, prod_access, cast) \ 100780eca687SLucas Mateus Castro (alqotel) VMUL_DO_ODD(MULO##suffix, mul_element, mul_access, prod_access, cast) 100880eca687SLucas Mateus Castro (alqotel) VMUL(SB, s8, VsrSB, VsrSH, int16_t) 100980eca687SLucas Mateus Castro (alqotel) VMUL(SH, s16, VsrSH, VsrSW, int32_t) 101080eca687SLucas Mateus Castro (alqotel) VMUL(SW, s32, VsrSW, VsrSD, int64_t) 101180eca687SLucas Mateus Castro (alqotel) VMUL(UB, u8, VsrB, VsrH, uint16_t) 101280eca687SLucas Mateus Castro (alqotel) VMUL(UH, u16, VsrH, VsrW, uint32_t) 101380eca687SLucas Mateus Castro (alqotel) VMUL(UW, u32, VsrW, VsrD, uint64_t) 10144fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN 10154fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD 1016fcf5ef2aSThomas Huth #undef VMUL 1017fcf5ef2aSThomas Huth 1018fcf5ef2aSThomas Huth void helper_vperm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1019fcf5ef2aSThomas Huth ppc_avr_t *c) 1020fcf5ef2aSThomas Huth { 1021fcf5ef2aSThomas Huth ppc_avr_t result; 1022fcf5ef2aSThomas Huth int i; 1023fcf5ef2aSThomas Huth 102460594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 102560594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1026fcf5ef2aSThomas Huth int index = s & 0xf; 1027fcf5ef2aSThomas Huth 1028fcf5ef2aSThomas Huth if (s & 0x10) { 102960594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1030fcf5ef2aSThomas Huth } else { 103160594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1032fcf5ef2aSThomas Huth } 1033fcf5ef2aSThomas Huth } 1034fcf5ef2aSThomas Huth *r = result; 1035fcf5ef2aSThomas Huth } 1036fcf5ef2aSThomas Huth 1037fcf5ef2aSThomas Huth void helper_vpermr(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1038fcf5ef2aSThomas Huth ppc_avr_t *c) 1039fcf5ef2aSThomas Huth { 1040fcf5ef2aSThomas Huth ppc_avr_t result; 1041fcf5ef2aSThomas Huth int i; 1042fcf5ef2aSThomas Huth 104360594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 104460594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1045fcf5ef2aSThomas Huth int index = 15 - (s & 0xf); 1046fcf5ef2aSThomas Huth 1047fcf5ef2aSThomas Huth if (s & 0x10) { 104860594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1049fcf5ef2aSThomas Huth } else { 105060594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1051fcf5ef2aSThomas Huth } 1052fcf5ef2aSThomas Huth } 1053fcf5ef2aSThomas Huth *r = result; 1054fcf5ef2aSThomas Huth } 1055fcf5ef2aSThomas Huth 1056fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1057fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)]) 1058fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (i) 1059fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) != 0) 1060fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) (extract64((avr)->u64[i], index, 1)) 1061fcf5ef2aSThomas Huth #else 1062fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)]) 1063fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (1 - i) 1064fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) == 0) 1065fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) \ 1066fcf5ef2aSThomas Huth (extract64((avr)->u64[1 - i], 63 - index, 1)) 1067fcf5ef2aSThomas Huth #endif 1068fcf5ef2aSThomas Huth 1069fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1070fcf5ef2aSThomas Huth { 1071fcf5ef2aSThomas Huth int i, j; 1072fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 1073fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1074fcf5ef2aSThomas Huth for (j = 0; j < 8; j++) { 1075fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, (i * 8) + j); 1076fcf5ef2aSThomas Huth if (index < 64 && EXTRACT_BIT(a, i, index)) { 1077fcf5ef2aSThomas Huth result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j); 1078fcf5ef2aSThomas Huth } 1079fcf5ef2aSThomas Huth } 1080fcf5ef2aSThomas Huth } 1081fcf5ef2aSThomas Huth *r = result; 1082fcf5ef2aSThomas Huth } 1083fcf5ef2aSThomas Huth 1084fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1085fcf5ef2aSThomas Huth { 1086fcf5ef2aSThomas Huth int i; 1087fcf5ef2aSThomas Huth uint64_t perm = 0; 1088fcf5ef2aSThomas Huth 1089fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1090fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, i); 1091fcf5ef2aSThomas Huth 1092fcf5ef2aSThomas Huth if (index < 128) { 1093fcf5ef2aSThomas Huth uint64_t mask = (1ull << (63 - (index & 0x3F))); 1094fcf5ef2aSThomas Huth if (a->u64[VBPERMQ_DW(index)] & mask) { 1095fcf5ef2aSThomas Huth perm |= (0x8000 >> i); 1096fcf5ef2aSThomas Huth } 1097fcf5ef2aSThomas Huth } 1098fcf5ef2aSThomas Huth } 1099fcf5ef2aSThomas Huth 11003c385a93SMark Cave-Ayland r->VsrD(0) = perm; 11013c385a93SMark Cave-Ayland r->VsrD(1) = 0; 1102fcf5ef2aSThomas Huth } 1103fcf5ef2aSThomas Huth 1104fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX 1105fcf5ef2aSThomas Huth #undef VBPERMQ_DW 1106fcf5ef2aSThomas Huth 1107fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp) \ 1108fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1109fcf5ef2aSThomas Huth { \ 1110fcf5ef2aSThomas Huth int i, j; \ 1111fcf5ef2aSThomas Huth trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])]; \ 1112fcf5ef2aSThomas Huth \ 1113fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, srcfld) { \ 1114fcf5ef2aSThomas Huth prod[i] = 0; \ 1115fcf5ef2aSThomas Huth for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) { \ 1116fcf5ef2aSThomas Huth if (a->srcfld[i] & (1ull << j)) { \ 1117fcf5ef2aSThomas Huth prod[i] ^= ((trgtyp)b->srcfld[i] << j); \ 1118fcf5ef2aSThomas Huth } \ 1119fcf5ef2aSThomas Huth } \ 1120fcf5ef2aSThomas Huth } \ 1121fcf5ef2aSThomas Huth \ 1122fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, trgfld) { \ 1123fcf5ef2aSThomas Huth r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1]; \ 1124fcf5ef2aSThomas Huth } \ 1125fcf5ef2aSThomas Huth } 1126fcf5ef2aSThomas Huth 1127fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t) 1128fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t) 1129fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t) 1130fcf5ef2aSThomas Huth 1131fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1132fcf5ef2aSThomas Huth { 1133fcf5ef2aSThomas Huth 1134fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1135fcf5ef2aSThomas Huth int i, j; 1136fcf5ef2aSThomas Huth __uint128_t prod[2]; 1137fcf5ef2aSThomas Huth 1138fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1139fcf5ef2aSThomas Huth prod[i] = 0; 1140fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1141fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1142fcf5ef2aSThomas Huth prod[i] ^= (((__uint128_t)b->u64[i]) << j); 1143fcf5ef2aSThomas Huth } 1144fcf5ef2aSThomas Huth } 1145fcf5ef2aSThomas Huth } 1146fcf5ef2aSThomas Huth 1147fcf5ef2aSThomas Huth r->u128 = prod[0] ^ prod[1]; 1148fcf5ef2aSThomas Huth 1149fcf5ef2aSThomas Huth #else 1150fcf5ef2aSThomas Huth int i, j; 1151fcf5ef2aSThomas Huth ppc_avr_t prod[2]; 1152fcf5ef2aSThomas Huth 1153fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 11543c385a93SMark Cave-Ayland prod[i].VsrD(1) = prod[i].VsrD(0) = 0; 1155fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1156fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1157fcf5ef2aSThomas Huth ppc_avr_t bshift; 1158fcf5ef2aSThomas Huth if (j == 0) { 11593c385a93SMark Cave-Ayland bshift.VsrD(0) = 0; 11603c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i]; 1161fcf5ef2aSThomas Huth } else { 11623c385a93SMark Cave-Ayland bshift.VsrD(0) = b->u64[i] >> (64 - j); 11633c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i] << j; 1164fcf5ef2aSThomas Huth } 11653c385a93SMark Cave-Ayland prod[i].VsrD(1) ^= bshift.VsrD(1); 11663c385a93SMark Cave-Ayland prod[i].VsrD(0) ^= bshift.VsrD(0); 1167fcf5ef2aSThomas Huth } 1168fcf5ef2aSThomas Huth } 1169fcf5ef2aSThomas Huth } 1170fcf5ef2aSThomas Huth 11713c385a93SMark Cave-Ayland r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1); 11723c385a93SMark Cave-Ayland r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0); 1173fcf5ef2aSThomas Huth #endif 1174fcf5ef2aSThomas Huth } 1175fcf5ef2aSThomas Huth 1176fcf5ef2aSThomas Huth 1177fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1178fcf5ef2aSThomas Huth #define PKBIG 1 1179fcf5ef2aSThomas Huth #else 1180fcf5ef2aSThomas Huth #define PKBIG 0 1181fcf5ef2aSThomas Huth #endif 1182fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1183fcf5ef2aSThomas Huth { 1184fcf5ef2aSThomas Huth int i, j; 1185fcf5ef2aSThomas Huth ppc_avr_t result; 1186fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1187fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { a, b }; 1188fcf5ef2aSThomas Huth #else 1189fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { b, a }; 1190fcf5ef2aSThomas Huth #endif 1191fcf5ef2aSThomas Huth 1192fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1193fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(j, u32) { 1194fcf5ef2aSThomas Huth uint32_t e = x[i]->u32[j]; 1195fcf5ef2aSThomas Huth 1196fcf5ef2aSThomas Huth result.u16[4 * i + j] = (((e >> 9) & 0xfc00) | 1197fcf5ef2aSThomas Huth ((e >> 6) & 0x3e0) | 1198fcf5ef2aSThomas Huth ((e >> 3) & 0x1f)); 1199fcf5ef2aSThomas Huth } 1200fcf5ef2aSThomas Huth } 1201fcf5ef2aSThomas Huth *r = result; 1202fcf5ef2aSThomas Huth } 1203fcf5ef2aSThomas Huth 1204fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat) \ 1205fcf5ef2aSThomas Huth void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1206fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 1207fcf5ef2aSThomas Huth { \ 1208fcf5ef2aSThomas Huth int i; \ 1209fcf5ef2aSThomas Huth int sat = 0; \ 1210fcf5ef2aSThomas Huth ppc_avr_t result; \ 1211fcf5ef2aSThomas Huth ppc_avr_t *a0 = PKBIG ? a : b; \ 1212fcf5ef2aSThomas Huth ppc_avr_t *a1 = PKBIG ? b : a; \ 1213fcf5ef2aSThomas Huth \ 1214fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, from) { \ 1215fcf5ef2aSThomas Huth result.to[i] = cvt(a0->from[i], &sat); \ 1216fcf5ef2aSThomas Huth result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\ 1217fcf5ef2aSThomas Huth } \ 1218fcf5ef2aSThomas Huth *r = result; \ 1219fcf5ef2aSThomas Huth if (dosat && sat) { \ 12206175f5a0SRichard Henderson set_vscr_sat(env); \ 1221fcf5ef2aSThomas Huth } \ 1222fcf5ef2aSThomas Huth } 1223fcf5ef2aSThomas Huth #define I(x, y) (x) 1224fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1) 1225fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1) 1226fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1) 1227fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1) 1228fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1) 1229fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1) 1230fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1) 1231fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1) 1232fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1) 1233fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0) 1234fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0) 1235fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0) 1236fcf5ef2aSThomas Huth #undef I 1237fcf5ef2aSThomas Huth #undef VPK 1238fcf5ef2aSThomas Huth #undef PKBIG 1239fcf5ef2aSThomas Huth 1240fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1241fcf5ef2aSThomas Huth { 1242fcf5ef2aSThomas Huth int i; 1243fcf5ef2aSThomas Huth 124405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 124505ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status); 1246fcf5ef2aSThomas Huth } 1247fcf5ef2aSThomas Huth } 1248fcf5ef2aSThomas Huth 1249fcf5ef2aSThomas Huth #define VRFI(suffix, rounding) \ 1250fcf5ef2aSThomas Huth void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1251fcf5ef2aSThomas Huth ppc_avr_t *b) \ 1252fcf5ef2aSThomas Huth { \ 1253fcf5ef2aSThomas Huth int i; \ 1254fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 1255fcf5ef2aSThomas Huth \ 1256fcf5ef2aSThomas Huth set_float_rounding_mode(rounding, &s); \ 125705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 125805ee3e8aSMark Cave-Ayland r->f32[i] = float32_round_to_int (b->f32[i], &s); \ 1259fcf5ef2aSThomas Huth } \ 1260fcf5ef2aSThomas Huth } 1261fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even) 1262fcf5ef2aSThomas Huth VRFI(m, float_round_down) 1263fcf5ef2aSThomas Huth VRFI(p, float_round_up) 1264fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero) 1265fcf5ef2aSThomas Huth #undef VRFI 1266fcf5ef2aSThomas Huth 1267fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1268fcf5ef2aSThomas Huth { 1269fcf5ef2aSThomas Huth int i; 1270fcf5ef2aSThomas Huth 127105ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 127205ee3e8aSMark Cave-Ayland float32 t = float32_sqrt(b->f32[i], &env->vec_status); 1273fcf5ef2aSThomas Huth 127405ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, t, &env->vec_status); 1275fcf5ef2aSThomas Huth } 1276fcf5ef2aSThomas Huth } 1277fcf5ef2aSThomas Huth 1278fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert) \ 1279fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1280fcf5ef2aSThomas Huth { \ 1281fcf5ef2aSThomas Huth int i; \ 1282fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1283fcf5ef2aSThomas Huth uint##size##_t src1 = a->element[i]; \ 1284fcf5ef2aSThomas Huth uint##size##_t src2 = b->element[i]; \ 1285fcf5ef2aSThomas Huth uint##size##_t src3 = r->element[i]; \ 1286fcf5ef2aSThomas Huth uint##size##_t begin, end, shift, mask, rot_val; \ 1287fcf5ef2aSThomas Huth \ 1288fcf5ef2aSThomas Huth shift = extract##size(src2, 0, 6); \ 1289fcf5ef2aSThomas Huth end = extract##size(src2, 8, 6); \ 1290fcf5ef2aSThomas Huth begin = extract##size(src2, 16, 6); \ 1291fcf5ef2aSThomas Huth rot_val = rol##size(src1, shift); \ 1292fcf5ef2aSThomas Huth mask = mask_u##size(begin, end); \ 1293fcf5ef2aSThomas Huth if (insert) { \ 1294fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask) | (src3 & ~mask); \ 1295fcf5ef2aSThomas Huth } else { \ 1296fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask); \ 1297fcf5ef2aSThomas Huth } \ 1298fcf5ef2aSThomas Huth } \ 1299fcf5ef2aSThomas Huth } 1300fcf5ef2aSThomas Huth 1301fcf5ef2aSThomas Huth VRLMI(vrldmi, 64, u64, 1); 1302fcf5ef2aSThomas Huth VRLMI(vrlwmi, 32, u32, 1); 1303fcf5ef2aSThomas Huth VRLMI(vrldnm, 64, u64, 0); 1304fcf5ef2aSThomas Huth VRLMI(vrlwnm, 32, u32, 0); 1305fcf5ef2aSThomas Huth 1306fcf5ef2aSThomas Huth void helper_vsel(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1307fcf5ef2aSThomas Huth ppc_avr_t *c) 1308fcf5ef2aSThomas Huth { 1309fcf5ef2aSThomas Huth r->u64[0] = (a->u64[0] & ~c->u64[0]) | (b->u64[0] & c->u64[0]); 1310fcf5ef2aSThomas Huth r->u64[1] = (a->u64[1] & ~c->u64[1]) | (b->u64[1] & c->u64[1]); 1311fcf5ef2aSThomas Huth } 1312fcf5ef2aSThomas Huth 1313fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1314fcf5ef2aSThomas Huth { 1315fcf5ef2aSThomas Huth int i; 1316fcf5ef2aSThomas Huth 131705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 131805ee3e8aSMark Cave-Ayland r->f32[i] = float32_exp2(b->f32[i], &env->vec_status); 1319fcf5ef2aSThomas Huth } 1320fcf5ef2aSThomas Huth } 1321fcf5ef2aSThomas Huth 1322fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1323fcf5ef2aSThomas Huth { 1324fcf5ef2aSThomas Huth int i; 1325fcf5ef2aSThomas Huth 132605ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 132705ee3e8aSMark Cave-Ayland r->f32[i] = float32_log2(b->f32[i], &env->vec_status); 1328fcf5ef2aSThomas Huth } 1329fcf5ef2aSThomas Huth } 1330fcf5ef2aSThomas Huth 133160caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 133260caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 133360caf221SAvinesh Kumar { \ 1334f297c4c6SMatheus Ferst int index = (a & 0xf) * 8; \ 133560caf221SAvinesh Kumar if (left) { \ 1336f297c4c6SMatheus Ferst index = 128 - index - size; \ 133760caf221SAvinesh Kumar } \ 133860caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 133960caf221SAvinesh Kumar MAKE_64BIT_MASK(0, size); \ 134060caf221SAvinesh Kumar } 134160caf221SAvinesh Kumar VEXTU_X_DO(vextublx, 8, 1) 134260caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1) 134360caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1) 134460caf221SAvinesh Kumar VEXTU_X_DO(vextubrx, 8, 0) 134560caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0) 134660caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0) 134760caf221SAvinesh Kumar #undef VEXTU_X_DO 134860caf221SAvinesh Kumar 1349fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1350fcf5ef2aSThomas Huth { 1351fcf5ef2aSThomas Huth int i; 1352fcf5ef2aSThomas Huth unsigned int shift, bytes, size; 1353fcf5ef2aSThomas Huth 1354fcf5ef2aSThomas Huth size = ARRAY_SIZE(r->u8); 1355fcf5ef2aSThomas Huth for (i = 0; i < size; i++) { 135663be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 135763be02fcSAnton Blanchard bytes = (a->VsrB(i) << 8) + /* extract adjacent bytes */ 135863be02fcSAnton Blanchard (((i + 1) < size) ? a->VsrB(i + 1) : 0); 135963be02fcSAnton Blanchard r->VsrB(i) = (bytes << shift) >> 8; /* shift and store result */ 1360fcf5ef2aSThomas Huth } 1361fcf5ef2aSThomas Huth } 1362fcf5ef2aSThomas Huth 1363fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1364fcf5ef2aSThomas Huth { 1365fcf5ef2aSThomas Huth int i; 1366fcf5ef2aSThomas Huth unsigned int shift, bytes; 1367fcf5ef2aSThomas Huth 1368b6cb41b2SDavid Gibson /* 1369b6cb41b2SDavid Gibson * Use reverse order, as destination and source register can be 1370b6cb41b2SDavid Gibson * same. Its being modified in place saving temporary, reverse 1371b6cb41b2SDavid Gibson * order will guarantee that computed result is not fed back. 1372fcf5ef2aSThomas Huth */ 1373fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 137463be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 137563be02fcSAnton Blanchard bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i); 1376fcf5ef2aSThomas Huth /* extract adjacent bytes */ 137763be02fcSAnton Blanchard r->VsrB(i) = (bytes >> shift) & 0xFF; /* shift and store result */ 1378fcf5ef2aSThomas Huth } 1379fcf5ef2aSThomas Huth } 1380fcf5ef2aSThomas Huth 1381fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift) 1382fcf5ef2aSThomas Huth { 1383fcf5ef2aSThomas Huth int sh = shift & 0xf; 1384fcf5ef2aSThomas Huth int i; 1385fcf5ef2aSThomas Huth ppc_avr_t result; 1386fcf5ef2aSThomas Huth 1387fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1388fcf5ef2aSThomas Huth int index = sh + i; 1389fcf5ef2aSThomas Huth if (index > 0xf) { 139060594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index - 0x10); 1391fcf5ef2aSThomas Huth } else { 139260594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1393fcf5ef2aSThomas Huth } 1394fcf5ef2aSThomas Huth } 1395fcf5ef2aSThomas Huth *r = result; 1396fcf5ef2aSThomas Huth } 1397fcf5ef2aSThomas Huth 1398fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1399fcf5ef2aSThomas Huth { 14003c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1401fcf5ef2aSThomas Huth 1402fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1403fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1404fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1405fcf5ef2aSThomas Huth #else 1406fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1407fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1408fcf5ef2aSThomas Huth #endif 1409fcf5ef2aSThomas Huth } 1410fcf5ef2aSThomas Huth 1411fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 14122cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[IDX]) 14132cc12af3SMatheus Ferst #else 14142cc12af3SMatheus Ferst #define ELEM_ADDR(VEC, IDX, SIZE) (&(VEC)->u8[15 - (IDX)] - (SIZE) + 1) 14152cc12af3SMatheus Ferst #endif 14162cc12af3SMatheus Ferst 14172cc12af3SMatheus Ferst #define VINSX(SUFFIX, TYPE) \ 14182cc12af3SMatheus Ferst void glue(glue(helper_VINS, SUFFIX), LX)(CPUPPCState *env, ppc_avr_t *t, \ 14192cc12af3SMatheus Ferst uint64_t val, target_ulong index) \ 14202cc12af3SMatheus Ferst { \ 14212cc12af3SMatheus Ferst const int maxidx = ARRAY_SIZE(t->u8) - sizeof(TYPE); \ 14222cc12af3SMatheus Ferst target_long idx = index; \ 14232cc12af3SMatheus Ferst \ 14242cc12af3SMatheus Ferst if (idx < 0 || idx > maxidx) { \ 14252cc12af3SMatheus Ferst idx = idx < 0 ? sizeof(TYPE) - idx : idx; \ 14262cc12af3SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, \ 14272cc12af3SMatheus Ferst "Invalid index for Vector Insert Element after 0x" TARGET_FMT_lx \ 14282cc12af3SMatheus Ferst ", RA = " TARGET_FMT_ld " > %d\n", env->nip, idx, maxidx); \ 14292cc12af3SMatheus Ferst } else { \ 14302cc12af3SMatheus Ferst TYPE src = val; \ 14312cc12af3SMatheus Ferst memcpy(ELEM_ADDR(t, idx, sizeof(TYPE)), &src, sizeof(TYPE)); \ 14322cc12af3SMatheus Ferst } \ 14332cc12af3SMatheus Ferst } 14342cc12af3SMatheus Ferst VINSX(B, uint8_t) 14352cc12af3SMatheus Ferst VINSX(H, uint16_t) 14362cc12af3SMatheus Ferst VINSX(W, uint32_t) 14372cc12af3SMatheus Ferst VINSX(D, uint64_t) 14382cc12af3SMatheus Ferst #undef ELEM_ADDR 14392cc12af3SMatheus Ferst #undef VINSX 1440fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 144128110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \ 144228110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 144328110b72SMatheus Ferst target_ulong index) \ 144428110b72SMatheus Ferst { \ 144528110b72SMatheus Ferst const target_long idx = index; \ 144628110b72SMatheus Ferst ppc_avr_t tmp[2] = { *a, *b }; \ 144728110b72SMatheus Ferst memset(t, 0, sizeof(*t)); \ 144828110b72SMatheus Ferst if (idx >= 0 && idx + SIZE <= sizeof(tmp)) { \ 144928110b72SMatheus Ferst memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2 - SIZE], (void *)tmp + idx, SIZE); \ 145028110b72SMatheus Ferst } else { \ 145128110b72SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x" \ 145228110b72SMatheus Ferst TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n", \ 145328110b72SMatheus Ferst env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE); \ 145428110b72SMatheus Ferst } \ 145528110b72SMatheus Ferst } 145628110b72SMatheus Ferst #else 145728110b72SMatheus Ferst #define VEXTDVLX(NAME, SIZE) \ 145828110b72SMatheus Ferst void helper_##NAME(CPUPPCState *env, ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 145928110b72SMatheus Ferst target_ulong index) \ 146028110b72SMatheus Ferst { \ 146128110b72SMatheus Ferst const target_long idx = index; \ 146228110b72SMatheus Ferst ppc_avr_t tmp[2] = { *b, *a }; \ 146328110b72SMatheus Ferst memset(t, 0, sizeof(*t)); \ 146428110b72SMatheus Ferst if (idx >= 0 && idx + SIZE <= sizeof(tmp)) { \ 146528110b72SMatheus Ferst memcpy(&t->u8[ARRAY_SIZE(t->u8) / 2], \ 146628110b72SMatheus Ferst (void *)tmp + sizeof(tmp) - SIZE - idx, SIZE); \ 146728110b72SMatheus Ferst } else { \ 146828110b72SMatheus Ferst qemu_log_mask(LOG_GUEST_ERROR, "Invalid index for " #NAME " after 0x" \ 146928110b72SMatheus Ferst TARGET_FMT_lx ", RC = " TARGET_FMT_ld " > %d\n", \ 147028110b72SMatheus Ferst env->nip, idx < 0 ? SIZE - idx : idx, 32 - SIZE); \ 147128110b72SMatheus Ferst } \ 147228110b72SMatheus Ferst } 147328110b72SMatheus Ferst #endif 147428110b72SMatheus Ferst VEXTDVLX(VEXTDUBVLX, 1) 147528110b72SMatheus Ferst VEXTDVLX(VEXTDUHVLX, 2) 147628110b72SMatheus Ferst VEXTDVLX(VEXTDUWVLX, 4) 147728110b72SMatheus Ferst VEXTDVLX(VEXTDDVLX, 8) 147828110b72SMatheus Ferst #undef VEXTDVLX 147928110b72SMatheus Ferst #if defined(HOST_WORDS_BIGENDIAN) 1480fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1481fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1482fcf5ef2aSThomas Huth { \ 1483fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1484fcf5ef2aSThomas Huth memmove(&r->u8[8 - es], &b->u8[index], es); \ 1485fcf5ef2aSThomas Huth memset(&r->u8[8], 0, 8); \ 1486fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8 - es); \ 1487fcf5ef2aSThomas Huth } 1488fcf5ef2aSThomas Huth #else 1489fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1490fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1491fcf5ef2aSThomas Huth { \ 1492fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1493fcf5ef2aSThomas Huth uint32_t s = (16 - index) - es; \ 1494fcf5ef2aSThomas Huth memmove(&r->u8[8], &b->u8[s], es); \ 1495fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8); \ 1496fcf5ef2aSThomas Huth memset(&r->u8[8 + es], 0, 8 - es); \ 1497fcf5ef2aSThomas Huth } 1498fcf5ef2aSThomas Huth #endif 1499fcf5ef2aSThomas Huth VEXTRACT(ub, u8) 1500fcf5ef2aSThomas Huth VEXTRACT(uh, u16) 1501fcf5ef2aSThomas Huth VEXTRACT(uw, u32) 1502fcf5ef2aSThomas Huth VEXTRACT(d, u64) 1503fcf5ef2aSThomas Huth #undef VEXTRACT 1504fcf5ef2aSThomas Huth 1505*fb5303ccSMatheus Ferst #define VSTRI(NAME, ELEM, NUM_ELEMS, LEFT) \ 1506*fb5303ccSMatheus Ferst uint32_t helper_##NAME(ppc_avr_t *t, ppc_avr_t *b) \ 1507*fb5303ccSMatheus Ferst { \ 1508*fb5303ccSMatheus Ferst int i, idx, crf = 0; \ 1509*fb5303ccSMatheus Ferst \ 1510*fb5303ccSMatheus Ferst for (i = 0; i < NUM_ELEMS; i++) { \ 1511*fb5303ccSMatheus Ferst idx = LEFT ? i : NUM_ELEMS - i - 1; \ 1512*fb5303ccSMatheus Ferst if (b->Vsr##ELEM(idx)) { \ 1513*fb5303ccSMatheus Ferst t->Vsr##ELEM(idx) = b->Vsr##ELEM(idx); \ 1514*fb5303ccSMatheus Ferst } else { \ 1515*fb5303ccSMatheus Ferst crf = 0b0010; \ 1516*fb5303ccSMatheus Ferst break; \ 1517*fb5303ccSMatheus Ferst } \ 1518*fb5303ccSMatheus Ferst } \ 1519*fb5303ccSMatheus Ferst \ 1520*fb5303ccSMatheus Ferst for (; i < NUM_ELEMS; i++) { \ 1521*fb5303ccSMatheus Ferst idx = LEFT ? i : NUM_ELEMS - i - 1; \ 1522*fb5303ccSMatheus Ferst t->Vsr##ELEM(idx) = 0; \ 1523*fb5303ccSMatheus Ferst } \ 1524*fb5303ccSMatheus Ferst \ 1525*fb5303ccSMatheus Ferst return crf; \ 1526*fb5303ccSMatheus Ferst } 1527*fb5303ccSMatheus Ferst VSTRI(VSTRIBL, B, 16, true) 1528*fb5303ccSMatheus Ferst VSTRI(VSTRIBR, B, 16, false) 1529*fb5303ccSMatheus Ferst VSTRI(VSTRIHL, H, 8, true) 1530*fb5303ccSMatheus Ferst VSTRI(VSTRIHR, H, 8, false) 1531*fb5303ccSMatheus Ferst #undef VSTRI 1532*fb5303ccSMatheus Ferst 15335ba5335dSMark Cave-Ayland void helper_xxextractuw(CPUPPCState *env, ppc_vsr_t *xt, 15345ba5335dSMark Cave-Ayland ppc_vsr_t *xb, uint32_t index) 15358ad901e5SNikunj A Dadhania { 153603b32c09SMark Cave-Ayland ppc_vsr_t t = { }; 15378ad901e5SNikunj A Dadhania size_t es = sizeof(uint32_t); 15388ad901e5SNikunj A Dadhania uint32_t ext_index; 15398ad901e5SNikunj A Dadhania int i; 15408ad901e5SNikunj A Dadhania 15418ad901e5SNikunj A Dadhania ext_index = index; 15428ad901e5SNikunj A Dadhania for (i = 0; i < es; i++, ext_index++) { 154303b32c09SMark Cave-Ayland t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16); 15448ad901e5SNikunj A Dadhania } 15458ad901e5SNikunj A Dadhania 154603b32c09SMark Cave-Ayland *xt = t; 15478ad901e5SNikunj A Dadhania } 15488ad901e5SNikunj A Dadhania 15495ba5335dSMark Cave-Ayland void helper_xxinsertw(CPUPPCState *env, ppc_vsr_t *xt, 15505ba5335dSMark Cave-Ayland ppc_vsr_t *xb, uint32_t index) 15513398b742SNikunj A Dadhania { 155203b32c09SMark Cave-Ayland ppc_vsr_t t = *xt; 15533398b742SNikunj A Dadhania size_t es = sizeof(uint32_t); 15543398b742SNikunj A Dadhania int ins_index, i = 0; 15553398b742SNikunj A Dadhania 15563398b742SNikunj A Dadhania ins_index = index; 15573398b742SNikunj A Dadhania for (i = 0; i < es && ins_index < 16; i++, ins_index++) { 155803b32c09SMark Cave-Ayland t.VsrB(ins_index) = xb->VsrB(8 - es + i); 15593398b742SNikunj A Dadhania } 15603398b742SNikunj A Dadhania 156103b32c09SMark Cave-Ayland *xt = t; 15623398b742SNikunj A Dadhania } 15633398b742SNikunj A Dadhania 1564788c6399SMatheus Ferst #define XXBLEND(name, sz) \ 1565788c6399SMatheus Ferst void glue(helper_XXBLENDV, name)(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, \ 1566788c6399SMatheus Ferst ppc_avr_t *c, uint32_t desc) \ 1567788c6399SMatheus Ferst { \ 1568788c6399SMatheus Ferst for (int i = 0; i < ARRAY_SIZE(t->glue(u, sz)); i++) { \ 1569788c6399SMatheus Ferst t->glue(u, sz)[i] = (c->glue(s, sz)[i] >> (sz - 1)) ? \ 1570788c6399SMatheus Ferst b->glue(u, sz)[i] : a->glue(u, sz)[i]; \ 1571788c6399SMatheus Ferst } \ 1572788c6399SMatheus Ferst } 1573788c6399SMatheus Ferst XXBLEND(B, 8) 1574788c6399SMatheus Ferst XXBLEND(H, 16) 1575788c6399SMatheus Ferst XXBLEND(W, 32) 1576788c6399SMatheus Ferst XXBLEND(D, 64) 1577788c6399SMatheus Ferst #undef XXBLEND 1578788c6399SMatheus Ferst 1579fcf5ef2aSThomas Huth #define VNEG(name, element) \ 1580fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 1581fcf5ef2aSThomas Huth { \ 1582fcf5ef2aSThomas Huth int i; \ 158360594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1584fcf5ef2aSThomas Huth r->element[i] = -b->element[i]; \ 1585fcf5ef2aSThomas Huth } \ 1586fcf5ef2aSThomas Huth } 1587fcf5ef2aSThomas Huth VNEG(vnegw, s32) 1588fcf5ef2aSThomas Huth VNEG(vnegd, s64) 1589fcf5ef2aSThomas Huth #undef VNEG 1590fcf5ef2aSThomas Huth 1591fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1592fcf5ef2aSThomas Huth { 15933c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1594fcf5ef2aSThomas Huth 1595fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1596fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1597fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1598fcf5ef2aSThomas Huth #else 1599fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1600fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1601fcf5ef2aSThomas Huth #endif 1602fcf5ef2aSThomas Huth } 1603fcf5ef2aSThomas Huth 1604fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1605fcf5ef2aSThomas Huth { 1606fcf5ef2aSThomas Huth int i; 1607fcf5ef2aSThomas Huth 1608fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 1609fcf5ef2aSThomas Huth r->u32[i] = a->u32[i] >= b->u32[i]; 1610fcf5ef2aSThomas Huth } 1611fcf5ef2aSThomas Huth } 1612fcf5ef2aSThomas Huth 1613fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1614fcf5ef2aSThomas Huth { 1615fcf5ef2aSThomas Huth int64_t t; 1616fcf5ef2aSThomas Huth int i, upper; 1617fcf5ef2aSThomas Huth ppc_avr_t result; 1618fcf5ef2aSThomas Huth int sat = 0; 1619fcf5ef2aSThomas Huth 1620fcf5ef2aSThomas Huth upper = ARRAY_SIZE(r->s32) - 1; 162160594feaSMark Cave-Ayland t = (int64_t)b->VsrSW(upper); 1622fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 162360594feaSMark Cave-Ayland t += a->VsrSW(i); 162460594feaSMark Cave-Ayland result.VsrSW(i) = 0; 1625fcf5ef2aSThomas Huth } 162660594feaSMark Cave-Ayland result.VsrSW(upper) = cvtsdsw(t, &sat); 1627fcf5ef2aSThomas Huth *r = result; 1628fcf5ef2aSThomas Huth 1629fcf5ef2aSThomas Huth if (sat) { 16306175f5a0SRichard Henderson set_vscr_sat(env); 1631fcf5ef2aSThomas Huth } 1632fcf5ef2aSThomas Huth } 1633fcf5ef2aSThomas Huth 1634fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1635fcf5ef2aSThomas Huth { 1636fcf5ef2aSThomas Huth int i, j, upper; 1637fcf5ef2aSThomas Huth ppc_avr_t result; 1638fcf5ef2aSThomas Huth int sat = 0; 1639fcf5ef2aSThomas Huth 1640fcf5ef2aSThomas Huth upper = 1; 1641fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 164260594feaSMark Cave-Ayland int64_t t = (int64_t)b->VsrSW(upper + i * 2); 1643fcf5ef2aSThomas Huth 16447fa0ddc1SAnton Blanchard result.VsrD(i) = 0; 1645fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u64); j++) { 164660594feaSMark Cave-Ayland t += a->VsrSW(2 * i + j); 1647fcf5ef2aSThomas Huth } 164860594feaSMark Cave-Ayland result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat); 1649fcf5ef2aSThomas Huth } 1650fcf5ef2aSThomas Huth 1651fcf5ef2aSThomas Huth *r = result; 1652fcf5ef2aSThomas Huth if (sat) { 16536175f5a0SRichard Henderson set_vscr_sat(env); 1654fcf5ef2aSThomas Huth } 1655fcf5ef2aSThomas Huth } 1656fcf5ef2aSThomas Huth 1657fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1658fcf5ef2aSThomas Huth { 1659fcf5ef2aSThomas Huth int i, j; 1660fcf5ef2aSThomas Huth int sat = 0; 1661fcf5ef2aSThomas Huth 1662fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1663fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1664fcf5ef2aSThomas Huth 1665fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->s32); j++) { 1666fcf5ef2aSThomas Huth t += a->s8[4 * i + j]; 1667fcf5ef2aSThomas Huth } 1668fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1669fcf5ef2aSThomas Huth } 1670fcf5ef2aSThomas Huth 1671fcf5ef2aSThomas Huth if (sat) { 16726175f5a0SRichard Henderson set_vscr_sat(env); 1673fcf5ef2aSThomas Huth } 1674fcf5ef2aSThomas Huth } 1675fcf5ef2aSThomas Huth 1676fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1677fcf5ef2aSThomas Huth { 1678fcf5ef2aSThomas Huth int sat = 0; 1679fcf5ef2aSThomas Huth int i; 1680fcf5ef2aSThomas Huth 1681fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1682fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1683fcf5ef2aSThomas Huth 1684fcf5ef2aSThomas Huth t += a->s16[2 * i] + a->s16[2 * i + 1]; 1685fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1686fcf5ef2aSThomas Huth } 1687fcf5ef2aSThomas Huth 1688fcf5ef2aSThomas Huth if (sat) { 16896175f5a0SRichard Henderson set_vscr_sat(env); 1690fcf5ef2aSThomas Huth } 1691fcf5ef2aSThomas Huth } 1692fcf5ef2aSThomas Huth 1693fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1694fcf5ef2aSThomas Huth { 1695fcf5ef2aSThomas Huth int i, j; 1696fcf5ef2aSThomas Huth int sat = 0; 1697fcf5ef2aSThomas Huth 1698fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 1699fcf5ef2aSThomas Huth uint64_t t = (uint64_t)b->u32[i]; 1700fcf5ef2aSThomas Huth 1701fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u32); j++) { 1702fcf5ef2aSThomas Huth t += a->u8[4 * i + j]; 1703fcf5ef2aSThomas Huth } 1704fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1705fcf5ef2aSThomas Huth } 1706fcf5ef2aSThomas Huth 1707fcf5ef2aSThomas Huth if (sat) { 17086175f5a0SRichard Henderson set_vscr_sat(env); 1709fcf5ef2aSThomas Huth } 1710fcf5ef2aSThomas Huth } 1711fcf5ef2aSThomas Huth 1712fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1713fcf5ef2aSThomas Huth #define UPKHI 1 1714fcf5ef2aSThomas Huth #define UPKLO 0 1715fcf5ef2aSThomas Huth #else 1716fcf5ef2aSThomas Huth #define UPKHI 0 1717fcf5ef2aSThomas Huth #define UPKLO 1 1718fcf5ef2aSThomas Huth #endif 1719fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi) \ 1720fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 1721fcf5ef2aSThomas Huth { \ 1722fcf5ef2aSThomas Huth int i; \ 1723fcf5ef2aSThomas Huth ppc_avr_t result; \ 1724fcf5ef2aSThomas Huth \ 1725fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { \ 1726fcf5ef2aSThomas Huth uint16_t e = b->u16[hi ? i : i + 4]; \ 1727fcf5ef2aSThomas Huth uint8_t a = (e >> 15) ? 0xff : 0; \ 1728fcf5ef2aSThomas Huth uint8_t r = (e >> 10) & 0x1f; \ 1729fcf5ef2aSThomas Huth uint8_t g = (e >> 5) & 0x1f; \ 1730fcf5ef2aSThomas Huth uint8_t b = e & 0x1f; \ 1731fcf5ef2aSThomas Huth \ 1732fcf5ef2aSThomas Huth result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b; \ 1733fcf5ef2aSThomas Huth } \ 1734fcf5ef2aSThomas Huth *r = result; \ 1735fcf5ef2aSThomas Huth } 1736fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO) 1737fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI) 1738fcf5ef2aSThomas Huth #undef VUPKPX 1739fcf5ef2aSThomas Huth 1740fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi) \ 1741fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 1742fcf5ef2aSThomas Huth { \ 1743fcf5ef2aSThomas Huth int i; \ 1744fcf5ef2aSThomas Huth ppc_avr_t result; \ 1745fcf5ef2aSThomas Huth \ 1746fcf5ef2aSThomas Huth if (hi) { \ 1747fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) { \ 1748fcf5ef2aSThomas Huth result.unpacked[i] = b->packee[i]; \ 1749fcf5ef2aSThomas Huth } \ 1750fcf5ef2aSThomas Huth } else { \ 1751fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \ 1752fcf5ef2aSThomas Huth i++) { \ 1753fcf5ef2aSThomas Huth result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \ 1754fcf5ef2aSThomas Huth } \ 1755fcf5ef2aSThomas Huth } \ 1756fcf5ef2aSThomas Huth *r = result; \ 1757fcf5ef2aSThomas Huth } 1758fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI) 1759fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI) 1760fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI) 1761fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO) 1762fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO) 1763fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO) 1764fcf5ef2aSThomas Huth #undef VUPK 1765fcf5ef2aSThomas Huth #undef UPKHI 1766fcf5ef2aSThomas Huth #undef UPKLO 1767fcf5ef2aSThomas Huth 1768fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element) \ 1769fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *b) \ 1770fcf5ef2aSThomas Huth { \ 1771fcf5ef2aSThomas Huth int i; \ 1772fcf5ef2aSThomas Huth \ 177360594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1774fcf5ef2aSThomas Huth r->element[i] = name(b->element[i]); \ 1775fcf5ef2aSThomas Huth } \ 1776fcf5ef2aSThomas Huth } 1777fcf5ef2aSThomas Huth 1778fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8) 1779fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16) 1780fcf5ef2aSThomas Huth 1781fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8) 1782fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16) 1783fcf5ef2aSThomas Huth 1784fcf5ef2aSThomas Huth #undef clzb 1785fcf5ef2aSThomas Huth #undef clzh 1786fcf5ef2aSThomas Huth 1787fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8) 1788fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16) 1789fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v)) 1790fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v)) 1791fcf5ef2aSThomas Huth 1792fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8) 1793fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16) 1794fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32) 1795fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64) 1796fcf5ef2aSThomas Huth 1797fcf5ef2aSThomas Huth #undef ctzb 1798fcf5ef2aSThomas Huth #undef ctzh 1799fcf5ef2aSThomas Huth #undef ctzw 1800fcf5ef2aSThomas Huth #undef ctzd 1801fcf5ef2aSThomas Huth 1802fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v) 1803fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v) 1804fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v) 1805fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v) 1806fcf5ef2aSThomas Huth 1807fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8) 1808fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16) 1809fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32) 1810fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64) 1811fcf5ef2aSThomas Huth 1812fcf5ef2aSThomas Huth #undef popcntb 1813fcf5ef2aSThomas Huth #undef popcnth 1814fcf5ef2aSThomas Huth #undef popcntw 1815fcf5ef2aSThomas Huth #undef popcntd 1816fcf5ef2aSThomas Huth 1817fcf5ef2aSThomas Huth #undef VGENERIC_DO 1818fcf5ef2aSThomas Huth 1819fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1820fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 0, 1 } } 1821fcf5ef2aSThomas Huth #else 1822fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 1, 0 } } 1823fcf5ef2aSThomas Huth #endif 1824fcf5ef2aSThomas Huth 1825fcf5ef2aSThomas Huth #ifndef CONFIG_INT128 1826fcf5ef2aSThomas Huth 1827fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a) 1828fcf5ef2aSThomas Huth { 1829fcf5ef2aSThomas Huth t->u64[0] = ~a.u64[0]; 1830fcf5ef2aSThomas Huth t->u64[1] = ~a.u64[1]; 1831fcf5ef2aSThomas Huth } 1832fcf5ef2aSThomas Huth 1833fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b) 1834fcf5ef2aSThomas Huth { 18353c385a93SMark Cave-Ayland if (a.VsrD(0) < b.VsrD(0)) { 1836fcf5ef2aSThomas Huth return -1; 18373c385a93SMark Cave-Ayland } else if (a.VsrD(0) > b.VsrD(0)) { 1838fcf5ef2aSThomas Huth return 1; 18393c385a93SMark Cave-Ayland } else if (a.VsrD(1) < b.VsrD(1)) { 1840fcf5ef2aSThomas Huth return -1; 18413c385a93SMark Cave-Ayland } else if (a.VsrD(1) > b.VsrD(1)) { 1842fcf5ef2aSThomas Huth return 1; 1843fcf5ef2aSThomas Huth } else { 1844fcf5ef2aSThomas Huth return 0; 1845fcf5ef2aSThomas Huth } 1846fcf5ef2aSThomas Huth } 1847fcf5ef2aSThomas Huth 1848fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 1849fcf5ef2aSThomas Huth { 18503c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 18513c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 18523c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 1853fcf5ef2aSThomas Huth } 1854fcf5ef2aSThomas Huth 1855fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 1856fcf5ef2aSThomas Huth { 1857fcf5ef2aSThomas Huth ppc_avr_t not_a; 18583c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 18593c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 18603c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 1861fcf5ef2aSThomas Huth avr_qw_not(¬_a, a); 1862fcf5ef2aSThomas Huth return avr_qw_cmpu(not_a, b) < 0; 1863fcf5ef2aSThomas Huth } 1864fcf5ef2aSThomas Huth 1865fcf5ef2aSThomas Huth #endif 1866fcf5ef2aSThomas Huth 1867fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1868fcf5ef2aSThomas Huth { 1869fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1870fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128; 1871fcf5ef2aSThomas Huth #else 1872fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 1873fcf5ef2aSThomas Huth #endif 1874fcf5ef2aSThomas Huth } 1875fcf5ef2aSThomas Huth 1876fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1877fcf5ef2aSThomas Huth { 1878fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1879fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128 + (c->u128 & 1); 1880fcf5ef2aSThomas Huth #else 1881fcf5ef2aSThomas Huth 18823c385a93SMark Cave-Ayland if (c->VsrD(1) & 1) { 1883fcf5ef2aSThomas Huth ppc_avr_t tmp; 1884fcf5ef2aSThomas Huth 18853c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 18863c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 1887fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 1888fcf5ef2aSThomas Huth avr_qw_add(r, tmp, *b); 1889fcf5ef2aSThomas Huth } else { 1890fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 1891fcf5ef2aSThomas Huth } 1892fcf5ef2aSThomas Huth #endif 1893fcf5ef2aSThomas Huth } 1894fcf5ef2aSThomas Huth 1895fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1896fcf5ef2aSThomas Huth { 1897fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1898fcf5ef2aSThomas Huth r->u128 = (~a->u128 < b->u128); 1899fcf5ef2aSThomas Huth #else 1900fcf5ef2aSThomas Huth ppc_avr_t not_a; 1901fcf5ef2aSThomas Huth 1902fcf5ef2aSThomas Huth avr_qw_not(¬_a, *a); 1903fcf5ef2aSThomas Huth 19043c385a93SMark Cave-Ayland r->VsrD(0) = 0; 19053c385a93SMark Cave-Ayland r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0); 1906fcf5ef2aSThomas Huth #endif 1907fcf5ef2aSThomas Huth } 1908fcf5ef2aSThomas Huth 1909fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1910fcf5ef2aSThomas Huth { 1911fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1912fcf5ef2aSThomas Huth int carry_out = (~a->u128 < b->u128); 1913fcf5ef2aSThomas Huth if (!carry_out && (c->u128 & 1)) { 1914fcf5ef2aSThomas Huth carry_out = ((a->u128 + b->u128 + 1) == 0) && 1915fcf5ef2aSThomas Huth ((a->u128 != 0) || (b->u128 != 0)); 1916fcf5ef2aSThomas Huth } 1917fcf5ef2aSThomas Huth r->u128 = carry_out; 1918fcf5ef2aSThomas Huth #else 1919fcf5ef2aSThomas Huth 19203c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 1921fcf5ef2aSThomas Huth int carry_out = 0; 1922fcf5ef2aSThomas Huth ppc_avr_t tmp; 1923fcf5ef2aSThomas Huth 1924fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, *a, *b); 1925fcf5ef2aSThomas Huth 1926fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 1927fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 1928fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, tmp, one); 1929fcf5ef2aSThomas Huth } 19303c385a93SMark Cave-Ayland r->VsrD(0) = 0; 19313c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 1932fcf5ef2aSThomas Huth #endif 1933fcf5ef2aSThomas Huth } 1934fcf5ef2aSThomas Huth 1935fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1936fcf5ef2aSThomas Huth { 1937fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1938fcf5ef2aSThomas Huth r->u128 = a->u128 - b->u128; 1939fcf5ef2aSThomas Huth #else 1940fcf5ef2aSThomas Huth ppc_avr_t tmp; 1941fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 1942fcf5ef2aSThomas Huth 1943fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 1944fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 1945fcf5ef2aSThomas Huth avr_qw_add(r, tmp, one); 1946fcf5ef2aSThomas Huth #endif 1947fcf5ef2aSThomas Huth } 1948fcf5ef2aSThomas Huth 1949fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1950fcf5ef2aSThomas Huth { 1951fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1952fcf5ef2aSThomas Huth r->u128 = a->u128 + ~b->u128 + (c->u128 & 1); 1953fcf5ef2aSThomas Huth #else 1954fcf5ef2aSThomas Huth ppc_avr_t tmp, sum; 1955fcf5ef2aSThomas Huth 1956fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 1957fcf5ef2aSThomas Huth avr_qw_add(&sum, *a, tmp); 1958fcf5ef2aSThomas Huth 19593c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 19603c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 1961fcf5ef2aSThomas Huth avr_qw_add(r, sum, tmp); 1962fcf5ef2aSThomas Huth #endif 1963fcf5ef2aSThomas Huth } 1964fcf5ef2aSThomas Huth 1965fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1966fcf5ef2aSThomas Huth { 1967fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1968fcf5ef2aSThomas Huth r->u128 = (~a->u128 < ~b->u128) || 1969fcf5ef2aSThomas Huth (a->u128 + ~b->u128 == (__uint128_t)-1); 1970fcf5ef2aSThomas Huth #else 1971fcf5ef2aSThomas Huth int carry = (avr_qw_cmpu(*a, *b) > 0); 1972fcf5ef2aSThomas Huth if (!carry) { 1973fcf5ef2aSThomas Huth ppc_avr_t tmp; 1974fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 1975fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 19763c385a93SMark Cave-Ayland carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull)); 1977fcf5ef2aSThomas Huth } 19783c385a93SMark Cave-Ayland r->VsrD(0) = 0; 19793c385a93SMark Cave-Ayland r->VsrD(1) = carry; 1980fcf5ef2aSThomas Huth #endif 1981fcf5ef2aSThomas Huth } 1982fcf5ef2aSThomas Huth 1983fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1984fcf5ef2aSThomas Huth { 1985fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1986fcf5ef2aSThomas Huth r->u128 = 1987fcf5ef2aSThomas Huth (~a->u128 < ~b->u128) || 1988fcf5ef2aSThomas Huth ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1)); 1989fcf5ef2aSThomas Huth #else 19903c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 1991fcf5ef2aSThomas Huth int carry_out = (avr_qw_cmpu(*a, *b) > 0); 1992fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 1993fcf5ef2aSThomas Huth ppc_avr_t tmp; 1994fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 1995fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 19963c385a93SMark Cave-Ayland carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull)); 1997fcf5ef2aSThomas Huth } 1998fcf5ef2aSThomas Huth 19993c385a93SMark Cave-Ayland r->VsrD(0) = 0; 20003c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2001fcf5ef2aSThomas Huth #endif 2002fcf5ef2aSThomas Huth } 2003fcf5ef2aSThomas Huth 2004fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_1 0xC 2005fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_2 0xF 2006fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_1 0xA 2007fcf5ef2aSThomas Huth #define BCD_NEG_PREF 0xD 2008fcf5ef2aSThomas Huth #define BCD_NEG_ALT 0xB 2009fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_2 0xE 2010fcf5ef2aSThomas Huth #define NATIONAL_PLUS 0x2B 2011fcf5ef2aSThomas Huth #define NATIONAL_NEG 0x2D 2012fcf5ef2aSThomas Huth 2013365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) (15 - ((n) / 2)) 2014fcf5ef2aSThomas Huth 2015fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd) 2016fcf5ef2aSThomas Huth { 2017428115c3SMark Cave-Ayland switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) { 2018fcf5ef2aSThomas Huth case BCD_PLUS_PREF_1: 2019fcf5ef2aSThomas Huth case BCD_PLUS_PREF_2: 2020fcf5ef2aSThomas Huth case BCD_PLUS_ALT_1: 2021fcf5ef2aSThomas Huth case BCD_PLUS_ALT_2: 2022fcf5ef2aSThomas Huth { 2023fcf5ef2aSThomas Huth return 1; 2024fcf5ef2aSThomas Huth } 2025fcf5ef2aSThomas Huth 2026fcf5ef2aSThomas Huth case BCD_NEG_PREF: 2027fcf5ef2aSThomas Huth case BCD_NEG_ALT: 2028fcf5ef2aSThomas Huth { 2029fcf5ef2aSThomas Huth return -1; 2030fcf5ef2aSThomas Huth } 2031fcf5ef2aSThomas Huth 2032fcf5ef2aSThomas Huth default: 2033fcf5ef2aSThomas Huth { 2034fcf5ef2aSThomas Huth return 0; 2035fcf5ef2aSThomas Huth } 2036fcf5ef2aSThomas Huth } 2037fcf5ef2aSThomas Huth } 2038fcf5ef2aSThomas Huth 2039fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps) 2040fcf5ef2aSThomas Huth { 2041fcf5ef2aSThomas Huth if (sgn >= 0) { 2042fcf5ef2aSThomas Huth return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2; 2043fcf5ef2aSThomas Huth } else { 2044fcf5ef2aSThomas Huth return BCD_NEG_PREF; 2045fcf5ef2aSThomas Huth } 2046fcf5ef2aSThomas Huth } 2047fcf5ef2aSThomas Huth 2048fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid) 2049fcf5ef2aSThomas Huth { 2050fcf5ef2aSThomas Huth uint8_t result; 2051fcf5ef2aSThomas Huth if (n & 1) { 2052428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4; 2053fcf5ef2aSThomas Huth } else { 2054428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF; 2055fcf5ef2aSThomas Huth } 2056fcf5ef2aSThomas Huth 2057fcf5ef2aSThomas Huth if (unlikely(result > 9)) { 2058fcf5ef2aSThomas Huth *invalid = true; 2059fcf5ef2aSThomas Huth } 2060fcf5ef2aSThomas Huth return result; 2061fcf5ef2aSThomas Huth } 2062fcf5ef2aSThomas Huth 2063fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n) 2064fcf5ef2aSThomas Huth { 2065fcf5ef2aSThomas Huth if (n & 1) { 2066428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F; 2067428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4); 2068fcf5ef2aSThomas Huth } else { 2069428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0; 2070428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= digit; 2071fcf5ef2aSThomas Huth } 2072fcf5ef2aSThomas Huth } 2073fcf5ef2aSThomas Huth 2074071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd) 2075071663dfSJose Ricardo Ziviani { 2076071663dfSJose Ricardo Ziviani int i; 2077071663dfSJose Ricardo Ziviani int invalid = 0; 2078071663dfSJose Ricardo Ziviani 2079071663dfSJose Ricardo Ziviani if (bcd_get_sgn(bcd) == 0) { 2080071663dfSJose Ricardo Ziviani return false; 2081071663dfSJose Ricardo Ziviani } 2082071663dfSJose Ricardo Ziviani 2083071663dfSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2084071663dfSJose Ricardo Ziviani bcd_get_digit(bcd, i, &invalid); 2085071663dfSJose Ricardo Ziviani if (unlikely(invalid)) { 2086071663dfSJose Ricardo Ziviani return false; 2087071663dfSJose Ricardo Ziviani } 2088071663dfSJose Ricardo Ziviani } 2089071663dfSJose Ricardo Ziviani return true; 2090071663dfSJose Ricardo Ziviani } 2091071663dfSJose Ricardo Ziviani 2092fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd) 2093fcf5ef2aSThomas Huth { 20943c385a93SMark Cave-Ayland if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) { 2095efa73196SNikunj A Dadhania return CRF_EQ; 2096fcf5ef2aSThomas Huth } else { 2097efa73196SNikunj A Dadhania return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT; 2098fcf5ef2aSThomas Huth } 2099fcf5ef2aSThomas Huth } 2100fcf5ef2aSThomas Huth 2101fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n) 2102fcf5ef2aSThomas Huth { 210360594feaSMark Cave-Ayland return reg->VsrH(7 - n); 2104fcf5ef2aSThomas Huth } 2105fcf5ef2aSThomas Huth 2106fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n) 2107fcf5ef2aSThomas Huth { 210860594feaSMark Cave-Ayland reg->VsrH(7 - n) = val; 2109fcf5ef2aSThomas Huth } 2110fcf5ef2aSThomas Huth 2111fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b) 2112fcf5ef2aSThomas Huth { 2113fcf5ef2aSThomas Huth int i; 2114fcf5ef2aSThomas Huth int invalid = 0; 2115fcf5ef2aSThomas Huth for (i = 31; i > 0; i--) { 2116fcf5ef2aSThomas Huth uint8_t dig_a = bcd_get_digit(a, i, &invalid); 2117fcf5ef2aSThomas Huth uint8_t dig_b = bcd_get_digit(b, i, &invalid); 2118fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2119fcf5ef2aSThomas Huth return 0; /* doesn't matter */ 2120fcf5ef2aSThomas Huth } else if (dig_a > dig_b) { 2121fcf5ef2aSThomas Huth return 1; 2122fcf5ef2aSThomas Huth } else if (dig_a < dig_b) { 2123fcf5ef2aSThomas Huth return -1; 2124fcf5ef2aSThomas Huth } 2125fcf5ef2aSThomas Huth } 2126fcf5ef2aSThomas Huth 2127fcf5ef2aSThomas Huth return 0; 2128fcf5ef2aSThomas Huth } 2129fcf5ef2aSThomas Huth 2130936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2131fcf5ef2aSThomas Huth int *overflow) 2132fcf5ef2aSThomas Huth { 2133fcf5ef2aSThomas Huth int carry = 0; 2134fcf5ef2aSThomas Huth int i; 2135936fda4dSFabiano Rosas int is_zero = 1; 2136936fda4dSFabiano Rosas 2137fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2138fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) + 2139fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2140936fda4dSFabiano Rosas is_zero &= (digit == 0); 2141fcf5ef2aSThomas Huth if (digit > 9) { 2142fcf5ef2aSThomas Huth carry = 1; 2143fcf5ef2aSThomas Huth digit -= 10; 2144fcf5ef2aSThomas Huth } else { 2145fcf5ef2aSThomas Huth carry = 0; 2146fcf5ef2aSThomas Huth } 2147fcf5ef2aSThomas Huth 2148fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2149fcf5ef2aSThomas Huth } 2150fcf5ef2aSThomas Huth 2151fcf5ef2aSThomas Huth *overflow = carry; 2152936fda4dSFabiano Rosas return is_zero; 2153fcf5ef2aSThomas Huth } 2154fcf5ef2aSThomas Huth 2155d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2156fcf5ef2aSThomas Huth int *overflow) 2157fcf5ef2aSThomas Huth { 2158fcf5ef2aSThomas Huth int carry = 0; 2159fcf5ef2aSThomas Huth int i; 2160d03b174aSYasmin Beatriz 2161fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2162fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) - 2163fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2164fcf5ef2aSThomas Huth if (digit & 0x80) { 2165fcf5ef2aSThomas Huth carry = -1; 2166fcf5ef2aSThomas Huth digit += 10; 2167fcf5ef2aSThomas Huth } else { 2168fcf5ef2aSThomas Huth carry = 0; 2169fcf5ef2aSThomas Huth } 2170fcf5ef2aSThomas Huth 2171fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2172fcf5ef2aSThomas Huth } 2173fcf5ef2aSThomas Huth 2174fcf5ef2aSThomas Huth *overflow = carry; 2175fcf5ef2aSThomas Huth } 2176fcf5ef2aSThomas Huth 2177fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2178fcf5ef2aSThomas Huth { 2179fcf5ef2aSThomas Huth 2180fcf5ef2aSThomas Huth int sgna = bcd_get_sgn(a); 2181fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2182fcf5ef2aSThomas Huth int invalid = (sgna == 0) || (sgnb == 0); 2183fcf5ef2aSThomas Huth int overflow = 0; 2184936fda4dSFabiano Rosas int zero = 0; 2185fcf5ef2aSThomas Huth uint32_t cr = 0; 2186fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 2187fcf5ef2aSThomas Huth 2188fcf5ef2aSThomas Huth if (!invalid) { 2189fcf5ef2aSThomas Huth if (sgna == sgnb) { 2190428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2191936fda4dSFabiano Rosas zero = bcd_add_mag(&result, a, b, &invalid, &overflow); 2192936fda4dSFabiano Rosas cr = (sgna > 0) ? CRF_GT : CRF_LT; 2193fcf5ef2aSThomas Huth } else { 2194d03b174aSYasmin Beatriz int magnitude = bcd_cmp_mag(a, b); 2195d03b174aSYasmin Beatriz if (magnitude > 0) { 2196428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2197d03b174aSYasmin Beatriz bcd_sub_mag(&result, a, b, &invalid, &overflow); 2198d03b174aSYasmin Beatriz cr = (sgna > 0) ? CRF_GT : CRF_LT; 2199d03b174aSYasmin Beatriz } else if (magnitude < 0) { 2200428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps); 2201d03b174aSYasmin Beatriz bcd_sub_mag(&result, b, a, &invalid, &overflow); 2202efa73196SNikunj A Dadhania cr = (sgnb > 0) ? CRF_GT : CRF_LT; 2203d03b174aSYasmin Beatriz } else { 2204428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps); 2205d03b174aSYasmin Beatriz cr = CRF_EQ; 2206d03b174aSYasmin Beatriz } 2207fcf5ef2aSThomas Huth } 2208fcf5ef2aSThomas Huth } 2209fcf5ef2aSThomas Huth 2210fcf5ef2aSThomas Huth if (unlikely(invalid)) { 22113c385a93SMark Cave-Ayland result.VsrD(0) = result.VsrD(1) = -1; 2212efa73196SNikunj A Dadhania cr = CRF_SO; 2213fcf5ef2aSThomas Huth } else if (overflow) { 2214efa73196SNikunj A Dadhania cr |= CRF_SO; 2215936fda4dSFabiano Rosas } else if (zero) { 2216936fda4dSFabiano Rosas cr |= CRF_EQ; 2217fcf5ef2aSThomas Huth } 2218fcf5ef2aSThomas Huth 2219fcf5ef2aSThomas Huth *r = result; 2220fcf5ef2aSThomas Huth 2221fcf5ef2aSThomas Huth return cr; 2222fcf5ef2aSThomas Huth } 2223fcf5ef2aSThomas Huth 2224fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2225fcf5ef2aSThomas Huth { 2226fcf5ef2aSThomas Huth ppc_avr_t bcopy = *b; 2227fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2228fcf5ef2aSThomas Huth if (sgnb < 0) { 2229fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0); 2230fcf5ef2aSThomas Huth } else if (sgnb > 0) { 2231fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_NEG_PREF, 0); 2232fcf5ef2aSThomas Huth } 2233fcf5ef2aSThomas Huth /* else invalid ... defer to bcdadd code for proper handling */ 2234fcf5ef2aSThomas Huth 2235fcf5ef2aSThomas Huth return helper_bcdadd(r, a, &bcopy, ps); 2236fcf5ef2aSThomas Huth } 2237fcf5ef2aSThomas Huth 2238fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2239fcf5ef2aSThomas Huth { 2240fcf5ef2aSThomas Huth int i; 2241fcf5ef2aSThomas Huth int cr = 0; 2242fcf5ef2aSThomas Huth uint16_t national = 0; 2243fcf5ef2aSThomas Huth uint16_t sgnb = get_national_digit(b, 0); 2244fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2245fcf5ef2aSThomas Huth int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG); 2246fcf5ef2aSThomas Huth 2247fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2248fcf5ef2aSThomas Huth national = get_national_digit(b, i); 2249fcf5ef2aSThomas Huth if (unlikely(national < 0x30 || national > 0x39)) { 2250fcf5ef2aSThomas Huth invalid = 1; 2251fcf5ef2aSThomas Huth break; 2252fcf5ef2aSThomas Huth } 2253fcf5ef2aSThomas Huth 2254fcf5ef2aSThomas Huth bcd_put_digit(&ret, national & 0xf, i); 2255fcf5ef2aSThomas Huth } 2256fcf5ef2aSThomas Huth 2257fcf5ef2aSThomas Huth if (sgnb == NATIONAL_PLUS) { 2258fcf5ef2aSThomas Huth bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0); 2259fcf5ef2aSThomas Huth } else { 2260fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2261fcf5ef2aSThomas Huth } 2262fcf5ef2aSThomas Huth 2263fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2264fcf5ef2aSThomas Huth 2265fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2266efa73196SNikunj A Dadhania cr = CRF_SO; 2267fcf5ef2aSThomas Huth } 2268fcf5ef2aSThomas Huth 2269fcf5ef2aSThomas Huth *r = ret; 2270fcf5ef2aSThomas Huth 2271fcf5ef2aSThomas Huth return cr; 2272fcf5ef2aSThomas Huth } 2273fcf5ef2aSThomas Huth 2274fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2275fcf5ef2aSThomas Huth { 2276fcf5ef2aSThomas Huth int i; 2277fcf5ef2aSThomas Huth int cr = 0; 2278fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2279fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2280fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2281fcf5ef2aSThomas Huth 22823c385a93SMark Cave-Ayland int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0); 2283fcf5ef2aSThomas Huth 2284fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2285fcf5ef2aSThomas Huth set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i); 2286fcf5ef2aSThomas Huth 2287fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2288fcf5ef2aSThomas Huth break; 2289fcf5ef2aSThomas Huth } 2290fcf5ef2aSThomas Huth } 2291fcf5ef2aSThomas Huth set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0); 2292fcf5ef2aSThomas Huth 2293fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2294fcf5ef2aSThomas Huth 2295fcf5ef2aSThomas Huth if (ox_flag) { 2296efa73196SNikunj A Dadhania cr |= CRF_SO; 2297fcf5ef2aSThomas Huth } 2298fcf5ef2aSThomas Huth 2299fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2300efa73196SNikunj A Dadhania cr = CRF_SO; 2301fcf5ef2aSThomas Huth } 2302fcf5ef2aSThomas Huth 2303fcf5ef2aSThomas Huth *r = ret; 2304fcf5ef2aSThomas Huth 2305fcf5ef2aSThomas Huth return cr; 2306fcf5ef2aSThomas Huth } 2307fcf5ef2aSThomas Huth 2308fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2309fcf5ef2aSThomas Huth { 2310fcf5ef2aSThomas Huth int i; 2311fcf5ef2aSThomas Huth int cr = 0; 2312fcf5ef2aSThomas Huth int invalid = 0; 2313fcf5ef2aSThomas Huth int zone_digit = 0; 2314fcf5ef2aSThomas Huth int zone_lead = ps ? 0xF : 0x3; 2315fcf5ef2aSThomas Huth int digit = 0; 2316fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2317428115c3SMark Cave-Ayland int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4; 2318fcf5ef2aSThomas Huth 2319fcf5ef2aSThomas Huth if (unlikely((sgnb < 0xA) && ps)) { 2320fcf5ef2aSThomas Huth invalid = 1; 2321fcf5ef2aSThomas Huth } 2322fcf5ef2aSThomas Huth 2323fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2324428115c3SMark Cave-Ayland zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead; 2325428115c3SMark Cave-Ayland digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF; 2326fcf5ef2aSThomas Huth if (unlikely(zone_digit != zone_lead || digit > 0x9)) { 2327fcf5ef2aSThomas Huth invalid = 1; 2328fcf5ef2aSThomas Huth break; 2329fcf5ef2aSThomas Huth } 2330fcf5ef2aSThomas Huth 2331fcf5ef2aSThomas Huth bcd_put_digit(&ret, digit, i + 1); 2332fcf5ef2aSThomas Huth } 2333fcf5ef2aSThomas Huth 2334fcf5ef2aSThomas Huth if ((ps && (sgnb == 0xB || sgnb == 0xD)) || 2335fcf5ef2aSThomas Huth (!ps && (sgnb & 0x4))) { 2336fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2337fcf5ef2aSThomas Huth } else { 2338fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0); 2339fcf5ef2aSThomas Huth } 2340fcf5ef2aSThomas Huth 2341fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2342fcf5ef2aSThomas Huth 2343fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2344efa73196SNikunj A Dadhania cr = CRF_SO; 2345fcf5ef2aSThomas Huth } 2346fcf5ef2aSThomas Huth 2347fcf5ef2aSThomas Huth *r = ret; 2348fcf5ef2aSThomas Huth 2349fcf5ef2aSThomas Huth return cr; 2350fcf5ef2aSThomas Huth } 2351fcf5ef2aSThomas Huth 2352fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2353fcf5ef2aSThomas Huth { 2354fcf5ef2aSThomas Huth int i; 2355fcf5ef2aSThomas Huth int cr = 0; 2356fcf5ef2aSThomas Huth uint8_t digit = 0; 2357fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2358fcf5ef2aSThomas Huth int zone_lead = (ps) ? 0xF0 : 0x30; 2359fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2360fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2361fcf5ef2aSThomas Huth 23623c385a93SMark Cave-Ayland int ox_flag = ((b->VsrD(0) >> 4) != 0); 2363fcf5ef2aSThomas Huth 2364fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2365fcf5ef2aSThomas Huth digit = bcd_get_digit(b, i + 1, &invalid); 2366fcf5ef2aSThomas Huth 2367fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2368fcf5ef2aSThomas Huth break; 2369fcf5ef2aSThomas Huth } 2370fcf5ef2aSThomas Huth 2371428115c3SMark Cave-Ayland ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit; 2372fcf5ef2aSThomas Huth } 2373fcf5ef2aSThomas Huth 2374fcf5ef2aSThomas Huth if (ps) { 2375fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1); 2376fcf5ef2aSThomas Huth } else { 2377fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1); 2378fcf5ef2aSThomas Huth } 2379fcf5ef2aSThomas Huth 2380fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2381fcf5ef2aSThomas Huth 2382fcf5ef2aSThomas Huth if (ox_flag) { 2383efa73196SNikunj A Dadhania cr |= CRF_SO; 2384fcf5ef2aSThomas Huth } 2385fcf5ef2aSThomas Huth 2386fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2387efa73196SNikunj A Dadhania cr = CRF_SO; 2388fcf5ef2aSThomas Huth } 2389fcf5ef2aSThomas Huth 2390fcf5ef2aSThomas Huth *r = ret; 2391fcf5ef2aSThomas Huth 2392fcf5ef2aSThomas Huth return cr; 2393fcf5ef2aSThomas Huth } 2394fcf5ef2aSThomas Huth 2395a3d67f3eSLuis Pires /** 2396a3d67f3eSLuis Pires * Compare 2 128-bit unsigned integers, passed in as unsigned 64-bit pairs 2397a3d67f3eSLuis Pires * 2398a3d67f3eSLuis Pires * Returns: 2399a3d67f3eSLuis Pires * > 0 if ahi|alo > bhi|blo, 2400a3d67f3eSLuis Pires * 0 if ahi|alo == bhi|blo, 2401a3d67f3eSLuis Pires * < 0 if ahi|alo < bhi|blo 2402a3d67f3eSLuis Pires */ 2403a3d67f3eSLuis Pires static inline int ucmp128(uint64_t alo, uint64_t ahi, 2404a3d67f3eSLuis Pires uint64_t blo, uint64_t bhi) 2405a3d67f3eSLuis Pires { 2406a3d67f3eSLuis Pires return (ahi == bhi) ? 2407a3d67f3eSLuis Pires (alo > blo ? 1 : (alo == blo ? 0 : -1)) : 2408a3d67f3eSLuis Pires (ahi > bhi ? 1 : -1); 2409a3d67f3eSLuis Pires } 2410a3d67f3eSLuis Pires 2411a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2412a406c058SJose Ricardo Ziviani { 2413a406c058SJose Ricardo Ziviani int i; 2414a3d67f3eSLuis Pires int cr; 2415a406c058SJose Ricardo Ziviani uint64_t lo_value; 2416a406c058SJose Ricardo Ziviani uint64_t hi_value; 241740f3e79aSLuis Pires uint64_t rem; 2418a406c058SJose Ricardo Ziviani ppc_avr_t ret = { .u64 = { 0, 0 } }; 2419a406c058SJose Ricardo Ziviani 24203c385a93SMark Cave-Ayland if (b->VsrSD(0) < 0) { 24213c385a93SMark Cave-Ayland lo_value = -b->VsrSD(1); 24223c385a93SMark Cave-Ayland hi_value = ~b->VsrD(0) + !lo_value; 2423a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, 0xD, 0); 2424a3d67f3eSLuis Pires 2425a3d67f3eSLuis Pires cr = CRF_LT; 2426a406c058SJose Ricardo Ziviani } else { 24273c385a93SMark Cave-Ayland lo_value = b->VsrD(1); 24283c385a93SMark Cave-Ayland hi_value = b->VsrD(0); 2429a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0); 2430a3d67f3eSLuis Pires 2431a3d67f3eSLuis Pires if (hi_value == 0 && lo_value == 0) { 2432a3d67f3eSLuis Pires cr = CRF_EQ; 2433a3d67f3eSLuis Pires } else { 2434a3d67f3eSLuis Pires cr = CRF_GT; 2435a3d67f3eSLuis Pires } 2436a406c058SJose Ricardo Ziviani } 2437a406c058SJose Ricardo Ziviani 2438a3d67f3eSLuis Pires /* 2439a3d67f3eSLuis Pires * Check src limits: abs(src) <= 10^31 - 1 2440a3d67f3eSLuis Pires * 2441a3d67f3eSLuis Pires * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff 2442a3d67f3eSLuis Pires */ 2443a3d67f3eSLuis Pires if (ucmp128(lo_value, hi_value, 2444a3d67f3eSLuis Pires 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) { 2445a3d67f3eSLuis Pires cr |= CRF_SO; 2446a3d67f3eSLuis Pires 2447a3d67f3eSLuis Pires /* 2448a3d67f3eSLuis Pires * According to the ISA, if src wouldn't fit in the destination 2449a3d67f3eSLuis Pires * register, the result is undefined. 2450a3d67f3eSLuis Pires * In that case, we leave r unchanged. 2451a3d67f3eSLuis Pires */ 2452a3d67f3eSLuis Pires } else { 245340f3e79aSLuis Pires rem = divu128(&lo_value, &hi_value, 1000000000000000ULL); 2454a406c058SJose Ricardo Ziviani 245540f3e79aSLuis Pires for (i = 1; i < 16; rem /= 10, i++) { 245640f3e79aSLuis Pires bcd_put_digit(&ret, rem % 10, i); 2457a406c058SJose Ricardo Ziviani } 2458a406c058SJose Ricardo Ziviani 2459a406c058SJose Ricardo Ziviani for (; i < 32; lo_value /= 10, i++) { 2460a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, lo_value % 10, i); 2461a406c058SJose Ricardo Ziviani } 2462a406c058SJose Ricardo Ziviani 2463a406c058SJose Ricardo Ziviani *r = ret; 2464a3d67f3eSLuis Pires } 2465a406c058SJose Ricardo Ziviani 2466a406c058SJose Ricardo Ziviani return cr; 2467a406c058SJose Ricardo Ziviani } 2468a406c058SJose Ricardo Ziviani 2469c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2470c85bc7ddSJose Ricardo Ziviani { 2471c85bc7ddSJose Ricardo Ziviani uint8_t i; 2472c85bc7ddSJose Ricardo Ziviani int cr; 2473c85bc7ddSJose Ricardo Ziviani uint64_t carry; 2474c85bc7ddSJose Ricardo Ziviani uint64_t unused; 2475c85bc7ddSJose Ricardo Ziviani uint64_t lo_value; 2476c85bc7ddSJose Ricardo Ziviani uint64_t hi_value = 0; 2477c85bc7ddSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2478c85bc7ddSJose Ricardo Ziviani int invalid = (sgnb == 0); 2479c85bc7ddSJose Ricardo Ziviani 2480c85bc7ddSJose Ricardo Ziviani lo_value = bcd_get_digit(b, 31, &invalid); 2481c85bc7ddSJose Ricardo Ziviani for (i = 30; i > 0; i--) { 2482c85bc7ddSJose Ricardo Ziviani mulu64(&lo_value, &carry, lo_value, 10ULL); 2483c85bc7ddSJose Ricardo Ziviani mulu64(&hi_value, &unused, hi_value, 10ULL); 2484c85bc7ddSJose Ricardo Ziviani lo_value += bcd_get_digit(b, i, &invalid); 2485c85bc7ddSJose Ricardo Ziviani hi_value += carry; 2486c85bc7ddSJose Ricardo Ziviani 2487c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2488c85bc7ddSJose Ricardo Ziviani break; 2489c85bc7ddSJose Ricardo Ziviani } 2490c85bc7ddSJose Ricardo Ziviani } 2491c85bc7ddSJose Ricardo Ziviani 2492c85bc7ddSJose Ricardo Ziviani if (sgnb == -1) { 24933c385a93SMark Cave-Ayland r->VsrSD(1) = -lo_value; 24943c385a93SMark Cave-Ayland r->VsrSD(0) = ~hi_value + !r->VsrSD(1); 2495c85bc7ddSJose Ricardo Ziviani } else { 24963c385a93SMark Cave-Ayland r->VsrSD(1) = lo_value; 24973c385a93SMark Cave-Ayland r->VsrSD(0) = hi_value; 2498c85bc7ddSJose Ricardo Ziviani } 2499c85bc7ddSJose Ricardo Ziviani 2500c85bc7ddSJose Ricardo Ziviani cr = bcd_cmp_zero(b); 2501c85bc7ddSJose Ricardo Ziviani 2502c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2503c85bc7ddSJose Ricardo Ziviani cr = CRF_SO; 2504c85bc7ddSJose Ricardo Ziviani } 2505c85bc7ddSJose Ricardo Ziviani 2506c85bc7ddSJose Ricardo Ziviani return cr; 2507c85bc7ddSJose Ricardo Ziviani } 2508c85bc7ddSJose Ricardo Ziviani 2509c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2510c3025c3bSJose Ricardo Ziviani { 2511c3025c3bSJose Ricardo Ziviani int i; 2512c3025c3bSJose Ricardo Ziviani int invalid = 0; 2513c3025c3bSJose Ricardo Ziviani 2514c3025c3bSJose Ricardo Ziviani if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) { 2515c3025c3bSJose Ricardo Ziviani return CRF_SO; 2516c3025c3bSJose Ricardo Ziviani } 2517c3025c3bSJose Ricardo Ziviani 2518c3025c3bSJose Ricardo Ziviani *r = *a; 2519428115c3SMark Cave-Ayland bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0); 2520c3025c3bSJose Ricardo Ziviani 2521c3025c3bSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2522c3025c3bSJose Ricardo Ziviani bcd_get_digit(a, i, &invalid); 2523c3025c3bSJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2524c3025c3bSJose Ricardo Ziviani if (unlikely(invalid)) { 2525c3025c3bSJose Ricardo Ziviani return CRF_SO; 2526c3025c3bSJose Ricardo Ziviani } 2527c3025c3bSJose Ricardo Ziviani } 2528c3025c3bSJose Ricardo Ziviani 2529c3025c3bSJose Ricardo Ziviani return bcd_cmp_zero(r); 2530c3025c3bSJose Ricardo Ziviani } 2531c3025c3bSJose Ricardo Ziviani 2532466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2533466a3f9cSJose Ricardo Ziviani { 2534466a3f9cSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2535466a3f9cSJose Ricardo Ziviani 2536466a3f9cSJose Ricardo Ziviani *r = *b; 2537466a3f9cSJose Ricardo Ziviani bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0); 2538466a3f9cSJose Ricardo Ziviani 2539071663dfSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2540466a3f9cSJose Ricardo Ziviani return CRF_SO; 2541466a3f9cSJose Ricardo Ziviani } 2542466a3f9cSJose Ricardo Ziviani 2543466a3f9cSJose Ricardo Ziviani return bcd_cmp_zero(r); 2544466a3f9cSJose Ricardo Ziviani } 2545466a3f9cSJose Ricardo Ziviani 2546e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2547e04797f7SJose Ricardo Ziviani { 2548e04797f7SJose Ricardo Ziviani int cr; 2549428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2550e04797f7SJose Ricardo Ziviani bool ox_flag = false; 2551e04797f7SJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2552e04797f7SJose Ricardo Ziviani ppc_avr_t ret = *b; 25533c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2554e04797f7SJose Ricardo Ziviani 2555e04797f7SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2556e04797f7SJose Ricardo Ziviani return CRF_SO; 2557e04797f7SJose Ricardo Ziviani } 2558e04797f7SJose Ricardo Ziviani 2559e04797f7SJose Ricardo Ziviani if (unlikely(i > 31)) { 2560e04797f7SJose Ricardo Ziviani i = 31; 2561e04797f7SJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2562e04797f7SJose Ricardo Ziviani i = -31; 2563e04797f7SJose Ricardo Ziviani } 2564e04797f7SJose Ricardo Ziviani 2565e04797f7SJose Ricardo Ziviani if (i > 0) { 25663c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2567e04797f7SJose Ricardo Ziviani } else { 25683c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2569e04797f7SJose Ricardo Ziviani } 2570e04797f7SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2571e04797f7SJose Ricardo Ziviani 2572e04797f7SJose Ricardo Ziviani *r = ret; 2573e04797f7SJose Ricardo Ziviani 2574e04797f7SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2575e04797f7SJose Ricardo Ziviani if (ox_flag) { 2576e04797f7SJose Ricardo Ziviani cr |= CRF_SO; 2577e04797f7SJose Ricardo Ziviani } 2578e04797f7SJose Ricardo Ziviani 2579e04797f7SJose Ricardo Ziviani return cr; 2580e04797f7SJose Ricardo Ziviani } 2581e04797f7SJose Ricardo Ziviani 2582a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2583a49a95e9SJose Ricardo Ziviani { 2584a49a95e9SJose Ricardo Ziviani int cr; 2585a49a95e9SJose Ricardo Ziviani int i; 2586a49a95e9SJose Ricardo Ziviani int invalid = 0; 2587a49a95e9SJose Ricardo Ziviani bool ox_flag = false; 2588a49a95e9SJose Ricardo Ziviani ppc_avr_t ret = *b; 2589a49a95e9SJose Ricardo Ziviani 2590a49a95e9SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 2591a49a95e9SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2592a49a95e9SJose Ricardo Ziviani 2593a49a95e9SJose Ricardo Ziviani if (unlikely(invalid)) { 2594a49a95e9SJose Ricardo Ziviani return CRF_SO; 2595a49a95e9SJose Ricardo Ziviani } 2596a49a95e9SJose Ricardo Ziviani } 2597a49a95e9SJose Ricardo Ziviani 2598428115c3SMark Cave-Ayland i = a->VsrSB(7); 2599a49a95e9SJose Ricardo Ziviani if (i >= 32) { 2600a49a95e9SJose Ricardo Ziviani ox_flag = true; 26013c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2602a49a95e9SJose Ricardo Ziviani } else if (i <= -32) { 26033c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2604a49a95e9SJose Ricardo Ziviani } else if (i > 0) { 26053c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2606a49a95e9SJose Ricardo Ziviani } else { 26073c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2608a49a95e9SJose Ricardo Ziviani } 2609a49a95e9SJose Ricardo Ziviani *r = ret; 2610a49a95e9SJose Ricardo Ziviani 2611a49a95e9SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2612a49a95e9SJose Ricardo Ziviani if (ox_flag) { 2613a49a95e9SJose Ricardo Ziviani cr |= CRF_SO; 2614a49a95e9SJose Ricardo Ziviani } 2615a49a95e9SJose Ricardo Ziviani 2616a49a95e9SJose Ricardo Ziviani return cr; 2617a49a95e9SJose Ricardo Ziviani } 2618a49a95e9SJose Ricardo Ziviani 2619a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2620a54238adSJose Ricardo Ziviani { 2621a54238adSJose Ricardo Ziviani int cr; 2622a54238adSJose Ricardo Ziviani int unused = 0; 2623a54238adSJose Ricardo Ziviani int invalid = 0; 2624a54238adSJose Ricardo Ziviani bool ox_flag = false; 2625a54238adSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2626a54238adSJose Ricardo Ziviani ppc_avr_t ret = *b; 26273c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2628a54238adSJose Ricardo Ziviani 2629428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2630428115c3SMark Cave-Ayland ppc_avr_t bcd_one; 2631428115c3SMark Cave-Ayland 2632428115c3SMark Cave-Ayland bcd_one.VsrD(0) = 0; 2633428115c3SMark Cave-Ayland bcd_one.VsrD(1) = 0x10; 2634a54238adSJose Ricardo Ziviani 2635a54238adSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2636a54238adSJose Ricardo Ziviani return CRF_SO; 2637a54238adSJose Ricardo Ziviani } 2638a54238adSJose Ricardo Ziviani 2639a54238adSJose Ricardo Ziviani if (unlikely(i > 31)) { 2640a54238adSJose Ricardo Ziviani i = 31; 2641a54238adSJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2642a54238adSJose Ricardo Ziviani i = -31; 2643a54238adSJose Ricardo Ziviani } 2644a54238adSJose Ricardo Ziviani 2645a54238adSJose Ricardo Ziviani if (i > 0) { 26463c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2647a54238adSJose Ricardo Ziviani } else { 26483c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2649a54238adSJose Ricardo Ziviani 2650a54238adSJose Ricardo Ziviani if (bcd_get_digit(&ret, 0, &invalid) >= 5) { 2651a54238adSJose Ricardo Ziviani bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused); 2652a54238adSJose Ricardo Ziviani } 2653a54238adSJose Ricardo Ziviani } 2654a54238adSJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2655a54238adSJose Ricardo Ziviani 2656a54238adSJose Ricardo Ziviani cr = bcd_cmp_zero(&ret); 2657a54238adSJose Ricardo Ziviani if (ox_flag) { 2658a54238adSJose Ricardo Ziviani cr |= CRF_SO; 2659a54238adSJose Ricardo Ziviani } 2660a54238adSJose Ricardo Ziviani *r = ret; 2661a54238adSJose Ricardo Ziviani 2662a54238adSJose Ricardo Ziviani return cr; 2663a54238adSJose Ricardo Ziviani } 2664a54238adSJose Ricardo Ziviani 266531bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 266631bc4d11SJose Ricardo Ziviani { 266731bc4d11SJose Ricardo Ziviani uint64_t mask; 266831bc4d11SJose Ricardo Ziviani uint32_t ox_flag = 0; 2669428115c3SMark Cave-Ayland int i = a->VsrSH(3) + 1; 267031bc4d11SJose Ricardo Ziviani ppc_avr_t ret = *b; 267131bc4d11SJose Ricardo Ziviani 267231bc4d11SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 267331bc4d11SJose Ricardo Ziviani return CRF_SO; 267431bc4d11SJose Ricardo Ziviani } 267531bc4d11SJose Ricardo Ziviani 267631bc4d11SJose Ricardo Ziviani if (i > 16 && i < 32) { 267731bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 26783c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 267931bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 268031bc4d11SJose Ricardo Ziviani } 268131bc4d11SJose Ricardo Ziviani 26823c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 268331bc4d11SJose Ricardo Ziviani } else if (i >= 0 && i <= 16) { 268431bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 26853c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 268631bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 268731bc4d11SJose Ricardo Ziviani } 268831bc4d11SJose Ricardo Ziviani 26893c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 26903c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 269131bc4d11SJose Ricardo Ziviani } 269231bc4d11SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0); 269331bc4d11SJose Ricardo Ziviani *r = ret; 269431bc4d11SJose Ricardo Ziviani 269531bc4d11SJose Ricardo Ziviani return bcd_cmp_zero(&ret) | ox_flag; 269631bc4d11SJose Ricardo Ziviani } 269731bc4d11SJose Ricardo Ziviani 26985c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 26995c32e2e4SJose Ricardo Ziviani { 27005c32e2e4SJose Ricardo Ziviani int i; 27015c32e2e4SJose Ricardo Ziviani uint64_t mask; 27025c32e2e4SJose Ricardo Ziviani uint32_t ox_flag = 0; 27035c32e2e4SJose Ricardo Ziviani int invalid = 0; 27045c32e2e4SJose Ricardo Ziviani ppc_avr_t ret = *b; 27055c32e2e4SJose Ricardo Ziviani 27065c32e2e4SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 27075c32e2e4SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 27085c32e2e4SJose Ricardo Ziviani 27095c32e2e4SJose Ricardo Ziviani if (unlikely(invalid)) { 27105c32e2e4SJose Ricardo Ziviani return CRF_SO; 27115c32e2e4SJose Ricardo Ziviani } 27125c32e2e4SJose Ricardo Ziviani } 27135c32e2e4SJose Ricardo Ziviani 2714428115c3SMark Cave-Ayland i = a->VsrSH(3); 27155c32e2e4SJose Ricardo Ziviani if (i > 16 && i < 33) { 27165c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 27173c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 27185c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 27195c32e2e4SJose Ricardo Ziviani } 27205c32e2e4SJose Ricardo Ziviani 27213c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 27225c32e2e4SJose Ricardo Ziviani } else if (i > 0 && i <= 16) { 27235c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 27243c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 27255c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 27265c32e2e4SJose Ricardo Ziviani } 27275c32e2e4SJose Ricardo Ziviani 27283c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 27293c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 27305c32e2e4SJose Ricardo Ziviani } else if (i == 0) { 27313c385a93SMark Cave-Ayland if (ret.VsrD(0) || ret.VsrD(1)) { 27325c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 27335c32e2e4SJose Ricardo Ziviani } 27343c385a93SMark Cave-Ayland ret.VsrD(0) = ret.VsrD(1) = 0; 27355c32e2e4SJose Ricardo Ziviani } 27365c32e2e4SJose Ricardo Ziviani 27375c32e2e4SJose Ricardo Ziviani *r = ret; 27383c385a93SMark Cave-Ayland if (r->VsrD(0) == 0 && r->VsrD(1) == 0) { 27395c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_EQ; 27405c32e2e4SJose Ricardo Ziviani } 27415c32e2e4SJose Ricardo Ziviani 27425c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_GT; 27435c32e2e4SJose Ricardo Ziviani } 27445c32e2e4SJose Ricardo Ziviani 2745fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a) 2746fcf5ef2aSThomas Huth { 2747fcf5ef2aSThomas Huth int i; 2748fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 2749fcf5ef2aSThomas Huth r->u8[i] = AES_sbox[a->u8[i]]; 2750fcf5ef2aSThomas Huth } 2751fcf5ef2aSThomas Huth } 2752fcf5ef2aSThomas Huth 2753fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2754fcf5ef2aSThomas Huth { 2755fcf5ef2aSThomas Huth ppc_avr_t result; 2756fcf5ef2aSThomas Huth int i; 2757fcf5ef2aSThomas Huth 2758fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 27592dea57dbSMark Cave-Ayland result.VsrW(i) = b->VsrW(i) ^ 27602dea57dbSMark Cave-Ayland (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^ 27612dea57dbSMark Cave-Ayland AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^ 27622dea57dbSMark Cave-Ayland AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^ 27632dea57dbSMark Cave-Ayland AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]); 2764fcf5ef2aSThomas Huth } 2765fcf5ef2aSThomas Huth *r = result; 2766fcf5ef2aSThomas Huth } 2767fcf5ef2aSThomas Huth 2768fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2769fcf5ef2aSThomas Huth { 2770fcf5ef2aSThomas Huth ppc_avr_t result; 2771fcf5ef2aSThomas Huth int i; 2772fcf5ef2aSThomas Huth 2773fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 27742dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]); 2775fcf5ef2aSThomas Huth } 2776fcf5ef2aSThomas Huth *r = result; 2777fcf5ef2aSThomas Huth } 2778fcf5ef2aSThomas Huth 2779fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2780fcf5ef2aSThomas Huth { 2781fcf5ef2aSThomas Huth /* This differs from what is written in ISA V2.07. The RTL is */ 2782fcf5ef2aSThomas Huth /* incorrect and will be fixed in V2.07B. */ 2783fcf5ef2aSThomas Huth int i; 2784fcf5ef2aSThomas Huth ppc_avr_t tmp; 2785fcf5ef2aSThomas Huth 2786fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 27872dea57dbSMark Cave-Ayland tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])]; 2788fcf5ef2aSThomas Huth } 2789fcf5ef2aSThomas Huth 2790fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 27912dea57dbSMark Cave-Ayland r->VsrW(i) = 27922dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 0)][0] ^ 27932dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 1)][1] ^ 27942dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 2)][2] ^ 27952dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 3)][3]; 2796fcf5ef2aSThomas Huth } 2797fcf5ef2aSThomas Huth } 2798fcf5ef2aSThomas Huth 2799fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2800fcf5ef2aSThomas Huth { 2801fcf5ef2aSThomas Huth ppc_avr_t result; 2802fcf5ef2aSThomas Huth int i; 2803fcf5ef2aSThomas Huth 2804fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 28052dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]); 2806fcf5ef2aSThomas Huth } 2807fcf5ef2aSThomas Huth *r = result; 2808fcf5ef2aSThomas Huth } 2809fcf5ef2aSThomas Huth 2810fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 2811fcf5ef2aSThomas Huth { 2812fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 2813fcf5ef2aSThomas Huth int six = st_six & 0xF; 2814fcf5ef2aSThomas Huth int i; 2815fcf5ef2aSThomas Huth 2816730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 2817fcf5ef2aSThomas Huth if (st == 0) { 2818fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 28190ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 7) ^ 28200ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 18) ^ 2821730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 3); 2822fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 28230ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 17) ^ 28240ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 19) ^ 2825730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 10); 2826fcf5ef2aSThomas Huth } 2827fcf5ef2aSThomas Huth } else { /* st == 1 */ 2828fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 28290ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 2) ^ 28300ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 13) ^ 28310ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 22); 2832fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 28330ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 6) ^ 28340ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 11) ^ 28350ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 25); 2836fcf5ef2aSThomas Huth } 2837fcf5ef2aSThomas Huth } 2838fcf5ef2aSThomas Huth } 2839fcf5ef2aSThomas Huth } 2840fcf5ef2aSThomas Huth 2841fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 2842fcf5ef2aSThomas Huth { 2843fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 2844fcf5ef2aSThomas Huth int six = st_six & 0xF; 2845fcf5ef2aSThomas Huth int i; 2846fcf5ef2aSThomas Huth 2847730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 2848fcf5ef2aSThomas Huth if (st == 0) { 2849fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 28500ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 1) ^ 28510ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 8) ^ 2852730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 7); 2853fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 28540ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 19) ^ 28550ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 61) ^ 2856730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 6); 2857fcf5ef2aSThomas Huth } 2858fcf5ef2aSThomas Huth } else { /* st == 1 */ 2859fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 28600ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 28) ^ 28610ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 34) ^ 28620ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 39); 2863fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 28640ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 14) ^ 28650ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 18) ^ 28660ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 41); 2867fcf5ef2aSThomas Huth } 2868fcf5ef2aSThomas Huth } 2869fcf5ef2aSThomas Huth } 2870fcf5ef2aSThomas Huth } 2871fcf5ef2aSThomas Huth 2872fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2873fcf5ef2aSThomas Huth { 2874fcf5ef2aSThomas Huth ppc_avr_t result; 2875fcf5ef2aSThomas Huth int i; 2876fcf5ef2aSThomas Huth 287760594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 287860594feaSMark Cave-Ayland int indexA = c->VsrB(i) >> 4; 287960594feaSMark Cave-Ayland int indexB = c->VsrB(i) & 0xF; 288060594feaSMark Cave-Ayland 288160594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB); 2882fcf5ef2aSThomas Huth } 2883fcf5ef2aSThomas Huth *r = result; 2884fcf5ef2aSThomas Huth } 2885fcf5ef2aSThomas Huth 2886fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I 2887fcf5ef2aSThomas Huth 2888fcf5ef2aSThomas Huth /*****************************************************************************/ 2889fcf5ef2aSThomas Huth /* SPE extension helpers */ 2890fcf5ef2aSThomas Huth /* Use a table to make this quicker */ 2891fcf5ef2aSThomas Huth static const uint8_t hbrev[16] = { 2892fcf5ef2aSThomas Huth 0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE, 2893fcf5ef2aSThomas Huth 0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF, 2894fcf5ef2aSThomas Huth }; 2895fcf5ef2aSThomas Huth 2896fcf5ef2aSThomas Huth static inline uint8_t byte_reverse(uint8_t val) 2897fcf5ef2aSThomas Huth { 2898fcf5ef2aSThomas Huth return hbrev[val >> 4] | (hbrev[val & 0xF] << 4); 2899fcf5ef2aSThomas Huth } 2900fcf5ef2aSThomas Huth 2901fcf5ef2aSThomas Huth static inline uint32_t word_reverse(uint32_t val) 2902fcf5ef2aSThomas Huth { 2903fcf5ef2aSThomas Huth return byte_reverse(val >> 24) | (byte_reverse(val >> 16) << 8) | 2904fcf5ef2aSThomas Huth (byte_reverse(val >> 8) << 16) | (byte_reverse(val) << 24); 2905fcf5ef2aSThomas Huth } 2906fcf5ef2aSThomas Huth 2907fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */ 2908fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2) 2909fcf5ef2aSThomas Huth { 2910fcf5ef2aSThomas Huth uint32_t a, b, d, mask; 2911fcf5ef2aSThomas Huth 2912fcf5ef2aSThomas Huth mask = UINT32_MAX >> (32 - MASKBITS); 2913fcf5ef2aSThomas Huth a = arg1 & mask; 2914fcf5ef2aSThomas Huth b = arg2 & mask; 2915fcf5ef2aSThomas Huth d = word_reverse(1 + word_reverse(a | ~b)); 2916fcf5ef2aSThomas Huth return (arg1 & ~mask) | (d & b); 2917fcf5ef2aSThomas Huth } 2918fcf5ef2aSThomas Huth 2919fcf5ef2aSThomas Huth uint32_t helper_cntlsw32(uint32_t val) 2920fcf5ef2aSThomas Huth { 2921fcf5ef2aSThomas Huth if (val & 0x80000000) { 2922fcf5ef2aSThomas Huth return clz32(~val); 2923fcf5ef2aSThomas Huth } else { 2924fcf5ef2aSThomas Huth return clz32(val); 2925fcf5ef2aSThomas Huth } 2926fcf5ef2aSThomas Huth } 2927fcf5ef2aSThomas Huth 2928fcf5ef2aSThomas Huth uint32_t helper_cntlzw32(uint32_t val) 2929fcf5ef2aSThomas Huth { 2930fcf5ef2aSThomas Huth return clz32(val); 2931fcf5ef2aSThomas Huth } 2932fcf5ef2aSThomas Huth 2933fcf5ef2aSThomas Huth /* 440 specific */ 2934fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high, 2935fcf5ef2aSThomas Huth target_ulong low, uint32_t update_Rc) 2936fcf5ef2aSThomas Huth { 2937fcf5ef2aSThomas Huth target_ulong mask; 2938fcf5ef2aSThomas Huth int i; 2939fcf5ef2aSThomas Huth 2940fcf5ef2aSThomas Huth i = 1; 2941fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 2942fcf5ef2aSThomas Huth if ((high & mask) == 0) { 2943fcf5ef2aSThomas Huth if (update_Rc) { 2944fcf5ef2aSThomas Huth env->crf[0] = 0x4; 2945fcf5ef2aSThomas Huth } 2946fcf5ef2aSThomas Huth goto done; 2947fcf5ef2aSThomas Huth } 2948fcf5ef2aSThomas Huth i++; 2949fcf5ef2aSThomas Huth } 2950fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 2951fcf5ef2aSThomas Huth if ((low & mask) == 0) { 2952fcf5ef2aSThomas Huth if (update_Rc) { 2953fcf5ef2aSThomas Huth env->crf[0] = 0x8; 2954fcf5ef2aSThomas Huth } 2955fcf5ef2aSThomas Huth goto done; 2956fcf5ef2aSThomas Huth } 2957fcf5ef2aSThomas Huth i++; 2958fcf5ef2aSThomas Huth } 2959fcf5ef2aSThomas Huth i = 8; 2960fcf5ef2aSThomas Huth if (update_Rc) { 2961fcf5ef2aSThomas Huth env->crf[0] = 0x2; 2962fcf5ef2aSThomas Huth } 2963fcf5ef2aSThomas Huth done: 2964fcf5ef2aSThomas Huth env->xer = (env->xer & ~0x7F) | i; 2965fcf5ef2aSThomas Huth if (update_Rc) { 2966fcf5ef2aSThomas Huth env->crf[0] |= xer_so; 2967fcf5ef2aSThomas Huth } 2968fcf5ef2aSThomas Huth return i; 2969fcf5ef2aSThomas Huth } 2970