1fcf5ef2aSThomas Huth /* 2fcf5ef2aSThomas Huth * PowerPC integer and vector emulation helpers for QEMU. 3fcf5ef2aSThomas Huth * 4fcf5ef2aSThomas Huth * Copyright (c) 2003-2007 Jocelyn Mayer 5fcf5ef2aSThomas Huth * 6fcf5ef2aSThomas Huth * This library is free software; you can redistribute it and/or 7fcf5ef2aSThomas Huth * modify it under the terms of the GNU Lesser General Public 8fcf5ef2aSThomas Huth * License as published by the Free Software Foundation; either 96bd039cdSChetan Pant * version 2.1 of the License, or (at your option) any later version. 10fcf5ef2aSThomas Huth * 11fcf5ef2aSThomas Huth * This library is distributed in the hope that it will be useful, 12fcf5ef2aSThomas Huth * but WITHOUT ANY WARRANTY; without even the implied warranty of 13fcf5ef2aSThomas Huth * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14fcf5ef2aSThomas Huth * Lesser General Public License for more details. 15fcf5ef2aSThomas Huth * 16fcf5ef2aSThomas Huth * You should have received a copy of the GNU Lesser General Public 17fcf5ef2aSThomas Huth * License along with this library; if not, see <http://www.gnu.org/licenses/>. 18fcf5ef2aSThomas Huth */ 19db725815SMarkus Armbruster 20fcf5ef2aSThomas Huth #include "qemu/osdep.h" 21fcf5ef2aSThomas Huth #include "cpu.h" 22fcf5ef2aSThomas Huth #include "internal.h" 23fcf5ef2aSThomas Huth #include "qemu/host-utils.h" 24db725815SMarkus Armbruster #include "qemu/main-loop.h" 258a05fd9aSRichard Henderson #include "qemu/log.h" 26fcf5ef2aSThomas Huth #include "exec/helper-proto.h" 27fcf5ef2aSThomas Huth #include "crypto/aes.h" 2824f91e81SAlex Bennée #include "fpu/softfloat.h" 293f74b632SRichard Henderson #include "qapi/error.h" 303f74b632SRichard Henderson #include "qemu/guest-random.h" 31fcf5ef2aSThomas Huth 32fcf5ef2aSThomas Huth #include "helper_regs.h" 33fcf5ef2aSThomas Huth /*****************************************************************************/ 34fcf5ef2aSThomas Huth /* Fixed point operations helpers */ 35fcf5ef2aSThomas Huth 36f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov) 37f32899deSNikunj A Dadhania { 38f32899deSNikunj A Dadhania if (unlikely(ov)) { 39f32899deSNikunj A Dadhania env->so = env->ov = 1; 40f32899deSNikunj A Dadhania } else { 41f32899deSNikunj A Dadhania env->ov = 0; 42f32899deSNikunj A Dadhania } 43f32899deSNikunj A Dadhania } 44f32899deSNikunj A Dadhania 45fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb, 46fcf5ef2aSThomas Huth uint32_t oe) 47fcf5ef2aSThomas Huth { 48fcf5ef2aSThomas Huth uint64_t rt = 0; 49fcf5ef2aSThomas Huth int overflow = 0; 50fcf5ef2aSThomas Huth 51fcf5ef2aSThomas Huth uint64_t dividend = (uint64_t)ra << 32; 52fcf5ef2aSThomas Huth uint64_t divisor = (uint32_t)rb; 53fcf5ef2aSThomas Huth 54fcf5ef2aSThomas Huth if (unlikely(divisor == 0)) { 55fcf5ef2aSThomas Huth overflow = 1; 56fcf5ef2aSThomas Huth } else { 57fcf5ef2aSThomas Huth rt = dividend / divisor; 58fcf5ef2aSThomas Huth overflow = rt > UINT32_MAX; 59fcf5ef2aSThomas Huth } 60fcf5ef2aSThomas Huth 61fcf5ef2aSThomas Huth if (unlikely(overflow)) { 62fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 63fcf5ef2aSThomas Huth } 64fcf5ef2aSThomas Huth 65fcf5ef2aSThomas Huth if (oe) { 66f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 67fcf5ef2aSThomas Huth } 68fcf5ef2aSThomas Huth 69fcf5ef2aSThomas Huth return (target_ulong)rt; 70fcf5ef2aSThomas Huth } 71fcf5ef2aSThomas Huth 72fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb, 73fcf5ef2aSThomas Huth uint32_t oe) 74fcf5ef2aSThomas Huth { 75fcf5ef2aSThomas Huth int64_t rt = 0; 76fcf5ef2aSThomas Huth int overflow = 0; 77fcf5ef2aSThomas Huth 78fcf5ef2aSThomas Huth int64_t dividend = (int64_t)ra << 32; 79fcf5ef2aSThomas Huth int64_t divisor = (int64_t)((int32_t)rb); 80fcf5ef2aSThomas Huth 81fcf5ef2aSThomas Huth if (unlikely((divisor == 0) || 82fcf5ef2aSThomas Huth ((divisor == -1ull) && (dividend == INT64_MIN)))) { 83fcf5ef2aSThomas Huth overflow = 1; 84fcf5ef2aSThomas Huth } else { 85fcf5ef2aSThomas Huth rt = dividend / divisor; 86fcf5ef2aSThomas Huth overflow = rt != (int32_t)rt; 87fcf5ef2aSThomas Huth } 88fcf5ef2aSThomas Huth 89fcf5ef2aSThomas Huth if (unlikely(overflow)) { 90fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 91fcf5ef2aSThomas Huth } 92fcf5ef2aSThomas Huth 93fcf5ef2aSThomas Huth if (oe) { 94f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 95fcf5ef2aSThomas Huth } 96fcf5ef2aSThomas Huth 97fcf5ef2aSThomas Huth return (target_ulong)rt; 98fcf5ef2aSThomas Huth } 99fcf5ef2aSThomas Huth 100fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 101fcf5ef2aSThomas Huth 102fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe) 103fcf5ef2aSThomas Huth { 104fcf5ef2aSThomas Huth uint64_t rt = 0; 105fcf5ef2aSThomas Huth int overflow = 0; 106fcf5ef2aSThomas Huth 1079276a31cSLuis Pires if (unlikely(rb == 0 || ra >= rb)) { 1089276a31cSLuis Pires overflow = 1; 109fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 1109276a31cSLuis Pires } else { 1119276a31cSLuis Pires divu128(&rt, &ra, rb); 112fcf5ef2aSThomas Huth } 113fcf5ef2aSThomas Huth 114fcf5ef2aSThomas Huth if (oe) { 115f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 116fcf5ef2aSThomas Huth } 117fcf5ef2aSThomas Huth 118fcf5ef2aSThomas Huth return rt; 119fcf5ef2aSThomas Huth } 120fcf5ef2aSThomas Huth 121fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe) 122fcf5ef2aSThomas Huth { 12340f3e79aSLuis Pires uint64_t rt = 0; 124fcf5ef2aSThomas Huth int64_t ra = (int64_t)rau; 125fcf5ef2aSThomas Huth int64_t rb = (int64_t)rbu; 1269276a31cSLuis Pires int overflow = 0; 127fcf5ef2aSThomas Huth 1289276a31cSLuis Pires if (unlikely(rb == 0 || uabs64(ra) >= uabs64(rb))) { 1299276a31cSLuis Pires overflow = 1; 130fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 1319276a31cSLuis Pires } else { 1329276a31cSLuis Pires divs128(&rt, &ra, rb); 133fcf5ef2aSThomas Huth } 134fcf5ef2aSThomas Huth 135fcf5ef2aSThomas Huth if (oe) { 136f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 137fcf5ef2aSThomas Huth } 138fcf5ef2aSThomas Huth 139fcf5ef2aSThomas Huth return rt; 140fcf5ef2aSThomas Huth } 141fcf5ef2aSThomas Huth 142fcf5ef2aSThomas Huth #endif 143fcf5ef2aSThomas Huth 144fcf5ef2aSThomas Huth 145fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 146fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */ 147fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff)) 148fcf5ef2aSThomas Huth 149b6cb41b2SDavid Gibson /* 150b6cb41b2SDavid Gibson * subtract 1 from each byte, and with inverse, check if MSB is set at each 151fcf5ef2aSThomas Huth * byte. 152fcf5ef2aSThomas Huth * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80 153fcf5ef2aSThomas Huth * (0xFF & 0xFF) & 0x80 = 0x80 (zero found) 154fcf5ef2aSThomas Huth */ 155fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80)) 156fcf5ef2aSThomas Huth 157fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */ 158fcf5ef2aSThomas Huth #define hasvalue(x, n) (haszero((x) ^ pattern(n))) 159fcf5ef2aSThomas Huth 160fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb) 161fcf5ef2aSThomas Huth { 162efa73196SNikunj A Dadhania return hasvalue(rb, ra) ? CRF_GT : 0; 163fcf5ef2aSThomas Huth } 164fcf5ef2aSThomas Huth 165fcf5ef2aSThomas Huth #undef pattern 166fcf5ef2aSThomas Huth #undef haszero 167fcf5ef2aSThomas Huth #undef hasvalue 168fcf5ef2aSThomas Huth 169b6cb41b2SDavid Gibson /* 1703f74b632SRichard Henderson * Return a random number. 171fcf5ef2aSThomas Huth */ 1723f74b632SRichard Henderson uint64_t helper_darn32(void) 173fcf5ef2aSThomas Huth { 1743f74b632SRichard Henderson Error *err = NULL; 1753f74b632SRichard Henderson uint32_t ret; 1763f74b632SRichard Henderson 1773f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1783f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1793f74b632SRichard Henderson error_get_pretty(err)); 1803f74b632SRichard Henderson error_free(err); 181fcf5ef2aSThomas Huth return -1; 182fcf5ef2aSThomas Huth } 183fcf5ef2aSThomas Huth 1843f74b632SRichard Henderson return ret; 1853f74b632SRichard Henderson } 1863f74b632SRichard Henderson 1873f74b632SRichard Henderson uint64_t helper_darn64(void) 188fcf5ef2aSThomas Huth { 1893f74b632SRichard Henderson Error *err = NULL; 1903f74b632SRichard Henderson uint64_t ret; 1913f74b632SRichard Henderson 1923f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1933f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1943f74b632SRichard Henderson error_get_pretty(err)); 1953f74b632SRichard Henderson error_free(err); 196fcf5ef2aSThomas Huth return -1; 197fcf5ef2aSThomas Huth } 198fcf5ef2aSThomas Huth 1993f74b632SRichard Henderson return ret; 2003f74b632SRichard Henderson } 201fcf5ef2aSThomas Huth 202fcf5ef2aSThomas Huth uint64_t helper_bpermd(uint64_t rs, uint64_t rb) 203fcf5ef2aSThomas Huth { 204fcf5ef2aSThomas Huth int i; 205fcf5ef2aSThomas Huth uint64_t ra = 0; 206fcf5ef2aSThomas Huth 207fcf5ef2aSThomas Huth for (i = 0; i < 8; i++) { 208fcf5ef2aSThomas Huth int index = (rs >> (i * 8)) & 0xFF; 209fcf5ef2aSThomas Huth if (index < 64) { 210a6a444a8SCédric Le Goater if (rb & PPC_BIT(index)) { 211fcf5ef2aSThomas Huth ra |= 1 << i; 212fcf5ef2aSThomas Huth } 213fcf5ef2aSThomas Huth } 214fcf5ef2aSThomas Huth } 215fcf5ef2aSThomas Huth return ra; 216fcf5ef2aSThomas Huth } 217fcf5ef2aSThomas Huth 218fcf5ef2aSThomas Huth #endif 219fcf5ef2aSThomas Huth 220fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb) 221fcf5ef2aSThomas Huth { 222fcf5ef2aSThomas Huth target_ulong mask = 0xff; 223fcf5ef2aSThomas Huth target_ulong ra = 0; 224fcf5ef2aSThomas Huth int i; 225fcf5ef2aSThomas Huth 226fcf5ef2aSThomas Huth for (i = 0; i < sizeof(target_ulong); i++) { 227fcf5ef2aSThomas Huth if ((rs & mask) == (rb & mask)) { 228fcf5ef2aSThomas Huth ra |= mask; 229fcf5ef2aSThomas Huth } 230fcf5ef2aSThomas Huth mask <<= 8; 231fcf5ef2aSThomas Huth } 232fcf5ef2aSThomas Huth return ra; 233fcf5ef2aSThomas Huth } 234fcf5ef2aSThomas Huth 235fcf5ef2aSThomas Huth /* shift right arithmetic helper */ 236fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value, 237fcf5ef2aSThomas Huth target_ulong shift) 238fcf5ef2aSThomas Huth { 239fcf5ef2aSThomas Huth int32_t ret; 240fcf5ef2aSThomas Huth 241fcf5ef2aSThomas Huth if (likely(!(shift & 0x20))) { 242fcf5ef2aSThomas Huth if (likely((uint32_t)shift != 0)) { 243fcf5ef2aSThomas Huth shift &= 0x1f; 244fcf5ef2aSThomas Huth ret = (int32_t)value >> shift; 245fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) { 246af1c259fSSandipan Das env->ca32 = env->ca = 0; 247fcf5ef2aSThomas Huth } else { 248af1c259fSSandipan Das env->ca32 = env->ca = 1; 249fcf5ef2aSThomas Huth } 250fcf5ef2aSThomas Huth } else { 251fcf5ef2aSThomas Huth ret = (int32_t)value; 252af1c259fSSandipan Das env->ca32 = env->ca = 0; 253fcf5ef2aSThomas Huth } 254fcf5ef2aSThomas Huth } else { 255fcf5ef2aSThomas Huth ret = (int32_t)value >> 31; 256af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 257fcf5ef2aSThomas Huth } 258fcf5ef2aSThomas Huth return (target_long)ret; 259fcf5ef2aSThomas Huth } 260fcf5ef2aSThomas Huth 261fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 262fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value, 263fcf5ef2aSThomas Huth target_ulong shift) 264fcf5ef2aSThomas Huth { 265fcf5ef2aSThomas Huth int64_t ret; 266fcf5ef2aSThomas Huth 267fcf5ef2aSThomas Huth if (likely(!(shift & 0x40))) { 268fcf5ef2aSThomas Huth if (likely((uint64_t)shift != 0)) { 269fcf5ef2aSThomas Huth shift &= 0x3f; 270fcf5ef2aSThomas Huth ret = (int64_t)value >> shift; 271fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) { 272af1c259fSSandipan Das env->ca32 = env->ca = 0; 273fcf5ef2aSThomas Huth } else { 274af1c259fSSandipan Das env->ca32 = env->ca = 1; 275fcf5ef2aSThomas Huth } 276fcf5ef2aSThomas Huth } else { 277fcf5ef2aSThomas Huth ret = (int64_t)value; 278af1c259fSSandipan Das env->ca32 = env->ca = 0; 279fcf5ef2aSThomas Huth } 280fcf5ef2aSThomas Huth } else { 281fcf5ef2aSThomas Huth ret = (int64_t)value >> 63; 282af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 283fcf5ef2aSThomas Huth } 284fcf5ef2aSThomas Huth return ret; 285fcf5ef2aSThomas Huth } 286fcf5ef2aSThomas Huth #endif 287fcf5ef2aSThomas Huth 288fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 289fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 290fcf5ef2aSThomas Huth { 29179770002SRichard Henderson /* Note that we don't fold past bytes */ 292fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 293fcf5ef2aSThomas Huth 0x5555555555555555ULL); 294fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 295fcf5ef2aSThomas Huth 0x3333333333333333ULL); 296fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 297fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 298fcf5ef2aSThomas Huth return val; 299fcf5ef2aSThomas Huth } 300fcf5ef2aSThomas Huth 301fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val) 302fcf5ef2aSThomas Huth { 30379770002SRichard Henderson /* Note that we don't fold past words. */ 304fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 305fcf5ef2aSThomas Huth 0x5555555555555555ULL); 306fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 307fcf5ef2aSThomas Huth 0x3333333333333333ULL); 308fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 309fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 310fcf5ef2aSThomas Huth val = (val & 0x00ff00ff00ff00ffULL) + ((val >> 8) & 311fcf5ef2aSThomas Huth 0x00ff00ff00ff00ffULL); 312fcf5ef2aSThomas Huth val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) & 313fcf5ef2aSThomas Huth 0x0000ffff0000ffffULL); 314fcf5ef2aSThomas Huth return val; 315fcf5ef2aSThomas Huth } 316fcf5ef2aSThomas Huth #else 317fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 318fcf5ef2aSThomas Huth { 31979770002SRichard Henderson /* Note that we don't fold past bytes */ 320fcf5ef2aSThomas Huth val = (val & 0x55555555) + ((val >> 1) & 0x55555555); 321fcf5ef2aSThomas Huth val = (val & 0x33333333) + ((val >> 2) & 0x33333333); 322fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f) + ((val >> 4) & 0x0f0f0f0f); 323fcf5ef2aSThomas Huth return val; 324fcf5ef2aSThomas Huth } 325fcf5ef2aSThomas Huth #endif 326fcf5ef2aSThomas Huth 327*6e0bbc40SMatheus Ferst uint64_t helper_CFUGED(uint64_t src, uint64_t mask) 32889ccd7dcSMatheus Ferst { 32989ccd7dcSMatheus Ferst /* 33089ccd7dcSMatheus Ferst * Instead of processing the mask bit-by-bit from the most significant to 33189ccd7dcSMatheus Ferst * the least significant bit, as described in PowerISA, we'll handle it in 33289ccd7dcSMatheus Ferst * blocks of 'n' zeros/ones from LSB to MSB. To avoid the decision to use 33389ccd7dcSMatheus Ferst * ctz or cto, we negate the mask at the end of the loop. 33489ccd7dcSMatheus Ferst */ 33589ccd7dcSMatheus Ferst target_ulong m, left = 0, right = 0; 33689ccd7dcSMatheus Ferst unsigned int n, i = 64; 33789ccd7dcSMatheus Ferst bool bit = false; /* tracks if we are processing zeros or ones */ 33889ccd7dcSMatheus Ferst 33989ccd7dcSMatheus Ferst if (mask == 0 || mask == -1) { 34089ccd7dcSMatheus Ferst return src; 34189ccd7dcSMatheus Ferst } 34289ccd7dcSMatheus Ferst 34389ccd7dcSMatheus Ferst /* Processes the mask in blocks, from LSB to MSB */ 34489ccd7dcSMatheus Ferst while (i) { 34589ccd7dcSMatheus Ferst /* Find how many bits we should take */ 34689ccd7dcSMatheus Ferst n = ctz64(mask); 34789ccd7dcSMatheus Ferst if (n > i) { 34889ccd7dcSMatheus Ferst n = i; 34989ccd7dcSMatheus Ferst } 35089ccd7dcSMatheus Ferst 35189ccd7dcSMatheus Ferst /* 35289ccd7dcSMatheus Ferst * Extracts 'n' trailing bits of src and put them on the leading 'n' 35389ccd7dcSMatheus Ferst * bits of 'right' or 'left', pushing down the previously extracted 35489ccd7dcSMatheus Ferst * values. 35589ccd7dcSMatheus Ferst */ 35689ccd7dcSMatheus Ferst m = (1ll << n) - 1; 35789ccd7dcSMatheus Ferst if (bit) { 35889ccd7dcSMatheus Ferst right = ror64(right | (src & m), n); 35989ccd7dcSMatheus Ferst } else { 36089ccd7dcSMatheus Ferst left = ror64(left | (src & m), n); 36189ccd7dcSMatheus Ferst } 36289ccd7dcSMatheus Ferst 36389ccd7dcSMatheus Ferst /* 36489ccd7dcSMatheus Ferst * Discards the processed bits from 'src' and 'mask'. Note that we are 36589ccd7dcSMatheus Ferst * removing 'n' trailing zeros from 'mask', but the logical shift will 36689ccd7dcSMatheus Ferst * add 'n' leading zeros back, so the population count of 'mask' is kept 36789ccd7dcSMatheus Ferst * the same. 36889ccd7dcSMatheus Ferst */ 36989ccd7dcSMatheus Ferst src >>= n; 37089ccd7dcSMatheus Ferst mask >>= n; 37189ccd7dcSMatheus Ferst i -= n; 37289ccd7dcSMatheus Ferst bit = !bit; 37389ccd7dcSMatheus Ferst mask = ~mask; 37489ccd7dcSMatheus Ferst } 37589ccd7dcSMatheus Ferst 37689ccd7dcSMatheus Ferst /* 37789ccd7dcSMatheus Ferst * At the end, right was ror'ed ctpop(mask) times. To put it back in place, 37889ccd7dcSMatheus Ferst * we'll shift it more 64-ctpop(mask) times. 37989ccd7dcSMatheus Ferst */ 38089ccd7dcSMatheus Ferst if (bit) { 38189ccd7dcSMatheus Ferst n = ctpop64(mask); 38289ccd7dcSMatheus Ferst } else { 38389ccd7dcSMatheus Ferst n = 64 - ctpop64(mask); 38489ccd7dcSMatheus Ferst } 38589ccd7dcSMatheus Ferst 38689ccd7dcSMatheus Ferst return left | (right >> n); 38789ccd7dcSMatheus Ferst } 38889ccd7dcSMatheus Ferst 38921ba6e58SMatheus Ferst #if defined(TARGET_PPC64) 39021ba6e58SMatheus Ferst uint64_t helper_PDEPD(uint64_t src, uint64_t mask) 39121ba6e58SMatheus Ferst { 39221ba6e58SMatheus Ferst int i, o; 39321ba6e58SMatheus Ferst uint64_t result = 0; 39421ba6e58SMatheus Ferst 39521ba6e58SMatheus Ferst if (mask == -1) { 39621ba6e58SMatheus Ferst return src; 39721ba6e58SMatheus Ferst } 39821ba6e58SMatheus Ferst 39921ba6e58SMatheus Ferst for (i = 0; mask != 0; i++) { 40021ba6e58SMatheus Ferst o = ctz64(mask); 40121ba6e58SMatheus Ferst mask &= mask - 1; 40221ba6e58SMatheus Ferst result |= ((src >> i) & 1) << o; 40321ba6e58SMatheus Ferst } 40421ba6e58SMatheus Ferst 40521ba6e58SMatheus Ferst return result; 40621ba6e58SMatheus Ferst } 4078bdb7606SMatheus Ferst 4088bdb7606SMatheus Ferst uint64_t helper_PEXTD(uint64_t src, uint64_t mask) 4098bdb7606SMatheus Ferst { 4108bdb7606SMatheus Ferst int i, o; 4118bdb7606SMatheus Ferst uint64_t result = 0; 4128bdb7606SMatheus Ferst 4138bdb7606SMatheus Ferst if (mask == -1) { 4148bdb7606SMatheus Ferst return src; 4158bdb7606SMatheus Ferst } 4168bdb7606SMatheus Ferst 4178bdb7606SMatheus Ferst for (o = 0; mask != 0; o++) { 4188bdb7606SMatheus Ferst i = ctz64(mask); 4198bdb7606SMatheus Ferst mask &= mask - 1; 4208bdb7606SMatheus Ferst result |= ((src >> i) & 1) << o; 4218bdb7606SMatheus Ferst } 4228bdb7606SMatheus Ferst 4238bdb7606SMatheus Ferst return result; 4248bdb7606SMatheus Ferst } 42521ba6e58SMatheus Ferst #endif 42621ba6e58SMatheus Ferst 427fcf5ef2aSThomas Huth /*****************************************************************************/ 428fcf5ef2aSThomas Huth /* PowerPC 601 specific instructions (POWER bridge) */ 429fcf5ef2aSThomas Huth target_ulong helper_div(CPUPPCState *env, target_ulong arg1, target_ulong arg2) 430fcf5ef2aSThomas Huth { 431fcf5ef2aSThomas Huth uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ]; 432fcf5ef2aSThomas Huth 433fcf5ef2aSThomas Huth if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 434fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 435fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 436fcf5ef2aSThomas Huth return INT32_MIN; 437fcf5ef2aSThomas Huth } else { 438fcf5ef2aSThomas Huth env->spr[SPR_MQ] = tmp % arg2; 439fcf5ef2aSThomas Huth return tmp / (int32_t)arg2; 440fcf5ef2aSThomas Huth } 441fcf5ef2aSThomas Huth } 442fcf5ef2aSThomas Huth 443fcf5ef2aSThomas Huth target_ulong helper_divo(CPUPPCState *env, target_ulong arg1, 444fcf5ef2aSThomas Huth target_ulong arg2) 445fcf5ef2aSThomas Huth { 446fcf5ef2aSThomas Huth uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ]; 447fcf5ef2aSThomas Huth 448fcf5ef2aSThomas Huth if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 449fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 450fcf5ef2aSThomas Huth env->so = env->ov = 1; 451fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 452fcf5ef2aSThomas Huth return INT32_MIN; 453fcf5ef2aSThomas Huth } else { 454fcf5ef2aSThomas Huth env->spr[SPR_MQ] = tmp % arg2; 455fcf5ef2aSThomas Huth tmp /= (int32_t)arg2; 456fcf5ef2aSThomas Huth if ((int32_t)tmp != tmp) { 457fcf5ef2aSThomas Huth env->so = env->ov = 1; 458fcf5ef2aSThomas Huth } else { 459fcf5ef2aSThomas Huth env->ov = 0; 460fcf5ef2aSThomas Huth } 461fcf5ef2aSThomas Huth return tmp; 462fcf5ef2aSThomas Huth } 463fcf5ef2aSThomas Huth } 464fcf5ef2aSThomas Huth 465fcf5ef2aSThomas Huth target_ulong helper_divs(CPUPPCState *env, target_ulong arg1, 466fcf5ef2aSThomas Huth target_ulong arg2) 467fcf5ef2aSThomas Huth { 468fcf5ef2aSThomas Huth if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 469fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 470fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 471fcf5ef2aSThomas Huth return INT32_MIN; 472fcf5ef2aSThomas Huth } else { 473fcf5ef2aSThomas Huth env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2; 474fcf5ef2aSThomas Huth return (int32_t)arg1 / (int32_t)arg2; 475fcf5ef2aSThomas Huth } 476fcf5ef2aSThomas Huth } 477fcf5ef2aSThomas Huth 478fcf5ef2aSThomas Huth target_ulong helper_divso(CPUPPCState *env, target_ulong arg1, 479fcf5ef2aSThomas Huth target_ulong arg2) 480fcf5ef2aSThomas Huth { 481fcf5ef2aSThomas Huth if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 482fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 483fcf5ef2aSThomas Huth env->so = env->ov = 1; 484fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 485fcf5ef2aSThomas Huth return INT32_MIN; 486fcf5ef2aSThomas Huth } else { 487fcf5ef2aSThomas Huth env->ov = 0; 488fcf5ef2aSThomas Huth env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2; 489fcf5ef2aSThomas Huth return (int32_t)arg1 / (int32_t)arg2; 490fcf5ef2aSThomas Huth } 491fcf5ef2aSThomas Huth } 492fcf5ef2aSThomas Huth 493fcf5ef2aSThomas Huth /*****************************************************************************/ 494fcf5ef2aSThomas Huth /* 602 specific instructions */ 495fcf5ef2aSThomas Huth /* mfrom is the most crazy instruction ever seen, imho ! */ 496fcf5ef2aSThomas Huth /* Real implementation uses a ROM table. Do the same */ 497b6cb41b2SDavid Gibson /* 498b6cb41b2SDavid Gibson * Extremely decomposed: 499fcf5ef2aSThomas Huth * -arg / 256 500fcf5ef2aSThomas Huth * return 256 * log10(10 + 1.0) + 0.5 501fcf5ef2aSThomas Huth */ 502fcf5ef2aSThomas Huth #if !defined(CONFIG_USER_ONLY) 503fcf5ef2aSThomas Huth target_ulong helper_602_mfrom(target_ulong arg) 504fcf5ef2aSThomas Huth { 505fcf5ef2aSThomas Huth if (likely(arg < 602)) { 506139c1837SPaolo Bonzini #include "mfrom_table.c.inc" 507fcf5ef2aSThomas Huth return mfrom_ROM_table[arg]; 508fcf5ef2aSThomas Huth } else { 509fcf5ef2aSThomas Huth return 0; 510fcf5ef2aSThomas Huth } 511fcf5ef2aSThomas Huth } 512fcf5ef2aSThomas Huth #endif 513fcf5ef2aSThomas Huth 514fcf5ef2aSThomas Huth /*****************************************************************************/ 515fcf5ef2aSThomas Huth /* Altivec extension helpers */ 516fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 517fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 518fcf5ef2aSThomas Huth for (index = 0; index < ARRAY_SIZE(r->element); index++) 519fcf5ef2aSThomas Huth #else 520fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 521fcf5ef2aSThomas Huth for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--) 522fcf5ef2aSThomas Huth #endif 523fcf5ef2aSThomas Huth 524fcf5ef2aSThomas Huth /* Saturating arithmetic helpers. */ 525fcf5ef2aSThomas Huth #define SATCVT(from, to, from_type, to_type, min, max) \ 526fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 527fcf5ef2aSThomas Huth { \ 528fcf5ef2aSThomas Huth to_type r; \ 529fcf5ef2aSThomas Huth \ 530fcf5ef2aSThomas Huth if (x < (from_type)min) { \ 531fcf5ef2aSThomas Huth r = min; \ 532fcf5ef2aSThomas Huth *sat = 1; \ 533fcf5ef2aSThomas Huth } else if (x > (from_type)max) { \ 534fcf5ef2aSThomas Huth r = max; \ 535fcf5ef2aSThomas Huth *sat = 1; \ 536fcf5ef2aSThomas Huth } else { \ 537fcf5ef2aSThomas Huth r = x; \ 538fcf5ef2aSThomas Huth } \ 539fcf5ef2aSThomas Huth return r; \ 540fcf5ef2aSThomas Huth } 541fcf5ef2aSThomas Huth #define SATCVTU(from, to, from_type, to_type, min, max) \ 542fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 543fcf5ef2aSThomas Huth { \ 544fcf5ef2aSThomas Huth to_type r; \ 545fcf5ef2aSThomas Huth \ 546fcf5ef2aSThomas Huth if (x > (from_type)max) { \ 547fcf5ef2aSThomas Huth r = max; \ 548fcf5ef2aSThomas Huth *sat = 1; \ 549fcf5ef2aSThomas Huth } else { \ 550fcf5ef2aSThomas Huth r = x; \ 551fcf5ef2aSThomas Huth } \ 552fcf5ef2aSThomas Huth return r; \ 553fcf5ef2aSThomas Huth } 554fcf5ef2aSThomas Huth SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX) 555fcf5ef2aSThomas Huth SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX) 556fcf5ef2aSThomas Huth SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX) 557fcf5ef2aSThomas Huth 558fcf5ef2aSThomas Huth SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX) 559fcf5ef2aSThomas Huth SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX) 560fcf5ef2aSThomas Huth SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX) 561fcf5ef2aSThomas Huth SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX) 562fcf5ef2aSThomas Huth SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX) 563fcf5ef2aSThomas Huth SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX) 564fcf5ef2aSThomas Huth #undef SATCVT 565fcf5ef2aSThomas Huth #undef SATCVTU 566fcf5ef2aSThomas Huth 567dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr) 568fcf5ef2aSThomas Huth { 569c19940dbSBruno Larsen (billionai) ppc_store_vscr(env, vscr); 570fcf5ef2aSThomas Huth } 571fcf5ef2aSThomas Huth 572cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env) 573cc2b90d7SRichard Henderson { 574c19940dbSBruno Larsen (billionai) return ppc_get_vscr(env); 575cc2b90d7SRichard Henderson } 576cc2b90d7SRichard Henderson 5776175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env) 5786175f5a0SRichard Henderson { 5799b5b74daSRichard Henderson /* The choice of non-zero value is arbitrary. */ 5809b5b74daSRichard Henderson env->vscr_sat.u32[0] = 1; 5816175f5a0SRichard Henderson } 5826175f5a0SRichard Henderson 583fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 584fcf5ef2aSThomas Huth { 585fcf5ef2aSThomas Huth int i; 586fcf5ef2aSThomas Huth 587fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 588fcf5ef2aSThomas Huth r->u32[i] = ~a->u32[i] < b->u32[i]; 589fcf5ef2aSThomas Huth } 590fcf5ef2aSThomas Huth } 591fcf5ef2aSThomas Huth 592fcf5ef2aSThomas Huth /* vprtybw */ 593fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b) 594fcf5ef2aSThomas Huth { 595fcf5ef2aSThomas Huth int i; 596fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 597fcf5ef2aSThomas Huth uint64_t res = b->u32[i] ^ (b->u32[i] >> 16); 598fcf5ef2aSThomas Huth res ^= res >> 8; 599fcf5ef2aSThomas Huth r->u32[i] = res & 1; 600fcf5ef2aSThomas Huth } 601fcf5ef2aSThomas Huth } 602fcf5ef2aSThomas Huth 603fcf5ef2aSThomas Huth /* vprtybd */ 604fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b) 605fcf5ef2aSThomas Huth { 606fcf5ef2aSThomas Huth int i; 607fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 608fcf5ef2aSThomas Huth uint64_t res = b->u64[i] ^ (b->u64[i] >> 32); 609fcf5ef2aSThomas Huth res ^= res >> 16; 610fcf5ef2aSThomas Huth res ^= res >> 8; 611fcf5ef2aSThomas Huth r->u64[i] = res & 1; 612fcf5ef2aSThomas Huth } 613fcf5ef2aSThomas Huth } 614fcf5ef2aSThomas Huth 615fcf5ef2aSThomas Huth /* vprtybq */ 616fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b) 617fcf5ef2aSThomas Huth { 618fcf5ef2aSThomas Huth uint64_t res = b->u64[0] ^ b->u64[1]; 619fcf5ef2aSThomas Huth res ^= res >> 32; 620fcf5ef2aSThomas Huth res ^= res >> 16; 621fcf5ef2aSThomas Huth res ^= res >> 8; 6223c385a93SMark Cave-Ayland r->VsrD(1) = res & 1; 6233c385a93SMark Cave-Ayland r->VsrD(0) = 0; 624fcf5ef2aSThomas Huth } 625fcf5ef2aSThomas Huth 626fcf5ef2aSThomas Huth #define VARITHFP(suffix, func) \ 627fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 628fcf5ef2aSThomas Huth ppc_avr_t *b) \ 629fcf5ef2aSThomas Huth { \ 630fcf5ef2aSThomas Huth int i; \ 631fcf5ef2aSThomas Huth \ 63205ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 63305ee3e8aSMark Cave-Ayland r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status); \ 634fcf5ef2aSThomas Huth } \ 635fcf5ef2aSThomas Huth } 636fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add) 637fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub) 638fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min) 639fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max) 640fcf5ef2aSThomas Huth #undef VARITHFP 641fcf5ef2aSThomas Huth 642fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type) \ 643fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 644fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) \ 645fcf5ef2aSThomas Huth { \ 646fcf5ef2aSThomas Huth int i; \ 64705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 64805ee3e8aSMark Cave-Ayland r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \ 649fcf5ef2aSThomas Huth type, &env->vec_status); \ 650fcf5ef2aSThomas Huth } \ 651fcf5ef2aSThomas Huth } 652fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0); 653fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c); 654fcf5ef2aSThomas Huth #undef VARITHFPFMA 655fcf5ef2aSThomas Huth 656fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element) \ 657fcf5ef2aSThomas Huth { \ 658fcf5ef2aSThomas Huth type result = (type)a->element[i] op (type)b->element[i]; \ 659fcf5ef2aSThomas Huth r->element[i] = cvt(result, &sat); \ 660fcf5ef2aSThomas Huth } 661fcf5ef2aSThomas Huth 662fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element) \ 663fb11ae7dSRichard Henderson void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat, \ 664fb11ae7dSRichard Henderson ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \ 665fcf5ef2aSThomas Huth { \ 666fcf5ef2aSThomas Huth int sat = 0; \ 667fcf5ef2aSThomas Huth int i; \ 668fcf5ef2aSThomas Huth \ 669fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 670fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 671fcf5ef2aSThomas Huth } \ 672fcf5ef2aSThomas Huth if (sat) { \ 673fb11ae7dSRichard Henderson vscr_sat->u32[0] = 1; \ 674fcf5ef2aSThomas Huth } \ 675fcf5ef2aSThomas Huth } 676fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt) \ 677fcf5ef2aSThomas Huth VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element) \ 678fcf5ef2aSThomas Huth VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element) 679fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt) \ 680fcf5ef2aSThomas Huth VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element) \ 681fcf5ef2aSThomas Huth VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element) 682fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb) 683fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh) 684fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw) 685fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub) 686fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh) 687fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw) 688fcf5ef2aSThomas Huth #undef VARITHSAT_CASE 689fcf5ef2aSThomas Huth #undef VARITHSAT_DO 690fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED 691fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED 692fcf5ef2aSThomas Huth 693fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype) \ 694fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 695fcf5ef2aSThomas Huth { \ 696fcf5ef2aSThomas Huth int i; \ 697fcf5ef2aSThomas Huth \ 698fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 699fcf5ef2aSThomas Huth etype x = (etype)a->element[i] + (etype)b->element[i] + 1; \ 700fcf5ef2aSThomas Huth r->element[i] = x >> 1; \ 701fcf5ef2aSThomas Huth } \ 702fcf5ef2aSThomas Huth } 703fcf5ef2aSThomas Huth 704fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element, \ 705fcf5ef2aSThomas Huth unsigned_type) \ 706fcf5ef2aSThomas Huth VAVG_DO(avgs##type, signed_element, signed_type) \ 707fcf5ef2aSThomas Huth VAVG_DO(avgu##type, unsigned_element, unsigned_type) 708fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t) 709fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t) 710fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t) 711fcf5ef2aSThomas Huth #undef VAVG_DO 712fcf5ef2aSThomas Huth #undef VAVG 713fcf5ef2aSThomas Huth 714fcf5ef2aSThomas Huth #define VABSDU_DO(name, element) \ 715fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 716fcf5ef2aSThomas Huth { \ 717fcf5ef2aSThomas Huth int i; \ 718fcf5ef2aSThomas Huth \ 719fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 720fcf5ef2aSThomas Huth r->element[i] = (a->element[i] > b->element[i]) ? \ 721fcf5ef2aSThomas Huth (a->element[i] - b->element[i]) : \ 722fcf5ef2aSThomas Huth (b->element[i] - a->element[i]); \ 723fcf5ef2aSThomas Huth } \ 724fcf5ef2aSThomas Huth } 725fcf5ef2aSThomas Huth 726b6cb41b2SDavid Gibson /* 727b6cb41b2SDavid Gibson * VABSDU - Vector absolute difference unsigned 728fcf5ef2aSThomas Huth * name - instruction mnemonic suffix (b: byte, h: halfword, w: word) 729fcf5ef2aSThomas Huth * element - element type to access from vector 730fcf5ef2aSThomas Huth */ 731fcf5ef2aSThomas Huth #define VABSDU(type, element) \ 732fcf5ef2aSThomas Huth VABSDU_DO(absdu##type, element) 733fcf5ef2aSThomas Huth VABSDU(b, u8) 734fcf5ef2aSThomas Huth VABSDU(h, u16) 735fcf5ef2aSThomas Huth VABSDU(w, u32) 736fcf5ef2aSThomas Huth #undef VABSDU_DO 737fcf5ef2aSThomas Huth #undef VABSDU 738fcf5ef2aSThomas Huth 739fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element) \ 740fcf5ef2aSThomas Huth void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r, \ 741fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 742fcf5ef2aSThomas Huth { \ 743fcf5ef2aSThomas Huth int i; \ 744fcf5ef2aSThomas Huth \ 74505ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 746fcf5ef2aSThomas Huth float32 t = cvt(b->element[i], &env->vec_status); \ 74705ee3e8aSMark Cave-Ayland r->f32[i] = float32_scalbn(t, -uim, &env->vec_status); \ 748fcf5ef2aSThomas Huth } \ 749fcf5ef2aSThomas Huth } 750fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32) 751fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32) 752fcf5ef2aSThomas Huth #undef VCF 753fcf5ef2aSThomas Huth 754fcf5ef2aSThomas Huth #define VCMP_DO(suffix, compare, element, record) \ 755fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 756fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 757fcf5ef2aSThomas Huth { \ 758fcf5ef2aSThomas Huth uint64_t ones = (uint64_t)-1; \ 759fcf5ef2aSThomas Huth uint64_t all = ones; \ 760fcf5ef2aSThomas Huth uint64_t none = 0; \ 761fcf5ef2aSThomas Huth int i; \ 762fcf5ef2aSThomas Huth \ 763fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 764fcf5ef2aSThomas Huth uint64_t result = (a->element[i] compare b->element[i] ? \ 765fcf5ef2aSThomas Huth ones : 0x0); \ 766fcf5ef2aSThomas Huth switch (sizeof(a->element[0])) { \ 767fcf5ef2aSThomas Huth case 8: \ 768fcf5ef2aSThomas Huth r->u64[i] = result; \ 769fcf5ef2aSThomas Huth break; \ 770fcf5ef2aSThomas Huth case 4: \ 771fcf5ef2aSThomas Huth r->u32[i] = result; \ 772fcf5ef2aSThomas Huth break; \ 773fcf5ef2aSThomas Huth case 2: \ 774fcf5ef2aSThomas Huth r->u16[i] = result; \ 775fcf5ef2aSThomas Huth break; \ 776fcf5ef2aSThomas Huth case 1: \ 777fcf5ef2aSThomas Huth r->u8[i] = result; \ 778fcf5ef2aSThomas Huth break; \ 779fcf5ef2aSThomas Huth } \ 780fcf5ef2aSThomas Huth all &= result; \ 781fcf5ef2aSThomas Huth none |= result; \ 782fcf5ef2aSThomas Huth } \ 783fcf5ef2aSThomas Huth if (record) { \ 784fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 785fcf5ef2aSThomas Huth } \ 786fcf5ef2aSThomas Huth } 787fcf5ef2aSThomas Huth #define VCMP(suffix, compare, element) \ 788fcf5ef2aSThomas Huth VCMP_DO(suffix, compare, element, 0) \ 789fcf5ef2aSThomas Huth VCMP_DO(suffix##_dot, compare, element, 1) 790fcf5ef2aSThomas Huth VCMP(equb, ==, u8) 791fcf5ef2aSThomas Huth VCMP(equh, ==, u16) 792fcf5ef2aSThomas Huth VCMP(equw, ==, u32) 793fcf5ef2aSThomas Huth VCMP(equd, ==, u64) 794fcf5ef2aSThomas Huth VCMP(gtub, >, u8) 795fcf5ef2aSThomas Huth VCMP(gtuh, >, u16) 796fcf5ef2aSThomas Huth VCMP(gtuw, >, u32) 797fcf5ef2aSThomas Huth VCMP(gtud, >, u64) 798fcf5ef2aSThomas Huth VCMP(gtsb, >, s8) 799fcf5ef2aSThomas Huth VCMP(gtsh, >, s16) 800fcf5ef2aSThomas Huth VCMP(gtsw, >, s32) 801fcf5ef2aSThomas Huth VCMP(gtsd, >, s64) 802fcf5ef2aSThomas Huth #undef VCMP_DO 803fcf5ef2aSThomas Huth #undef VCMP 804fcf5ef2aSThomas Huth 805fcf5ef2aSThomas Huth #define VCMPNE_DO(suffix, element, etype, cmpzero, record) \ 806fcf5ef2aSThomas Huth void helper_vcmpne##suffix(CPUPPCState *env, ppc_avr_t *r, \ 807fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 808fcf5ef2aSThomas Huth { \ 809fcf5ef2aSThomas Huth etype ones = (etype)-1; \ 810fcf5ef2aSThomas Huth etype all = ones; \ 811fcf5ef2aSThomas Huth etype result, none = 0; \ 812fcf5ef2aSThomas Huth int i; \ 813fcf5ef2aSThomas Huth \ 814fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 815fcf5ef2aSThomas Huth if (cmpzero) { \ 816fcf5ef2aSThomas Huth result = ((a->element[i] == 0) \ 817fcf5ef2aSThomas Huth || (b->element[i] == 0) \ 818fcf5ef2aSThomas Huth || (a->element[i] != b->element[i]) ? \ 819fcf5ef2aSThomas Huth ones : 0x0); \ 820fcf5ef2aSThomas Huth } else { \ 821fcf5ef2aSThomas Huth result = (a->element[i] != b->element[i]) ? ones : 0x0; \ 822fcf5ef2aSThomas Huth } \ 823fcf5ef2aSThomas Huth r->element[i] = result; \ 824fcf5ef2aSThomas Huth all &= result; \ 825fcf5ef2aSThomas Huth none |= result; \ 826fcf5ef2aSThomas Huth } \ 827fcf5ef2aSThomas Huth if (record) { \ 828fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 829fcf5ef2aSThomas Huth } \ 830fcf5ef2aSThomas Huth } 831fcf5ef2aSThomas Huth 832b6cb41b2SDavid Gibson /* 833b6cb41b2SDavid Gibson * VCMPNEZ - Vector compare not equal to zero 834fcf5ef2aSThomas Huth * suffix - instruction mnemonic suffix (b: byte, h: halfword, w: word) 835fcf5ef2aSThomas Huth * element - element type to access from vector 836fcf5ef2aSThomas Huth */ 837fcf5ef2aSThomas Huth #define VCMPNE(suffix, element, etype, cmpzero) \ 838fcf5ef2aSThomas Huth VCMPNE_DO(suffix, element, etype, cmpzero, 0) \ 839fcf5ef2aSThomas Huth VCMPNE_DO(suffix##_dot, element, etype, cmpzero, 1) 840fcf5ef2aSThomas Huth VCMPNE(zb, u8, uint8_t, 1) 841fcf5ef2aSThomas Huth VCMPNE(zh, u16, uint16_t, 1) 842fcf5ef2aSThomas Huth VCMPNE(zw, u32, uint32_t, 1) 843fcf5ef2aSThomas Huth VCMPNE(b, u8, uint8_t, 0) 844fcf5ef2aSThomas Huth VCMPNE(h, u16, uint16_t, 0) 845fcf5ef2aSThomas Huth VCMPNE(w, u32, uint32_t, 0) 846fcf5ef2aSThomas Huth #undef VCMPNE_DO 847fcf5ef2aSThomas Huth #undef VCMPNE 848fcf5ef2aSThomas Huth 849fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record) \ 850fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 851fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 852fcf5ef2aSThomas Huth { \ 853fcf5ef2aSThomas Huth uint32_t ones = (uint32_t)-1; \ 854fcf5ef2aSThomas Huth uint32_t all = ones; \ 855fcf5ef2aSThomas Huth uint32_t none = 0; \ 856fcf5ef2aSThomas Huth int i; \ 857fcf5ef2aSThomas Huth \ 85805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 859fcf5ef2aSThomas Huth uint32_t result; \ 86071bfd65cSRichard Henderson FloatRelation rel = \ 86171bfd65cSRichard Henderson float32_compare_quiet(a->f32[i], b->f32[i], \ 862fcf5ef2aSThomas Huth &env->vec_status); \ 863fcf5ef2aSThomas Huth if (rel == float_relation_unordered) { \ 864fcf5ef2aSThomas Huth result = 0; \ 865fcf5ef2aSThomas Huth } else if (rel compare order) { \ 866fcf5ef2aSThomas Huth result = ones; \ 867fcf5ef2aSThomas Huth } else { \ 868fcf5ef2aSThomas Huth result = 0; \ 869fcf5ef2aSThomas Huth } \ 870fcf5ef2aSThomas Huth r->u32[i] = result; \ 871fcf5ef2aSThomas Huth all &= result; \ 872fcf5ef2aSThomas Huth none |= result; \ 873fcf5ef2aSThomas Huth } \ 874fcf5ef2aSThomas Huth if (record) { \ 875fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 876fcf5ef2aSThomas Huth } \ 877fcf5ef2aSThomas Huth } 878fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order) \ 879fcf5ef2aSThomas Huth VCMPFP_DO(suffix, compare, order, 0) \ 880fcf5ef2aSThomas Huth VCMPFP_DO(suffix##_dot, compare, order, 1) 881fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal) 882fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less) 883fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater) 884fcf5ef2aSThomas Huth #undef VCMPFP_DO 885fcf5ef2aSThomas Huth #undef VCMPFP 886fcf5ef2aSThomas Huth 887fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r, 888fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b, int record) 889fcf5ef2aSThomas Huth { 890fcf5ef2aSThomas Huth int i; 891fcf5ef2aSThomas Huth int all_in = 0; 892fcf5ef2aSThomas Huth 89305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 89471bfd65cSRichard Henderson FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i], 89505ee3e8aSMark Cave-Ayland &env->vec_status); 896fcf5ef2aSThomas Huth if (le_rel == float_relation_unordered) { 897fcf5ef2aSThomas Huth r->u32[i] = 0xc0000000; 898fcf5ef2aSThomas Huth all_in = 1; 899fcf5ef2aSThomas Huth } else { 90005ee3e8aSMark Cave-Ayland float32 bneg = float32_chs(b->f32[i]); 90171bfd65cSRichard Henderson FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg, 90205ee3e8aSMark Cave-Ayland &env->vec_status); 903fcf5ef2aSThomas Huth int le = le_rel != float_relation_greater; 904fcf5ef2aSThomas Huth int ge = ge_rel != float_relation_less; 905fcf5ef2aSThomas Huth 906fcf5ef2aSThomas Huth r->u32[i] = ((!le) << 31) | ((!ge) << 30); 907fcf5ef2aSThomas Huth all_in |= (!le | !ge); 908fcf5ef2aSThomas Huth } 909fcf5ef2aSThomas Huth } 910fcf5ef2aSThomas Huth if (record) { 911fcf5ef2aSThomas Huth env->crf[6] = (all_in == 0) << 1; 912fcf5ef2aSThomas Huth } 913fcf5ef2aSThomas Huth } 914fcf5ef2aSThomas Huth 915fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 916fcf5ef2aSThomas Huth { 917fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 0); 918fcf5ef2aSThomas Huth } 919fcf5ef2aSThomas Huth 920fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 921fcf5ef2aSThomas Huth ppc_avr_t *b) 922fcf5ef2aSThomas Huth { 923fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 1); 924fcf5ef2aSThomas Huth } 925fcf5ef2aSThomas Huth 926fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element) \ 927fcf5ef2aSThomas Huth void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r, \ 928fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 929fcf5ef2aSThomas Huth { \ 930fcf5ef2aSThomas Huth int i; \ 931fcf5ef2aSThomas Huth int sat = 0; \ 932fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 933fcf5ef2aSThomas Huth \ 934fcf5ef2aSThomas Huth set_float_rounding_mode(float_round_to_zero, &s); \ 93505ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 93605ee3e8aSMark Cave-Ayland if (float32_is_any_nan(b->f32[i])) { \ 937fcf5ef2aSThomas Huth r->element[i] = 0; \ 938fcf5ef2aSThomas Huth } else { \ 93905ee3e8aSMark Cave-Ayland float64 t = float32_to_float64(b->f32[i], &s); \ 940fcf5ef2aSThomas Huth int64_t j; \ 941fcf5ef2aSThomas Huth \ 942fcf5ef2aSThomas Huth t = float64_scalbn(t, uim, &s); \ 943fcf5ef2aSThomas Huth j = float64_to_int64(t, &s); \ 944fcf5ef2aSThomas Huth r->element[i] = satcvt(j, &sat); \ 945fcf5ef2aSThomas Huth } \ 946fcf5ef2aSThomas Huth } \ 947fcf5ef2aSThomas Huth if (sat) { \ 9486175f5a0SRichard Henderson set_vscr_sat(env); \ 949fcf5ef2aSThomas Huth } \ 950fcf5ef2aSThomas Huth } 951fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32) 952fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32) 953fcf5ef2aSThomas Huth #undef VCT 954fcf5ef2aSThomas Huth 955fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r) 956fcf5ef2aSThomas Huth { 957fcf5ef2aSThomas Huth target_ulong count = 0; 958fcf5ef2aSThomas Huth int i; 95960594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 96060594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 961fcf5ef2aSThomas Huth break; 962fcf5ef2aSThomas Huth } 963fcf5ef2aSThomas Huth count++; 964fcf5ef2aSThomas Huth } 965fcf5ef2aSThomas Huth return count; 966fcf5ef2aSThomas Huth } 967fcf5ef2aSThomas Huth 968fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r) 969fcf5ef2aSThomas Huth { 970fcf5ef2aSThomas Huth target_ulong count = 0; 971fcf5ef2aSThomas Huth int i; 972fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 97360594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 974fcf5ef2aSThomas Huth break; 975fcf5ef2aSThomas Huth } 976fcf5ef2aSThomas Huth count++; 977fcf5ef2aSThomas Huth } 978fcf5ef2aSThomas Huth return count; 979fcf5ef2aSThomas Huth } 980fcf5ef2aSThomas Huth 981fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 982fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 983fcf5ef2aSThomas Huth { 984fcf5ef2aSThomas Huth int sat = 0; 985fcf5ef2aSThomas Huth int i; 986fcf5ef2aSThomas Huth 987fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 988fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 989fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 990fcf5ef2aSThomas Huth 991fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 992fcf5ef2aSThomas Huth } 993fcf5ef2aSThomas Huth 994fcf5ef2aSThomas Huth if (sat) { 9956175f5a0SRichard Henderson set_vscr_sat(env); 996fcf5ef2aSThomas Huth } 997fcf5ef2aSThomas Huth } 998fcf5ef2aSThomas Huth 999fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1000fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1001fcf5ef2aSThomas Huth { 1002fcf5ef2aSThomas Huth int sat = 0; 1003fcf5ef2aSThomas Huth int i; 1004fcf5ef2aSThomas Huth 1005fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1006fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i] + 0x00004000; 1007fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 1008fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 1009fcf5ef2aSThomas Huth } 1010fcf5ef2aSThomas Huth 1011fcf5ef2aSThomas Huth if (sat) { 10126175f5a0SRichard Henderson set_vscr_sat(env); 1013fcf5ef2aSThomas Huth } 1014fcf5ef2aSThomas Huth } 1015fcf5ef2aSThomas Huth 1016fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1017fcf5ef2aSThomas Huth { 1018fcf5ef2aSThomas Huth int i; 1019fcf5ef2aSThomas Huth 1020fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1021fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 1022fcf5ef2aSThomas Huth r->s16[i] = (int16_t) (prod + c->s16[i]); 1023fcf5ef2aSThomas Huth } 1024fcf5ef2aSThomas Huth } 1025fcf5ef2aSThomas Huth 1026d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs) \ 1027fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1028fcf5ef2aSThomas Huth { \ 1029fcf5ef2aSThomas Huth ppc_avr_t result; \ 1030d81c2040SMark Cave-Ayland int i, half = ARRAY_SIZE(r->element) / 2; \ 1031fcf5ef2aSThomas Huth \ 1032d81c2040SMark Cave-Ayland for (i = 0; i < half; i++) { \ 1033d81c2040SMark Cave-Ayland result.access(i * 2 + 0) = a->access(i + ofs); \ 1034d81c2040SMark Cave-Ayland result.access(i * 2 + 1) = b->access(i + ofs); \ 1035fcf5ef2aSThomas Huth } \ 1036fcf5ef2aSThomas Huth *r = result; \ 1037fcf5ef2aSThomas Huth } 1038d81c2040SMark Cave-Ayland 1039d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access) \ 1040d81c2040SMark Cave-Ayland VMRG_DO(mrgl##suffix, element, access, half) \ 1041d81c2040SMark Cave-Ayland VMRG_DO(mrgh##suffix, element, access, 0) 1042d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB) 1043d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH) 1044d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW) 1045fcf5ef2aSThomas Huth #undef VMRG_DO 1046fcf5ef2aSThomas Huth #undef VMRG 1047fcf5ef2aSThomas Huth 1048fcf5ef2aSThomas Huth void helper_vmsummbm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1049fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1050fcf5ef2aSThomas Huth { 1051fcf5ef2aSThomas Huth int32_t prod[16]; 1052fcf5ef2aSThomas Huth int i; 1053fcf5ef2aSThomas Huth 1054fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s8); i++) { 1055fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s8[i] * b->u8[i]; 1056fcf5ef2aSThomas Huth } 1057fcf5ef2aSThomas Huth 1058fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1059fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] + 1060fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1061fcf5ef2aSThomas Huth } 1062fcf5ef2aSThomas Huth } 1063fcf5ef2aSThomas Huth 1064fcf5ef2aSThomas Huth void helper_vmsumshm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1065fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1066fcf5ef2aSThomas Huth { 1067fcf5ef2aSThomas Huth int32_t prod[8]; 1068fcf5ef2aSThomas Huth int i; 1069fcf5ef2aSThomas Huth 1070fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1071fcf5ef2aSThomas Huth prod[i] = a->s16[i] * b->s16[i]; 1072fcf5ef2aSThomas Huth } 1073fcf5ef2aSThomas Huth 1074fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1075fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1076fcf5ef2aSThomas Huth } 1077fcf5ef2aSThomas Huth } 1078fcf5ef2aSThomas Huth 1079fcf5ef2aSThomas Huth void helper_vmsumshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1080fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1081fcf5ef2aSThomas Huth { 1082fcf5ef2aSThomas Huth int32_t prod[8]; 1083fcf5ef2aSThomas Huth int i; 1084fcf5ef2aSThomas Huth int sat = 0; 1085fcf5ef2aSThomas Huth 1086fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1087fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s16[i] * b->s16[i]; 1088fcf5ef2aSThomas Huth } 1089fcf5ef2aSThomas Huth 1090fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1091fcf5ef2aSThomas Huth int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1092fcf5ef2aSThomas Huth 1093fcf5ef2aSThomas Huth r->u32[i] = cvtsdsw(t, &sat); 1094fcf5ef2aSThomas Huth } 1095fcf5ef2aSThomas Huth 1096fcf5ef2aSThomas Huth if (sat) { 10976175f5a0SRichard Henderson set_vscr_sat(env); 1098fcf5ef2aSThomas Huth } 1099fcf5ef2aSThomas Huth } 1100fcf5ef2aSThomas Huth 1101fcf5ef2aSThomas Huth void helper_vmsumubm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1102fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1103fcf5ef2aSThomas Huth { 1104fcf5ef2aSThomas Huth uint16_t prod[16]; 1105fcf5ef2aSThomas Huth int i; 1106fcf5ef2aSThomas Huth 1107fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1108fcf5ef2aSThomas Huth prod[i] = a->u8[i] * b->u8[i]; 1109fcf5ef2aSThomas Huth } 1110fcf5ef2aSThomas Huth 1111fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1112fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] + 1113fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1114fcf5ef2aSThomas Huth } 1115fcf5ef2aSThomas Huth } 1116fcf5ef2aSThomas Huth 1117fcf5ef2aSThomas Huth void helper_vmsumuhm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1118fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1119fcf5ef2aSThomas Huth { 1120fcf5ef2aSThomas Huth uint32_t prod[8]; 1121fcf5ef2aSThomas Huth int i; 1122fcf5ef2aSThomas Huth 1123fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1124fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1125fcf5ef2aSThomas Huth } 1126fcf5ef2aSThomas Huth 1127fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1128fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1129fcf5ef2aSThomas Huth } 1130fcf5ef2aSThomas Huth } 1131fcf5ef2aSThomas Huth 1132fcf5ef2aSThomas Huth void helper_vmsumuhs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1133fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1134fcf5ef2aSThomas Huth { 1135fcf5ef2aSThomas Huth uint32_t prod[8]; 1136fcf5ef2aSThomas Huth int i; 1137fcf5ef2aSThomas Huth int sat = 0; 1138fcf5ef2aSThomas Huth 1139fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1140fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1141fcf5ef2aSThomas Huth } 1142fcf5ef2aSThomas Huth 1143fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1144fcf5ef2aSThomas Huth uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1145fcf5ef2aSThomas Huth 1146fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1147fcf5ef2aSThomas Huth } 1148fcf5ef2aSThomas Huth 1149fcf5ef2aSThomas Huth if (sat) { 11506175f5a0SRichard Henderson set_vscr_sat(env); 1151fcf5ef2aSThomas Huth } 1152fcf5ef2aSThomas Huth } 1153fcf5ef2aSThomas Huth 11544fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast) \ 1155fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1156fcf5ef2aSThomas Huth { \ 1157fcf5ef2aSThomas Huth int i; \ 1158fcf5ef2aSThomas Huth \ 11594fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 11604fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i) * \ 11614fbc89edSMark Cave-Ayland (cast)b->mul_access(i); \ 1162fcf5ef2aSThomas Huth } \ 1163fcf5ef2aSThomas Huth } 11644fbc89edSMark Cave-Ayland 11654fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast) \ 11664fbc89edSMark Cave-Ayland void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 11674fbc89edSMark Cave-Ayland { \ 11684fbc89edSMark Cave-Ayland int i; \ 11694fbc89edSMark Cave-Ayland \ 11704fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 11714fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) * \ 11724fbc89edSMark Cave-Ayland (cast)b->mul_access(i + 1); \ 11734fbc89edSMark Cave-Ayland } \ 11744fbc89edSMark Cave-Ayland } 11754fbc89edSMark Cave-Ayland 11764fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast) \ 11774fbc89edSMark Cave-Ayland VMUL_DO_EVN(mule##suffix, mul_element, mul_access, prod_access, cast) \ 11784fbc89edSMark Cave-Ayland VMUL_DO_ODD(mulo##suffix, mul_element, mul_access, prod_access, cast) 11794fbc89edSMark Cave-Ayland VMUL(sb, s8, VsrSB, VsrSH, int16_t) 11804fbc89edSMark Cave-Ayland VMUL(sh, s16, VsrSH, VsrSW, int32_t) 11814fbc89edSMark Cave-Ayland VMUL(sw, s32, VsrSW, VsrSD, int64_t) 11824fbc89edSMark Cave-Ayland VMUL(ub, u8, VsrB, VsrH, uint16_t) 11834fbc89edSMark Cave-Ayland VMUL(uh, u16, VsrH, VsrW, uint32_t) 11844fbc89edSMark Cave-Ayland VMUL(uw, u32, VsrW, VsrD, uint64_t) 11854fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN 11864fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD 1187fcf5ef2aSThomas Huth #undef VMUL 1188fcf5ef2aSThomas Huth 1189f3e0d864SLijun Pan void helper_vmulhsw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1190f3e0d864SLijun Pan { 1191f3e0d864SLijun Pan int i; 1192f3e0d864SLijun Pan 1193f3e0d864SLijun Pan for (i = 0; i < 4; i++) { 1194f3e0d864SLijun Pan r->s32[i] = (int32_t)(((int64_t)a->s32[i] * (int64_t)b->s32[i]) >> 32); 1195f3e0d864SLijun Pan } 1196f3e0d864SLijun Pan } 1197f3e0d864SLijun Pan 1198f3e0d864SLijun Pan void helper_vmulhuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1199f3e0d864SLijun Pan { 1200f3e0d864SLijun Pan int i; 1201f3e0d864SLijun Pan 1202f3e0d864SLijun Pan for (i = 0; i < 4; i++) { 1203f3e0d864SLijun Pan r->u32[i] = (uint32_t)(((uint64_t)a->u32[i] * 1204f3e0d864SLijun Pan (uint64_t)b->u32[i]) >> 32); 1205f3e0d864SLijun Pan } 1206f3e0d864SLijun Pan } 1207f3e0d864SLijun Pan 1208c4b8b49dSLijun Pan void helper_vmulhsd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1209c4b8b49dSLijun Pan { 1210c4b8b49dSLijun Pan uint64_t discard; 1211c4b8b49dSLijun Pan 1212c4b8b49dSLijun Pan muls64(&discard, &r->u64[0], a->s64[0], b->s64[0]); 1213c4b8b49dSLijun Pan muls64(&discard, &r->u64[1], a->s64[1], b->s64[1]); 1214c4b8b49dSLijun Pan } 1215c4b8b49dSLijun Pan 1216c4b8b49dSLijun Pan void helper_vmulhud(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1217c4b8b49dSLijun Pan { 1218c4b8b49dSLijun Pan uint64_t discard; 1219c4b8b49dSLijun Pan 1220c4b8b49dSLijun Pan mulu64(&discard, &r->u64[0], a->u64[0], b->u64[0]); 1221c4b8b49dSLijun Pan mulu64(&discard, &r->u64[1], a->u64[1], b->u64[1]); 1222c4b8b49dSLijun Pan } 1223c4b8b49dSLijun Pan 1224fcf5ef2aSThomas Huth void helper_vperm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1225fcf5ef2aSThomas Huth ppc_avr_t *c) 1226fcf5ef2aSThomas Huth { 1227fcf5ef2aSThomas Huth ppc_avr_t result; 1228fcf5ef2aSThomas Huth int i; 1229fcf5ef2aSThomas Huth 123060594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 123160594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1232fcf5ef2aSThomas Huth int index = s & 0xf; 1233fcf5ef2aSThomas Huth 1234fcf5ef2aSThomas Huth if (s & 0x10) { 123560594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1236fcf5ef2aSThomas Huth } else { 123760594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1238fcf5ef2aSThomas Huth } 1239fcf5ef2aSThomas Huth } 1240fcf5ef2aSThomas Huth *r = result; 1241fcf5ef2aSThomas Huth } 1242fcf5ef2aSThomas Huth 1243fcf5ef2aSThomas Huth void helper_vpermr(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1244fcf5ef2aSThomas Huth ppc_avr_t *c) 1245fcf5ef2aSThomas Huth { 1246fcf5ef2aSThomas Huth ppc_avr_t result; 1247fcf5ef2aSThomas Huth int i; 1248fcf5ef2aSThomas Huth 124960594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 125060594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1251fcf5ef2aSThomas Huth int index = 15 - (s & 0xf); 1252fcf5ef2aSThomas Huth 1253fcf5ef2aSThomas Huth if (s & 0x10) { 125460594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1255fcf5ef2aSThomas Huth } else { 125660594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1257fcf5ef2aSThomas Huth } 1258fcf5ef2aSThomas Huth } 1259fcf5ef2aSThomas Huth *r = result; 1260fcf5ef2aSThomas Huth } 1261fcf5ef2aSThomas Huth 1262fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1263fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)]) 1264fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (i) 1265fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) != 0) 1266fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) (extract64((avr)->u64[i], index, 1)) 1267fcf5ef2aSThomas Huth #else 1268fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)]) 1269fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (1 - i) 1270fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) == 0) 1271fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) \ 1272fcf5ef2aSThomas Huth (extract64((avr)->u64[1 - i], 63 - index, 1)) 1273fcf5ef2aSThomas Huth #endif 1274fcf5ef2aSThomas Huth 1275fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1276fcf5ef2aSThomas Huth { 1277fcf5ef2aSThomas Huth int i, j; 1278fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 1279fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1280fcf5ef2aSThomas Huth for (j = 0; j < 8; j++) { 1281fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, (i * 8) + j); 1282fcf5ef2aSThomas Huth if (index < 64 && EXTRACT_BIT(a, i, index)) { 1283fcf5ef2aSThomas Huth result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j); 1284fcf5ef2aSThomas Huth } 1285fcf5ef2aSThomas Huth } 1286fcf5ef2aSThomas Huth } 1287fcf5ef2aSThomas Huth *r = result; 1288fcf5ef2aSThomas Huth } 1289fcf5ef2aSThomas Huth 1290fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1291fcf5ef2aSThomas Huth { 1292fcf5ef2aSThomas Huth int i; 1293fcf5ef2aSThomas Huth uint64_t perm = 0; 1294fcf5ef2aSThomas Huth 1295fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1296fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, i); 1297fcf5ef2aSThomas Huth 1298fcf5ef2aSThomas Huth if (index < 128) { 1299fcf5ef2aSThomas Huth uint64_t mask = (1ull << (63 - (index & 0x3F))); 1300fcf5ef2aSThomas Huth if (a->u64[VBPERMQ_DW(index)] & mask) { 1301fcf5ef2aSThomas Huth perm |= (0x8000 >> i); 1302fcf5ef2aSThomas Huth } 1303fcf5ef2aSThomas Huth } 1304fcf5ef2aSThomas Huth } 1305fcf5ef2aSThomas Huth 13063c385a93SMark Cave-Ayland r->VsrD(0) = perm; 13073c385a93SMark Cave-Ayland r->VsrD(1) = 0; 1308fcf5ef2aSThomas Huth } 1309fcf5ef2aSThomas Huth 1310fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX 1311fcf5ef2aSThomas Huth #undef VBPERMQ_DW 1312fcf5ef2aSThomas Huth 1313fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp) \ 1314fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1315fcf5ef2aSThomas Huth { \ 1316fcf5ef2aSThomas Huth int i, j; \ 1317fcf5ef2aSThomas Huth trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])]; \ 1318fcf5ef2aSThomas Huth \ 1319fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, srcfld) { \ 1320fcf5ef2aSThomas Huth prod[i] = 0; \ 1321fcf5ef2aSThomas Huth for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) { \ 1322fcf5ef2aSThomas Huth if (a->srcfld[i] & (1ull << j)) { \ 1323fcf5ef2aSThomas Huth prod[i] ^= ((trgtyp)b->srcfld[i] << j); \ 1324fcf5ef2aSThomas Huth } \ 1325fcf5ef2aSThomas Huth } \ 1326fcf5ef2aSThomas Huth } \ 1327fcf5ef2aSThomas Huth \ 1328fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, trgfld) { \ 1329fcf5ef2aSThomas Huth r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1]; \ 1330fcf5ef2aSThomas Huth } \ 1331fcf5ef2aSThomas Huth } 1332fcf5ef2aSThomas Huth 1333fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t) 1334fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t) 1335fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t) 1336fcf5ef2aSThomas Huth 1337fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1338fcf5ef2aSThomas Huth { 1339fcf5ef2aSThomas Huth 1340fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1341fcf5ef2aSThomas Huth int i, j; 1342fcf5ef2aSThomas Huth __uint128_t prod[2]; 1343fcf5ef2aSThomas Huth 1344fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1345fcf5ef2aSThomas Huth prod[i] = 0; 1346fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1347fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1348fcf5ef2aSThomas Huth prod[i] ^= (((__uint128_t)b->u64[i]) << j); 1349fcf5ef2aSThomas Huth } 1350fcf5ef2aSThomas Huth } 1351fcf5ef2aSThomas Huth } 1352fcf5ef2aSThomas Huth 1353fcf5ef2aSThomas Huth r->u128 = prod[0] ^ prod[1]; 1354fcf5ef2aSThomas Huth 1355fcf5ef2aSThomas Huth #else 1356fcf5ef2aSThomas Huth int i, j; 1357fcf5ef2aSThomas Huth ppc_avr_t prod[2]; 1358fcf5ef2aSThomas Huth 1359fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 13603c385a93SMark Cave-Ayland prod[i].VsrD(1) = prod[i].VsrD(0) = 0; 1361fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1362fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1363fcf5ef2aSThomas Huth ppc_avr_t bshift; 1364fcf5ef2aSThomas Huth if (j == 0) { 13653c385a93SMark Cave-Ayland bshift.VsrD(0) = 0; 13663c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i]; 1367fcf5ef2aSThomas Huth } else { 13683c385a93SMark Cave-Ayland bshift.VsrD(0) = b->u64[i] >> (64 - j); 13693c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i] << j; 1370fcf5ef2aSThomas Huth } 13713c385a93SMark Cave-Ayland prod[i].VsrD(1) ^= bshift.VsrD(1); 13723c385a93SMark Cave-Ayland prod[i].VsrD(0) ^= bshift.VsrD(0); 1373fcf5ef2aSThomas Huth } 1374fcf5ef2aSThomas Huth } 1375fcf5ef2aSThomas Huth } 1376fcf5ef2aSThomas Huth 13773c385a93SMark Cave-Ayland r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1); 13783c385a93SMark Cave-Ayland r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0); 1379fcf5ef2aSThomas Huth #endif 1380fcf5ef2aSThomas Huth } 1381fcf5ef2aSThomas Huth 1382fcf5ef2aSThomas Huth 1383fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1384fcf5ef2aSThomas Huth #define PKBIG 1 1385fcf5ef2aSThomas Huth #else 1386fcf5ef2aSThomas Huth #define PKBIG 0 1387fcf5ef2aSThomas Huth #endif 1388fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1389fcf5ef2aSThomas Huth { 1390fcf5ef2aSThomas Huth int i, j; 1391fcf5ef2aSThomas Huth ppc_avr_t result; 1392fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1393fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { a, b }; 1394fcf5ef2aSThomas Huth #else 1395fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { b, a }; 1396fcf5ef2aSThomas Huth #endif 1397fcf5ef2aSThomas Huth 1398fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1399fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(j, u32) { 1400fcf5ef2aSThomas Huth uint32_t e = x[i]->u32[j]; 1401fcf5ef2aSThomas Huth 1402fcf5ef2aSThomas Huth result.u16[4 * i + j] = (((e >> 9) & 0xfc00) | 1403fcf5ef2aSThomas Huth ((e >> 6) & 0x3e0) | 1404fcf5ef2aSThomas Huth ((e >> 3) & 0x1f)); 1405fcf5ef2aSThomas Huth } 1406fcf5ef2aSThomas Huth } 1407fcf5ef2aSThomas Huth *r = result; 1408fcf5ef2aSThomas Huth } 1409fcf5ef2aSThomas Huth 1410fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat) \ 1411fcf5ef2aSThomas Huth void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1412fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 1413fcf5ef2aSThomas Huth { \ 1414fcf5ef2aSThomas Huth int i; \ 1415fcf5ef2aSThomas Huth int sat = 0; \ 1416fcf5ef2aSThomas Huth ppc_avr_t result; \ 1417fcf5ef2aSThomas Huth ppc_avr_t *a0 = PKBIG ? a : b; \ 1418fcf5ef2aSThomas Huth ppc_avr_t *a1 = PKBIG ? b : a; \ 1419fcf5ef2aSThomas Huth \ 1420fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, from) { \ 1421fcf5ef2aSThomas Huth result.to[i] = cvt(a0->from[i], &sat); \ 1422fcf5ef2aSThomas Huth result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\ 1423fcf5ef2aSThomas Huth } \ 1424fcf5ef2aSThomas Huth *r = result; \ 1425fcf5ef2aSThomas Huth if (dosat && sat) { \ 14266175f5a0SRichard Henderson set_vscr_sat(env); \ 1427fcf5ef2aSThomas Huth } \ 1428fcf5ef2aSThomas Huth } 1429fcf5ef2aSThomas Huth #define I(x, y) (x) 1430fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1) 1431fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1) 1432fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1) 1433fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1) 1434fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1) 1435fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1) 1436fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1) 1437fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1) 1438fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1) 1439fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0) 1440fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0) 1441fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0) 1442fcf5ef2aSThomas Huth #undef I 1443fcf5ef2aSThomas Huth #undef VPK 1444fcf5ef2aSThomas Huth #undef PKBIG 1445fcf5ef2aSThomas Huth 1446fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1447fcf5ef2aSThomas Huth { 1448fcf5ef2aSThomas Huth int i; 1449fcf5ef2aSThomas Huth 145005ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 145105ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status); 1452fcf5ef2aSThomas Huth } 1453fcf5ef2aSThomas Huth } 1454fcf5ef2aSThomas Huth 1455fcf5ef2aSThomas Huth #define VRFI(suffix, rounding) \ 1456fcf5ef2aSThomas Huth void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1457fcf5ef2aSThomas Huth ppc_avr_t *b) \ 1458fcf5ef2aSThomas Huth { \ 1459fcf5ef2aSThomas Huth int i; \ 1460fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 1461fcf5ef2aSThomas Huth \ 1462fcf5ef2aSThomas Huth set_float_rounding_mode(rounding, &s); \ 146305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 146405ee3e8aSMark Cave-Ayland r->f32[i] = float32_round_to_int (b->f32[i], &s); \ 1465fcf5ef2aSThomas Huth } \ 1466fcf5ef2aSThomas Huth } 1467fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even) 1468fcf5ef2aSThomas Huth VRFI(m, float_round_down) 1469fcf5ef2aSThomas Huth VRFI(p, float_round_up) 1470fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero) 1471fcf5ef2aSThomas Huth #undef VRFI 1472fcf5ef2aSThomas Huth 1473fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1474fcf5ef2aSThomas Huth { 1475fcf5ef2aSThomas Huth int i; 1476fcf5ef2aSThomas Huth 147705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 147805ee3e8aSMark Cave-Ayland float32 t = float32_sqrt(b->f32[i], &env->vec_status); 1479fcf5ef2aSThomas Huth 148005ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, t, &env->vec_status); 1481fcf5ef2aSThomas Huth } 1482fcf5ef2aSThomas Huth } 1483fcf5ef2aSThomas Huth 1484fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert) \ 1485fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1486fcf5ef2aSThomas Huth { \ 1487fcf5ef2aSThomas Huth int i; \ 1488fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1489fcf5ef2aSThomas Huth uint##size##_t src1 = a->element[i]; \ 1490fcf5ef2aSThomas Huth uint##size##_t src2 = b->element[i]; \ 1491fcf5ef2aSThomas Huth uint##size##_t src3 = r->element[i]; \ 1492fcf5ef2aSThomas Huth uint##size##_t begin, end, shift, mask, rot_val; \ 1493fcf5ef2aSThomas Huth \ 1494fcf5ef2aSThomas Huth shift = extract##size(src2, 0, 6); \ 1495fcf5ef2aSThomas Huth end = extract##size(src2, 8, 6); \ 1496fcf5ef2aSThomas Huth begin = extract##size(src2, 16, 6); \ 1497fcf5ef2aSThomas Huth rot_val = rol##size(src1, shift); \ 1498fcf5ef2aSThomas Huth mask = mask_u##size(begin, end); \ 1499fcf5ef2aSThomas Huth if (insert) { \ 1500fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask) | (src3 & ~mask); \ 1501fcf5ef2aSThomas Huth } else { \ 1502fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask); \ 1503fcf5ef2aSThomas Huth } \ 1504fcf5ef2aSThomas Huth } \ 1505fcf5ef2aSThomas Huth } 1506fcf5ef2aSThomas Huth 1507fcf5ef2aSThomas Huth VRLMI(vrldmi, 64, u64, 1); 1508fcf5ef2aSThomas Huth VRLMI(vrlwmi, 32, u32, 1); 1509fcf5ef2aSThomas Huth VRLMI(vrldnm, 64, u64, 0); 1510fcf5ef2aSThomas Huth VRLMI(vrlwnm, 32, u32, 0); 1511fcf5ef2aSThomas Huth 1512fcf5ef2aSThomas Huth void helper_vsel(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1513fcf5ef2aSThomas Huth ppc_avr_t *c) 1514fcf5ef2aSThomas Huth { 1515fcf5ef2aSThomas Huth r->u64[0] = (a->u64[0] & ~c->u64[0]) | (b->u64[0] & c->u64[0]); 1516fcf5ef2aSThomas Huth r->u64[1] = (a->u64[1] & ~c->u64[1]) | (b->u64[1] & c->u64[1]); 1517fcf5ef2aSThomas Huth } 1518fcf5ef2aSThomas Huth 1519fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1520fcf5ef2aSThomas Huth { 1521fcf5ef2aSThomas Huth int i; 1522fcf5ef2aSThomas Huth 152305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 152405ee3e8aSMark Cave-Ayland r->f32[i] = float32_exp2(b->f32[i], &env->vec_status); 1525fcf5ef2aSThomas Huth } 1526fcf5ef2aSThomas Huth } 1527fcf5ef2aSThomas Huth 1528fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1529fcf5ef2aSThomas Huth { 1530fcf5ef2aSThomas Huth int i; 1531fcf5ef2aSThomas Huth 153205ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 153305ee3e8aSMark Cave-Ayland r->f32[i] = float32_log2(b->f32[i], &env->vec_status); 1534fcf5ef2aSThomas Huth } 1535fcf5ef2aSThomas Huth } 1536fcf5ef2aSThomas Huth 153760caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 153860caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 153960caf221SAvinesh Kumar { \ 1540f297c4c6SMatheus Ferst int index = (a & 0xf) * 8; \ 154160caf221SAvinesh Kumar if (left) { \ 1542f297c4c6SMatheus Ferst index = 128 - index - size; \ 154360caf221SAvinesh Kumar } \ 154460caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 154560caf221SAvinesh Kumar MAKE_64BIT_MASK(0, size); \ 154660caf221SAvinesh Kumar } 154760caf221SAvinesh Kumar VEXTU_X_DO(vextublx, 8, 1) 154860caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1) 154960caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1) 155060caf221SAvinesh Kumar VEXTU_X_DO(vextubrx, 8, 0) 155160caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0) 155260caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0) 155360caf221SAvinesh Kumar #undef VEXTU_X_DO 155460caf221SAvinesh Kumar 1555fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1556fcf5ef2aSThomas Huth { 1557fcf5ef2aSThomas Huth int i; 1558fcf5ef2aSThomas Huth unsigned int shift, bytes, size; 1559fcf5ef2aSThomas Huth 1560fcf5ef2aSThomas Huth size = ARRAY_SIZE(r->u8); 1561fcf5ef2aSThomas Huth for (i = 0; i < size; i++) { 156263be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 156363be02fcSAnton Blanchard bytes = (a->VsrB(i) << 8) + /* extract adjacent bytes */ 156463be02fcSAnton Blanchard (((i + 1) < size) ? a->VsrB(i + 1) : 0); 156563be02fcSAnton Blanchard r->VsrB(i) = (bytes << shift) >> 8; /* shift and store result */ 1566fcf5ef2aSThomas Huth } 1567fcf5ef2aSThomas Huth } 1568fcf5ef2aSThomas Huth 1569fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1570fcf5ef2aSThomas Huth { 1571fcf5ef2aSThomas Huth int i; 1572fcf5ef2aSThomas Huth unsigned int shift, bytes; 1573fcf5ef2aSThomas Huth 1574b6cb41b2SDavid Gibson /* 1575b6cb41b2SDavid Gibson * Use reverse order, as destination and source register can be 1576b6cb41b2SDavid Gibson * same. Its being modified in place saving temporary, reverse 1577b6cb41b2SDavid Gibson * order will guarantee that computed result is not fed back. 1578fcf5ef2aSThomas Huth */ 1579fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 158063be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 158163be02fcSAnton Blanchard bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i); 1582fcf5ef2aSThomas Huth /* extract adjacent bytes */ 158363be02fcSAnton Blanchard r->VsrB(i) = (bytes >> shift) & 0xFF; /* shift and store result */ 1584fcf5ef2aSThomas Huth } 1585fcf5ef2aSThomas Huth } 1586fcf5ef2aSThomas Huth 1587fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift) 1588fcf5ef2aSThomas Huth { 1589fcf5ef2aSThomas Huth int sh = shift & 0xf; 1590fcf5ef2aSThomas Huth int i; 1591fcf5ef2aSThomas Huth ppc_avr_t result; 1592fcf5ef2aSThomas Huth 1593fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1594fcf5ef2aSThomas Huth int index = sh + i; 1595fcf5ef2aSThomas Huth if (index > 0xf) { 159660594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index - 0x10); 1597fcf5ef2aSThomas Huth } else { 159860594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1599fcf5ef2aSThomas Huth } 1600fcf5ef2aSThomas Huth } 1601fcf5ef2aSThomas Huth *r = result; 1602fcf5ef2aSThomas Huth } 1603fcf5ef2aSThomas Huth 1604fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1605fcf5ef2aSThomas Huth { 16063c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1607fcf5ef2aSThomas Huth 1608fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1609fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1610fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1611fcf5ef2aSThomas Huth #else 1612fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1613fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1614fcf5ef2aSThomas Huth #endif 1615fcf5ef2aSThomas Huth } 1616fcf5ef2aSThomas Huth 1617fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1618fcf5ef2aSThomas Huth #define VINSERT(suffix, element) \ 1619fcf5ef2aSThomas Huth void helper_vinsert##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1620fcf5ef2aSThomas Huth { \ 16214fff7218SLaurent Vivier memmove(&r->u8[index], &b->u8[8 - sizeof(r->element[0])], \ 1622fcf5ef2aSThomas Huth sizeof(r->element[0])); \ 1623fcf5ef2aSThomas Huth } 1624fcf5ef2aSThomas Huth #else 1625fcf5ef2aSThomas Huth #define VINSERT(suffix, element) \ 1626fcf5ef2aSThomas Huth void helper_vinsert##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1627fcf5ef2aSThomas Huth { \ 1628fcf5ef2aSThomas Huth uint32_t d = (16 - index) - sizeof(r->element[0]); \ 1629fcf5ef2aSThomas Huth memmove(&r->u8[d], &b->u8[8], sizeof(r->element[0])); \ 1630fcf5ef2aSThomas Huth } 1631fcf5ef2aSThomas Huth #endif 1632fcf5ef2aSThomas Huth VINSERT(b, u8) 1633fcf5ef2aSThomas Huth VINSERT(h, u16) 1634fcf5ef2aSThomas Huth VINSERT(w, u32) 1635fcf5ef2aSThomas Huth VINSERT(d, u64) 1636fcf5ef2aSThomas Huth #undef VINSERT 1637fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1638fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1639fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1640fcf5ef2aSThomas Huth { \ 1641fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1642fcf5ef2aSThomas Huth memmove(&r->u8[8 - es], &b->u8[index], es); \ 1643fcf5ef2aSThomas Huth memset(&r->u8[8], 0, 8); \ 1644fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8 - es); \ 1645fcf5ef2aSThomas Huth } 1646fcf5ef2aSThomas Huth #else 1647fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1648fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1649fcf5ef2aSThomas Huth { \ 1650fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1651fcf5ef2aSThomas Huth uint32_t s = (16 - index) - es; \ 1652fcf5ef2aSThomas Huth memmove(&r->u8[8], &b->u8[s], es); \ 1653fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8); \ 1654fcf5ef2aSThomas Huth memset(&r->u8[8 + es], 0, 8 - es); \ 1655fcf5ef2aSThomas Huth } 1656fcf5ef2aSThomas Huth #endif 1657fcf5ef2aSThomas Huth VEXTRACT(ub, u8) 1658fcf5ef2aSThomas Huth VEXTRACT(uh, u16) 1659fcf5ef2aSThomas Huth VEXTRACT(uw, u32) 1660fcf5ef2aSThomas Huth VEXTRACT(d, u64) 1661fcf5ef2aSThomas Huth #undef VEXTRACT 1662fcf5ef2aSThomas Huth 16635ba5335dSMark Cave-Ayland void helper_xxextractuw(CPUPPCState *env, ppc_vsr_t *xt, 16645ba5335dSMark Cave-Ayland ppc_vsr_t *xb, uint32_t index) 16658ad901e5SNikunj A Dadhania { 166603b32c09SMark Cave-Ayland ppc_vsr_t t = { }; 16678ad901e5SNikunj A Dadhania size_t es = sizeof(uint32_t); 16688ad901e5SNikunj A Dadhania uint32_t ext_index; 16698ad901e5SNikunj A Dadhania int i; 16708ad901e5SNikunj A Dadhania 16718ad901e5SNikunj A Dadhania ext_index = index; 16728ad901e5SNikunj A Dadhania for (i = 0; i < es; i++, ext_index++) { 167303b32c09SMark Cave-Ayland t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16); 16748ad901e5SNikunj A Dadhania } 16758ad901e5SNikunj A Dadhania 167603b32c09SMark Cave-Ayland *xt = t; 16778ad901e5SNikunj A Dadhania } 16788ad901e5SNikunj A Dadhania 16795ba5335dSMark Cave-Ayland void helper_xxinsertw(CPUPPCState *env, ppc_vsr_t *xt, 16805ba5335dSMark Cave-Ayland ppc_vsr_t *xb, uint32_t index) 16813398b742SNikunj A Dadhania { 168203b32c09SMark Cave-Ayland ppc_vsr_t t = *xt; 16833398b742SNikunj A Dadhania size_t es = sizeof(uint32_t); 16843398b742SNikunj A Dadhania int ins_index, i = 0; 16853398b742SNikunj A Dadhania 16863398b742SNikunj A Dadhania ins_index = index; 16873398b742SNikunj A Dadhania for (i = 0; i < es && ins_index < 16; i++, ins_index++) { 168803b32c09SMark Cave-Ayland t.VsrB(ins_index) = xb->VsrB(8 - es + i); 16893398b742SNikunj A Dadhania } 16903398b742SNikunj A Dadhania 169103b32c09SMark Cave-Ayland *xt = t; 16923398b742SNikunj A Dadhania } 16933398b742SNikunj A Dadhania 1694634c5835SMark Cave-Ayland #define VEXT_SIGNED(name, element, cast) \ 1695fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 1696fcf5ef2aSThomas Huth { \ 1697fcf5ef2aSThomas Huth int i; \ 169860594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1699634c5835SMark Cave-Ayland r->element[i] = (cast)b->element[i]; \ 1700fcf5ef2aSThomas Huth } \ 1701fcf5ef2aSThomas Huth } 1702634c5835SMark Cave-Ayland VEXT_SIGNED(vextsb2w, s32, int8_t) 1703634c5835SMark Cave-Ayland VEXT_SIGNED(vextsb2d, s64, int8_t) 1704634c5835SMark Cave-Ayland VEXT_SIGNED(vextsh2w, s32, int16_t) 1705634c5835SMark Cave-Ayland VEXT_SIGNED(vextsh2d, s64, int16_t) 1706634c5835SMark Cave-Ayland VEXT_SIGNED(vextsw2d, s64, int32_t) 1707fcf5ef2aSThomas Huth #undef VEXT_SIGNED 1708fcf5ef2aSThomas Huth 1709fcf5ef2aSThomas Huth #define VNEG(name, element) \ 1710fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 1711fcf5ef2aSThomas Huth { \ 1712fcf5ef2aSThomas Huth int i; \ 171360594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1714fcf5ef2aSThomas Huth r->element[i] = -b->element[i]; \ 1715fcf5ef2aSThomas Huth } \ 1716fcf5ef2aSThomas Huth } 1717fcf5ef2aSThomas Huth VNEG(vnegw, s32) 1718fcf5ef2aSThomas Huth VNEG(vnegd, s64) 1719fcf5ef2aSThomas Huth #undef VNEG 1720fcf5ef2aSThomas Huth 1721fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1722fcf5ef2aSThomas Huth { 17233c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1724fcf5ef2aSThomas Huth 1725fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1726fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1727fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1728fcf5ef2aSThomas Huth #else 1729fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1730fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1731fcf5ef2aSThomas Huth #endif 1732fcf5ef2aSThomas Huth } 1733fcf5ef2aSThomas Huth 1734fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1735fcf5ef2aSThomas Huth { 1736fcf5ef2aSThomas Huth int i; 1737fcf5ef2aSThomas Huth 1738fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 1739fcf5ef2aSThomas Huth r->u32[i] = a->u32[i] >= b->u32[i]; 1740fcf5ef2aSThomas Huth } 1741fcf5ef2aSThomas Huth } 1742fcf5ef2aSThomas Huth 1743fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1744fcf5ef2aSThomas Huth { 1745fcf5ef2aSThomas Huth int64_t t; 1746fcf5ef2aSThomas Huth int i, upper; 1747fcf5ef2aSThomas Huth ppc_avr_t result; 1748fcf5ef2aSThomas Huth int sat = 0; 1749fcf5ef2aSThomas Huth 1750fcf5ef2aSThomas Huth upper = ARRAY_SIZE(r->s32) - 1; 175160594feaSMark Cave-Ayland t = (int64_t)b->VsrSW(upper); 1752fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 175360594feaSMark Cave-Ayland t += a->VsrSW(i); 175460594feaSMark Cave-Ayland result.VsrSW(i) = 0; 1755fcf5ef2aSThomas Huth } 175660594feaSMark Cave-Ayland result.VsrSW(upper) = cvtsdsw(t, &sat); 1757fcf5ef2aSThomas Huth *r = result; 1758fcf5ef2aSThomas Huth 1759fcf5ef2aSThomas Huth if (sat) { 17606175f5a0SRichard Henderson set_vscr_sat(env); 1761fcf5ef2aSThomas Huth } 1762fcf5ef2aSThomas Huth } 1763fcf5ef2aSThomas Huth 1764fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1765fcf5ef2aSThomas Huth { 1766fcf5ef2aSThomas Huth int i, j, upper; 1767fcf5ef2aSThomas Huth ppc_avr_t result; 1768fcf5ef2aSThomas Huth int sat = 0; 1769fcf5ef2aSThomas Huth 1770fcf5ef2aSThomas Huth upper = 1; 1771fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 177260594feaSMark Cave-Ayland int64_t t = (int64_t)b->VsrSW(upper + i * 2); 1773fcf5ef2aSThomas Huth 17747fa0ddc1SAnton Blanchard result.VsrD(i) = 0; 1775fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u64); j++) { 177660594feaSMark Cave-Ayland t += a->VsrSW(2 * i + j); 1777fcf5ef2aSThomas Huth } 177860594feaSMark Cave-Ayland result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat); 1779fcf5ef2aSThomas Huth } 1780fcf5ef2aSThomas Huth 1781fcf5ef2aSThomas Huth *r = result; 1782fcf5ef2aSThomas Huth if (sat) { 17836175f5a0SRichard Henderson set_vscr_sat(env); 1784fcf5ef2aSThomas Huth } 1785fcf5ef2aSThomas Huth } 1786fcf5ef2aSThomas Huth 1787fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1788fcf5ef2aSThomas Huth { 1789fcf5ef2aSThomas Huth int i, j; 1790fcf5ef2aSThomas Huth int sat = 0; 1791fcf5ef2aSThomas Huth 1792fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1793fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1794fcf5ef2aSThomas Huth 1795fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->s32); j++) { 1796fcf5ef2aSThomas Huth t += a->s8[4 * i + j]; 1797fcf5ef2aSThomas Huth } 1798fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1799fcf5ef2aSThomas Huth } 1800fcf5ef2aSThomas Huth 1801fcf5ef2aSThomas Huth if (sat) { 18026175f5a0SRichard Henderson set_vscr_sat(env); 1803fcf5ef2aSThomas Huth } 1804fcf5ef2aSThomas Huth } 1805fcf5ef2aSThomas Huth 1806fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1807fcf5ef2aSThomas Huth { 1808fcf5ef2aSThomas Huth int sat = 0; 1809fcf5ef2aSThomas Huth int i; 1810fcf5ef2aSThomas Huth 1811fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1812fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1813fcf5ef2aSThomas Huth 1814fcf5ef2aSThomas Huth t += a->s16[2 * i] + a->s16[2 * i + 1]; 1815fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1816fcf5ef2aSThomas Huth } 1817fcf5ef2aSThomas Huth 1818fcf5ef2aSThomas Huth if (sat) { 18196175f5a0SRichard Henderson set_vscr_sat(env); 1820fcf5ef2aSThomas Huth } 1821fcf5ef2aSThomas Huth } 1822fcf5ef2aSThomas Huth 1823fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1824fcf5ef2aSThomas Huth { 1825fcf5ef2aSThomas Huth int i, j; 1826fcf5ef2aSThomas Huth int sat = 0; 1827fcf5ef2aSThomas Huth 1828fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 1829fcf5ef2aSThomas Huth uint64_t t = (uint64_t)b->u32[i]; 1830fcf5ef2aSThomas Huth 1831fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u32); j++) { 1832fcf5ef2aSThomas Huth t += a->u8[4 * i + j]; 1833fcf5ef2aSThomas Huth } 1834fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1835fcf5ef2aSThomas Huth } 1836fcf5ef2aSThomas Huth 1837fcf5ef2aSThomas Huth if (sat) { 18386175f5a0SRichard Henderson set_vscr_sat(env); 1839fcf5ef2aSThomas Huth } 1840fcf5ef2aSThomas Huth } 1841fcf5ef2aSThomas Huth 1842fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1843fcf5ef2aSThomas Huth #define UPKHI 1 1844fcf5ef2aSThomas Huth #define UPKLO 0 1845fcf5ef2aSThomas Huth #else 1846fcf5ef2aSThomas Huth #define UPKHI 0 1847fcf5ef2aSThomas Huth #define UPKLO 1 1848fcf5ef2aSThomas Huth #endif 1849fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi) \ 1850fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 1851fcf5ef2aSThomas Huth { \ 1852fcf5ef2aSThomas Huth int i; \ 1853fcf5ef2aSThomas Huth ppc_avr_t result; \ 1854fcf5ef2aSThomas Huth \ 1855fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { \ 1856fcf5ef2aSThomas Huth uint16_t e = b->u16[hi ? i : i + 4]; \ 1857fcf5ef2aSThomas Huth uint8_t a = (e >> 15) ? 0xff : 0; \ 1858fcf5ef2aSThomas Huth uint8_t r = (e >> 10) & 0x1f; \ 1859fcf5ef2aSThomas Huth uint8_t g = (e >> 5) & 0x1f; \ 1860fcf5ef2aSThomas Huth uint8_t b = e & 0x1f; \ 1861fcf5ef2aSThomas Huth \ 1862fcf5ef2aSThomas Huth result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b; \ 1863fcf5ef2aSThomas Huth } \ 1864fcf5ef2aSThomas Huth *r = result; \ 1865fcf5ef2aSThomas Huth } 1866fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO) 1867fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI) 1868fcf5ef2aSThomas Huth #undef VUPKPX 1869fcf5ef2aSThomas Huth 1870fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi) \ 1871fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 1872fcf5ef2aSThomas Huth { \ 1873fcf5ef2aSThomas Huth int i; \ 1874fcf5ef2aSThomas Huth ppc_avr_t result; \ 1875fcf5ef2aSThomas Huth \ 1876fcf5ef2aSThomas Huth if (hi) { \ 1877fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) { \ 1878fcf5ef2aSThomas Huth result.unpacked[i] = b->packee[i]; \ 1879fcf5ef2aSThomas Huth } \ 1880fcf5ef2aSThomas Huth } else { \ 1881fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \ 1882fcf5ef2aSThomas Huth i++) { \ 1883fcf5ef2aSThomas Huth result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \ 1884fcf5ef2aSThomas Huth } \ 1885fcf5ef2aSThomas Huth } \ 1886fcf5ef2aSThomas Huth *r = result; \ 1887fcf5ef2aSThomas Huth } 1888fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI) 1889fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI) 1890fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI) 1891fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO) 1892fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO) 1893fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO) 1894fcf5ef2aSThomas Huth #undef VUPK 1895fcf5ef2aSThomas Huth #undef UPKHI 1896fcf5ef2aSThomas Huth #undef UPKLO 1897fcf5ef2aSThomas Huth 1898fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element) \ 1899fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *b) \ 1900fcf5ef2aSThomas Huth { \ 1901fcf5ef2aSThomas Huth int i; \ 1902fcf5ef2aSThomas Huth \ 190360594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1904fcf5ef2aSThomas Huth r->element[i] = name(b->element[i]); \ 1905fcf5ef2aSThomas Huth } \ 1906fcf5ef2aSThomas Huth } 1907fcf5ef2aSThomas Huth 1908fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8) 1909fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16) 1910fcf5ef2aSThomas Huth 1911fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8) 1912fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16) 1913fcf5ef2aSThomas Huth 1914fcf5ef2aSThomas Huth #undef clzb 1915fcf5ef2aSThomas Huth #undef clzh 1916fcf5ef2aSThomas Huth 1917fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8) 1918fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16) 1919fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v)) 1920fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v)) 1921fcf5ef2aSThomas Huth 1922fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8) 1923fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16) 1924fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32) 1925fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64) 1926fcf5ef2aSThomas Huth 1927fcf5ef2aSThomas Huth #undef ctzb 1928fcf5ef2aSThomas Huth #undef ctzh 1929fcf5ef2aSThomas Huth #undef ctzw 1930fcf5ef2aSThomas Huth #undef ctzd 1931fcf5ef2aSThomas Huth 1932fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v) 1933fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v) 1934fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v) 1935fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v) 1936fcf5ef2aSThomas Huth 1937fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8) 1938fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16) 1939fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32) 1940fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64) 1941fcf5ef2aSThomas Huth 1942fcf5ef2aSThomas Huth #undef popcntb 1943fcf5ef2aSThomas Huth #undef popcnth 1944fcf5ef2aSThomas Huth #undef popcntw 1945fcf5ef2aSThomas Huth #undef popcntd 1946fcf5ef2aSThomas Huth 1947fcf5ef2aSThomas Huth #undef VGENERIC_DO 1948fcf5ef2aSThomas Huth 1949fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1950fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 0, 1 } } 1951fcf5ef2aSThomas Huth #else 1952fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 1, 0 } } 1953fcf5ef2aSThomas Huth #endif 1954fcf5ef2aSThomas Huth 1955fcf5ef2aSThomas Huth #ifndef CONFIG_INT128 1956fcf5ef2aSThomas Huth 1957fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a) 1958fcf5ef2aSThomas Huth { 1959fcf5ef2aSThomas Huth t->u64[0] = ~a.u64[0]; 1960fcf5ef2aSThomas Huth t->u64[1] = ~a.u64[1]; 1961fcf5ef2aSThomas Huth } 1962fcf5ef2aSThomas Huth 1963fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b) 1964fcf5ef2aSThomas Huth { 19653c385a93SMark Cave-Ayland if (a.VsrD(0) < b.VsrD(0)) { 1966fcf5ef2aSThomas Huth return -1; 19673c385a93SMark Cave-Ayland } else if (a.VsrD(0) > b.VsrD(0)) { 1968fcf5ef2aSThomas Huth return 1; 19693c385a93SMark Cave-Ayland } else if (a.VsrD(1) < b.VsrD(1)) { 1970fcf5ef2aSThomas Huth return -1; 19713c385a93SMark Cave-Ayland } else if (a.VsrD(1) > b.VsrD(1)) { 1972fcf5ef2aSThomas Huth return 1; 1973fcf5ef2aSThomas Huth } else { 1974fcf5ef2aSThomas Huth return 0; 1975fcf5ef2aSThomas Huth } 1976fcf5ef2aSThomas Huth } 1977fcf5ef2aSThomas Huth 1978fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 1979fcf5ef2aSThomas Huth { 19803c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 19813c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 19823c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 1983fcf5ef2aSThomas Huth } 1984fcf5ef2aSThomas Huth 1985fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 1986fcf5ef2aSThomas Huth { 1987fcf5ef2aSThomas Huth ppc_avr_t not_a; 19883c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 19893c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 19903c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 1991fcf5ef2aSThomas Huth avr_qw_not(¬_a, a); 1992fcf5ef2aSThomas Huth return avr_qw_cmpu(not_a, b) < 0; 1993fcf5ef2aSThomas Huth } 1994fcf5ef2aSThomas Huth 1995fcf5ef2aSThomas Huth #endif 1996fcf5ef2aSThomas Huth 1997fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1998fcf5ef2aSThomas Huth { 1999fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2000fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128; 2001fcf5ef2aSThomas Huth #else 2002fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 2003fcf5ef2aSThomas Huth #endif 2004fcf5ef2aSThomas Huth } 2005fcf5ef2aSThomas Huth 2006fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2007fcf5ef2aSThomas Huth { 2008fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2009fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128 + (c->u128 & 1); 2010fcf5ef2aSThomas Huth #else 2011fcf5ef2aSThomas Huth 20123c385a93SMark Cave-Ayland if (c->VsrD(1) & 1) { 2013fcf5ef2aSThomas Huth ppc_avr_t tmp; 2014fcf5ef2aSThomas Huth 20153c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 20163c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 2017fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 2018fcf5ef2aSThomas Huth avr_qw_add(r, tmp, *b); 2019fcf5ef2aSThomas Huth } else { 2020fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 2021fcf5ef2aSThomas Huth } 2022fcf5ef2aSThomas Huth #endif 2023fcf5ef2aSThomas Huth } 2024fcf5ef2aSThomas Huth 2025fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2026fcf5ef2aSThomas Huth { 2027fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2028fcf5ef2aSThomas Huth r->u128 = (~a->u128 < b->u128); 2029fcf5ef2aSThomas Huth #else 2030fcf5ef2aSThomas Huth ppc_avr_t not_a; 2031fcf5ef2aSThomas Huth 2032fcf5ef2aSThomas Huth avr_qw_not(¬_a, *a); 2033fcf5ef2aSThomas Huth 20343c385a93SMark Cave-Ayland r->VsrD(0) = 0; 20353c385a93SMark Cave-Ayland r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0); 2036fcf5ef2aSThomas Huth #endif 2037fcf5ef2aSThomas Huth } 2038fcf5ef2aSThomas Huth 2039fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2040fcf5ef2aSThomas Huth { 2041fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2042fcf5ef2aSThomas Huth int carry_out = (~a->u128 < b->u128); 2043fcf5ef2aSThomas Huth if (!carry_out && (c->u128 & 1)) { 2044fcf5ef2aSThomas Huth carry_out = ((a->u128 + b->u128 + 1) == 0) && 2045fcf5ef2aSThomas Huth ((a->u128 != 0) || (b->u128 != 0)); 2046fcf5ef2aSThomas Huth } 2047fcf5ef2aSThomas Huth r->u128 = carry_out; 2048fcf5ef2aSThomas Huth #else 2049fcf5ef2aSThomas Huth 20503c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 2051fcf5ef2aSThomas Huth int carry_out = 0; 2052fcf5ef2aSThomas Huth ppc_avr_t tmp; 2053fcf5ef2aSThomas Huth 2054fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, *a, *b); 2055fcf5ef2aSThomas Huth 2056fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2057fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 2058fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, tmp, one); 2059fcf5ef2aSThomas Huth } 20603c385a93SMark Cave-Ayland r->VsrD(0) = 0; 20613c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2062fcf5ef2aSThomas Huth #endif 2063fcf5ef2aSThomas Huth } 2064fcf5ef2aSThomas Huth 2065fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2066fcf5ef2aSThomas Huth { 2067fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2068fcf5ef2aSThomas Huth r->u128 = a->u128 - b->u128; 2069fcf5ef2aSThomas Huth #else 2070fcf5ef2aSThomas Huth ppc_avr_t tmp; 2071fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 2072fcf5ef2aSThomas Huth 2073fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2074fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 2075fcf5ef2aSThomas Huth avr_qw_add(r, tmp, one); 2076fcf5ef2aSThomas Huth #endif 2077fcf5ef2aSThomas Huth } 2078fcf5ef2aSThomas Huth 2079fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2080fcf5ef2aSThomas Huth { 2081fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2082fcf5ef2aSThomas Huth r->u128 = a->u128 + ~b->u128 + (c->u128 & 1); 2083fcf5ef2aSThomas Huth #else 2084fcf5ef2aSThomas Huth ppc_avr_t tmp, sum; 2085fcf5ef2aSThomas Huth 2086fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2087fcf5ef2aSThomas Huth avr_qw_add(&sum, *a, tmp); 2088fcf5ef2aSThomas Huth 20893c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 20903c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 2091fcf5ef2aSThomas Huth avr_qw_add(r, sum, tmp); 2092fcf5ef2aSThomas Huth #endif 2093fcf5ef2aSThomas Huth } 2094fcf5ef2aSThomas Huth 2095fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2096fcf5ef2aSThomas Huth { 2097fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2098fcf5ef2aSThomas Huth r->u128 = (~a->u128 < ~b->u128) || 2099fcf5ef2aSThomas Huth (a->u128 + ~b->u128 == (__uint128_t)-1); 2100fcf5ef2aSThomas Huth #else 2101fcf5ef2aSThomas Huth int carry = (avr_qw_cmpu(*a, *b) > 0); 2102fcf5ef2aSThomas Huth if (!carry) { 2103fcf5ef2aSThomas Huth ppc_avr_t tmp; 2104fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2105fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 21063c385a93SMark Cave-Ayland carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull)); 2107fcf5ef2aSThomas Huth } 21083c385a93SMark Cave-Ayland r->VsrD(0) = 0; 21093c385a93SMark Cave-Ayland r->VsrD(1) = carry; 2110fcf5ef2aSThomas Huth #endif 2111fcf5ef2aSThomas Huth } 2112fcf5ef2aSThomas Huth 2113fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2114fcf5ef2aSThomas Huth { 2115fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2116fcf5ef2aSThomas Huth r->u128 = 2117fcf5ef2aSThomas Huth (~a->u128 < ~b->u128) || 2118fcf5ef2aSThomas Huth ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1)); 2119fcf5ef2aSThomas Huth #else 21203c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 2121fcf5ef2aSThomas Huth int carry_out = (avr_qw_cmpu(*a, *b) > 0); 2122fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2123fcf5ef2aSThomas Huth ppc_avr_t tmp; 2124fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2125fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 21263c385a93SMark Cave-Ayland carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull)); 2127fcf5ef2aSThomas Huth } 2128fcf5ef2aSThomas Huth 21293c385a93SMark Cave-Ayland r->VsrD(0) = 0; 21303c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2131fcf5ef2aSThomas Huth #endif 2132fcf5ef2aSThomas Huth } 2133fcf5ef2aSThomas Huth 2134fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_1 0xC 2135fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_2 0xF 2136fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_1 0xA 2137fcf5ef2aSThomas Huth #define BCD_NEG_PREF 0xD 2138fcf5ef2aSThomas Huth #define BCD_NEG_ALT 0xB 2139fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_2 0xE 2140fcf5ef2aSThomas Huth #define NATIONAL_PLUS 0x2B 2141fcf5ef2aSThomas Huth #define NATIONAL_NEG 0x2D 2142fcf5ef2aSThomas Huth 2143365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) (15 - ((n) / 2)) 2144fcf5ef2aSThomas Huth 2145fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd) 2146fcf5ef2aSThomas Huth { 2147428115c3SMark Cave-Ayland switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) { 2148fcf5ef2aSThomas Huth case BCD_PLUS_PREF_1: 2149fcf5ef2aSThomas Huth case BCD_PLUS_PREF_2: 2150fcf5ef2aSThomas Huth case BCD_PLUS_ALT_1: 2151fcf5ef2aSThomas Huth case BCD_PLUS_ALT_2: 2152fcf5ef2aSThomas Huth { 2153fcf5ef2aSThomas Huth return 1; 2154fcf5ef2aSThomas Huth } 2155fcf5ef2aSThomas Huth 2156fcf5ef2aSThomas Huth case BCD_NEG_PREF: 2157fcf5ef2aSThomas Huth case BCD_NEG_ALT: 2158fcf5ef2aSThomas Huth { 2159fcf5ef2aSThomas Huth return -1; 2160fcf5ef2aSThomas Huth } 2161fcf5ef2aSThomas Huth 2162fcf5ef2aSThomas Huth default: 2163fcf5ef2aSThomas Huth { 2164fcf5ef2aSThomas Huth return 0; 2165fcf5ef2aSThomas Huth } 2166fcf5ef2aSThomas Huth } 2167fcf5ef2aSThomas Huth } 2168fcf5ef2aSThomas Huth 2169fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps) 2170fcf5ef2aSThomas Huth { 2171fcf5ef2aSThomas Huth if (sgn >= 0) { 2172fcf5ef2aSThomas Huth return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2; 2173fcf5ef2aSThomas Huth } else { 2174fcf5ef2aSThomas Huth return BCD_NEG_PREF; 2175fcf5ef2aSThomas Huth } 2176fcf5ef2aSThomas Huth } 2177fcf5ef2aSThomas Huth 2178fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid) 2179fcf5ef2aSThomas Huth { 2180fcf5ef2aSThomas Huth uint8_t result; 2181fcf5ef2aSThomas Huth if (n & 1) { 2182428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4; 2183fcf5ef2aSThomas Huth } else { 2184428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF; 2185fcf5ef2aSThomas Huth } 2186fcf5ef2aSThomas Huth 2187fcf5ef2aSThomas Huth if (unlikely(result > 9)) { 2188fcf5ef2aSThomas Huth *invalid = true; 2189fcf5ef2aSThomas Huth } 2190fcf5ef2aSThomas Huth return result; 2191fcf5ef2aSThomas Huth } 2192fcf5ef2aSThomas Huth 2193fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n) 2194fcf5ef2aSThomas Huth { 2195fcf5ef2aSThomas Huth if (n & 1) { 2196428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F; 2197428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4); 2198fcf5ef2aSThomas Huth } else { 2199428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0; 2200428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= digit; 2201fcf5ef2aSThomas Huth } 2202fcf5ef2aSThomas Huth } 2203fcf5ef2aSThomas Huth 2204071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd) 2205071663dfSJose Ricardo Ziviani { 2206071663dfSJose Ricardo Ziviani int i; 2207071663dfSJose Ricardo Ziviani int invalid = 0; 2208071663dfSJose Ricardo Ziviani 2209071663dfSJose Ricardo Ziviani if (bcd_get_sgn(bcd) == 0) { 2210071663dfSJose Ricardo Ziviani return false; 2211071663dfSJose Ricardo Ziviani } 2212071663dfSJose Ricardo Ziviani 2213071663dfSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2214071663dfSJose Ricardo Ziviani bcd_get_digit(bcd, i, &invalid); 2215071663dfSJose Ricardo Ziviani if (unlikely(invalid)) { 2216071663dfSJose Ricardo Ziviani return false; 2217071663dfSJose Ricardo Ziviani } 2218071663dfSJose Ricardo Ziviani } 2219071663dfSJose Ricardo Ziviani return true; 2220071663dfSJose Ricardo Ziviani } 2221071663dfSJose Ricardo Ziviani 2222fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd) 2223fcf5ef2aSThomas Huth { 22243c385a93SMark Cave-Ayland if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) { 2225efa73196SNikunj A Dadhania return CRF_EQ; 2226fcf5ef2aSThomas Huth } else { 2227efa73196SNikunj A Dadhania return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT; 2228fcf5ef2aSThomas Huth } 2229fcf5ef2aSThomas Huth } 2230fcf5ef2aSThomas Huth 2231fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n) 2232fcf5ef2aSThomas Huth { 223360594feaSMark Cave-Ayland return reg->VsrH(7 - n); 2234fcf5ef2aSThomas Huth } 2235fcf5ef2aSThomas Huth 2236fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n) 2237fcf5ef2aSThomas Huth { 223860594feaSMark Cave-Ayland reg->VsrH(7 - n) = val; 2239fcf5ef2aSThomas Huth } 2240fcf5ef2aSThomas Huth 2241fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b) 2242fcf5ef2aSThomas Huth { 2243fcf5ef2aSThomas Huth int i; 2244fcf5ef2aSThomas Huth int invalid = 0; 2245fcf5ef2aSThomas Huth for (i = 31; i > 0; i--) { 2246fcf5ef2aSThomas Huth uint8_t dig_a = bcd_get_digit(a, i, &invalid); 2247fcf5ef2aSThomas Huth uint8_t dig_b = bcd_get_digit(b, i, &invalid); 2248fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2249fcf5ef2aSThomas Huth return 0; /* doesn't matter */ 2250fcf5ef2aSThomas Huth } else if (dig_a > dig_b) { 2251fcf5ef2aSThomas Huth return 1; 2252fcf5ef2aSThomas Huth } else if (dig_a < dig_b) { 2253fcf5ef2aSThomas Huth return -1; 2254fcf5ef2aSThomas Huth } 2255fcf5ef2aSThomas Huth } 2256fcf5ef2aSThomas Huth 2257fcf5ef2aSThomas Huth return 0; 2258fcf5ef2aSThomas Huth } 2259fcf5ef2aSThomas Huth 2260936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2261fcf5ef2aSThomas Huth int *overflow) 2262fcf5ef2aSThomas Huth { 2263fcf5ef2aSThomas Huth int carry = 0; 2264fcf5ef2aSThomas Huth int i; 2265936fda4dSFabiano Rosas int is_zero = 1; 2266936fda4dSFabiano Rosas 2267fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2268fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) + 2269fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2270936fda4dSFabiano Rosas is_zero &= (digit == 0); 2271fcf5ef2aSThomas Huth if (digit > 9) { 2272fcf5ef2aSThomas Huth carry = 1; 2273fcf5ef2aSThomas Huth digit -= 10; 2274fcf5ef2aSThomas Huth } else { 2275fcf5ef2aSThomas Huth carry = 0; 2276fcf5ef2aSThomas Huth } 2277fcf5ef2aSThomas Huth 2278fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2279fcf5ef2aSThomas Huth } 2280fcf5ef2aSThomas Huth 2281fcf5ef2aSThomas Huth *overflow = carry; 2282936fda4dSFabiano Rosas return is_zero; 2283fcf5ef2aSThomas Huth } 2284fcf5ef2aSThomas Huth 2285d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2286fcf5ef2aSThomas Huth int *overflow) 2287fcf5ef2aSThomas Huth { 2288fcf5ef2aSThomas Huth int carry = 0; 2289fcf5ef2aSThomas Huth int i; 2290d03b174aSYasmin Beatriz 2291fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2292fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) - 2293fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2294fcf5ef2aSThomas Huth if (digit & 0x80) { 2295fcf5ef2aSThomas Huth carry = -1; 2296fcf5ef2aSThomas Huth digit += 10; 2297fcf5ef2aSThomas Huth } else { 2298fcf5ef2aSThomas Huth carry = 0; 2299fcf5ef2aSThomas Huth } 2300fcf5ef2aSThomas Huth 2301fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2302fcf5ef2aSThomas Huth } 2303fcf5ef2aSThomas Huth 2304fcf5ef2aSThomas Huth *overflow = carry; 2305fcf5ef2aSThomas Huth } 2306fcf5ef2aSThomas Huth 2307fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2308fcf5ef2aSThomas Huth { 2309fcf5ef2aSThomas Huth 2310fcf5ef2aSThomas Huth int sgna = bcd_get_sgn(a); 2311fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2312fcf5ef2aSThomas Huth int invalid = (sgna == 0) || (sgnb == 0); 2313fcf5ef2aSThomas Huth int overflow = 0; 2314936fda4dSFabiano Rosas int zero = 0; 2315fcf5ef2aSThomas Huth uint32_t cr = 0; 2316fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 2317fcf5ef2aSThomas Huth 2318fcf5ef2aSThomas Huth if (!invalid) { 2319fcf5ef2aSThomas Huth if (sgna == sgnb) { 2320428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2321936fda4dSFabiano Rosas zero = bcd_add_mag(&result, a, b, &invalid, &overflow); 2322936fda4dSFabiano Rosas cr = (sgna > 0) ? CRF_GT : CRF_LT; 2323fcf5ef2aSThomas Huth } else { 2324d03b174aSYasmin Beatriz int magnitude = bcd_cmp_mag(a, b); 2325d03b174aSYasmin Beatriz if (magnitude > 0) { 2326428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2327d03b174aSYasmin Beatriz bcd_sub_mag(&result, a, b, &invalid, &overflow); 2328d03b174aSYasmin Beatriz cr = (sgna > 0) ? CRF_GT : CRF_LT; 2329d03b174aSYasmin Beatriz } else if (magnitude < 0) { 2330428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps); 2331d03b174aSYasmin Beatriz bcd_sub_mag(&result, b, a, &invalid, &overflow); 2332efa73196SNikunj A Dadhania cr = (sgnb > 0) ? CRF_GT : CRF_LT; 2333d03b174aSYasmin Beatriz } else { 2334428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps); 2335d03b174aSYasmin Beatriz cr = CRF_EQ; 2336d03b174aSYasmin Beatriz } 2337fcf5ef2aSThomas Huth } 2338fcf5ef2aSThomas Huth } 2339fcf5ef2aSThomas Huth 2340fcf5ef2aSThomas Huth if (unlikely(invalid)) { 23413c385a93SMark Cave-Ayland result.VsrD(0) = result.VsrD(1) = -1; 2342efa73196SNikunj A Dadhania cr = CRF_SO; 2343fcf5ef2aSThomas Huth } else if (overflow) { 2344efa73196SNikunj A Dadhania cr |= CRF_SO; 2345936fda4dSFabiano Rosas } else if (zero) { 2346936fda4dSFabiano Rosas cr |= CRF_EQ; 2347fcf5ef2aSThomas Huth } 2348fcf5ef2aSThomas Huth 2349fcf5ef2aSThomas Huth *r = result; 2350fcf5ef2aSThomas Huth 2351fcf5ef2aSThomas Huth return cr; 2352fcf5ef2aSThomas Huth } 2353fcf5ef2aSThomas Huth 2354fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2355fcf5ef2aSThomas Huth { 2356fcf5ef2aSThomas Huth ppc_avr_t bcopy = *b; 2357fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2358fcf5ef2aSThomas Huth if (sgnb < 0) { 2359fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0); 2360fcf5ef2aSThomas Huth } else if (sgnb > 0) { 2361fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_NEG_PREF, 0); 2362fcf5ef2aSThomas Huth } 2363fcf5ef2aSThomas Huth /* else invalid ... defer to bcdadd code for proper handling */ 2364fcf5ef2aSThomas Huth 2365fcf5ef2aSThomas Huth return helper_bcdadd(r, a, &bcopy, ps); 2366fcf5ef2aSThomas Huth } 2367fcf5ef2aSThomas Huth 2368fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2369fcf5ef2aSThomas Huth { 2370fcf5ef2aSThomas Huth int i; 2371fcf5ef2aSThomas Huth int cr = 0; 2372fcf5ef2aSThomas Huth uint16_t national = 0; 2373fcf5ef2aSThomas Huth uint16_t sgnb = get_national_digit(b, 0); 2374fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2375fcf5ef2aSThomas Huth int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG); 2376fcf5ef2aSThomas Huth 2377fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2378fcf5ef2aSThomas Huth national = get_national_digit(b, i); 2379fcf5ef2aSThomas Huth if (unlikely(national < 0x30 || national > 0x39)) { 2380fcf5ef2aSThomas Huth invalid = 1; 2381fcf5ef2aSThomas Huth break; 2382fcf5ef2aSThomas Huth } 2383fcf5ef2aSThomas Huth 2384fcf5ef2aSThomas Huth bcd_put_digit(&ret, national & 0xf, i); 2385fcf5ef2aSThomas Huth } 2386fcf5ef2aSThomas Huth 2387fcf5ef2aSThomas Huth if (sgnb == NATIONAL_PLUS) { 2388fcf5ef2aSThomas Huth bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0); 2389fcf5ef2aSThomas Huth } else { 2390fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2391fcf5ef2aSThomas Huth } 2392fcf5ef2aSThomas Huth 2393fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2394fcf5ef2aSThomas Huth 2395fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2396efa73196SNikunj A Dadhania cr = CRF_SO; 2397fcf5ef2aSThomas Huth } 2398fcf5ef2aSThomas Huth 2399fcf5ef2aSThomas Huth *r = ret; 2400fcf5ef2aSThomas Huth 2401fcf5ef2aSThomas Huth return cr; 2402fcf5ef2aSThomas Huth } 2403fcf5ef2aSThomas Huth 2404fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2405fcf5ef2aSThomas Huth { 2406fcf5ef2aSThomas Huth int i; 2407fcf5ef2aSThomas Huth int cr = 0; 2408fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2409fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2410fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2411fcf5ef2aSThomas Huth 24123c385a93SMark Cave-Ayland int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0); 2413fcf5ef2aSThomas Huth 2414fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2415fcf5ef2aSThomas Huth set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i); 2416fcf5ef2aSThomas Huth 2417fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2418fcf5ef2aSThomas Huth break; 2419fcf5ef2aSThomas Huth } 2420fcf5ef2aSThomas Huth } 2421fcf5ef2aSThomas Huth set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0); 2422fcf5ef2aSThomas Huth 2423fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2424fcf5ef2aSThomas Huth 2425fcf5ef2aSThomas Huth if (ox_flag) { 2426efa73196SNikunj A Dadhania cr |= CRF_SO; 2427fcf5ef2aSThomas Huth } 2428fcf5ef2aSThomas Huth 2429fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2430efa73196SNikunj A Dadhania cr = CRF_SO; 2431fcf5ef2aSThomas Huth } 2432fcf5ef2aSThomas Huth 2433fcf5ef2aSThomas Huth *r = ret; 2434fcf5ef2aSThomas Huth 2435fcf5ef2aSThomas Huth return cr; 2436fcf5ef2aSThomas Huth } 2437fcf5ef2aSThomas Huth 2438fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2439fcf5ef2aSThomas Huth { 2440fcf5ef2aSThomas Huth int i; 2441fcf5ef2aSThomas Huth int cr = 0; 2442fcf5ef2aSThomas Huth int invalid = 0; 2443fcf5ef2aSThomas Huth int zone_digit = 0; 2444fcf5ef2aSThomas Huth int zone_lead = ps ? 0xF : 0x3; 2445fcf5ef2aSThomas Huth int digit = 0; 2446fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2447428115c3SMark Cave-Ayland int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4; 2448fcf5ef2aSThomas Huth 2449fcf5ef2aSThomas Huth if (unlikely((sgnb < 0xA) && ps)) { 2450fcf5ef2aSThomas Huth invalid = 1; 2451fcf5ef2aSThomas Huth } 2452fcf5ef2aSThomas Huth 2453fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2454428115c3SMark Cave-Ayland zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead; 2455428115c3SMark Cave-Ayland digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF; 2456fcf5ef2aSThomas Huth if (unlikely(zone_digit != zone_lead || digit > 0x9)) { 2457fcf5ef2aSThomas Huth invalid = 1; 2458fcf5ef2aSThomas Huth break; 2459fcf5ef2aSThomas Huth } 2460fcf5ef2aSThomas Huth 2461fcf5ef2aSThomas Huth bcd_put_digit(&ret, digit, i + 1); 2462fcf5ef2aSThomas Huth } 2463fcf5ef2aSThomas Huth 2464fcf5ef2aSThomas Huth if ((ps && (sgnb == 0xB || sgnb == 0xD)) || 2465fcf5ef2aSThomas Huth (!ps && (sgnb & 0x4))) { 2466fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2467fcf5ef2aSThomas Huth } else { 2468fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0); 2469fcf5ef2aSThomas Huth } 2470fcf5ef2aSThomas Huth 2471fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2472fcf5ef2aSThomas Huth 2473fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2474efa73196SNikunj A Dadhania cr = CRF_SO; 2475fcf5ef2aSThomas Huth } 2476fcf5ef2aSThomas Huth 2477fcf5ef2aSThomas Huth *r = ret; 2478fcf5ef2aSThomas Huth 2479fcf5ef2aSThomas Huth return cr; 2480fcf5ef2aSThomas Huth } 2481fcf5ef2aSThomas Huth 2482fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2483fcf5ef2aSThomas Huth { 2484fcf5ef2aSThomas Huth int i; 2485fcf5ef2aSThomas Huth int cr = 0; 2486fcf5ef2aSThomas Huth uint8_t digit = 0; 2487fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2488fcf5ef2aSThomas Huth int zone_lead = (ps) ? 0xF0 : 0x30; 2489fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2490fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2491fcf5ef2aSThomas Huth 24923c385a93SMark Cave-Ayland int ox_flag = ((b->VsrD(0) >> 4) != 0); 2493fcf5ef2aSThomas Huth 2494fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2495fcf5ef2aSThomas Huth digit = bcd_get_digit(b, i + 1, &invalid); 2496fcf5ef2aSThomas Huth 2497fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2498fcf5ef2aSThomas Huth break; 2499fcf5ef2aSThomas Huth } 2500fcf5ef2aSThomas Huth 2501428115c3SMark Cave-Ayland ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit; 2502fcf5ef2aSThomas Huth } 2503fcf5ef2aSThomas Huth 2504fcf5ef2aSThomas Huth if (ps) { 2505fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1); 2506fcf5ef2aSThomas Huth } else { 2507fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1); 2508fcf5ef2aSThomas Huth } 2509fcf5ef2aSThomas Huth 2510fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2511fcf5ef2aSThomas Huth 2512fcf5ef2aSThomas Huth if (ox_flag) { 2513efa73196SNikunj A Dadhania cr |= CRF_SO; 2514fcf5ef2aSThomas Huth } 2515fcf5ef2aSThomas Huth 2516fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2517efa73196SNikunj A Dadhania cr = CRF_SO; 2518fcf5ef2aSThomas Huth } 2519fcf5ef2aSThomas Huth 2520fcf5ef2aSThomas Huth *r = ret; 2521fcf5ef2aSThomas Huth 2522fcf5ef2aSThomas Huth return cr; 2523fcf5ef2aSThomas Huth } 2524fcf5ef2aSThomas Huth 2525a3d67f3eSLuis Pires /** 2526a3d67f3eSLuis Pires * Compare 2 128-bit unsigned integers, passed in as unsigned 64-bit pairs 2527a3d67f3eSLuis Pires * 2528a3d67f3eSLuis Pires * Returns: 2529a3d67f3eSLuis Pires * > 0 if ahi|alo > bhi|blo, 2530a3d67f3eSLuis Pires * 0 if ahi|alo == bhi|blo, 2531a3d67f3eSLuis Pires * < 0 if ahi|alo < bhi|blo 2532a3d67f3eSLuis Pires */ 2533a3d67f3eSLuis Pires static inline int ucmp128(uint64_t alo, uint64_t ahi, 2534a3d67f3eSLuis Pires uint64_t blo, uint64_t bhi) 2535a3d67f3eSLuis Pires { 2536a3d67f3eSLuis Pires return (ahi == bhi) ? 2537a3d67f3eSLuis Pires (alo > blo ? 1 : (alo == blo ? 0 : -1)) : 2538a3d67f3eSLuis Pires (ahi > bhi ? 1 : -1); 2539a3d67f3eSLuis Pires } 2540a3d67f3eSLuis Pires 2541a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2542a406c058SJose Ricardo Ziviani { 2543a406c058SJose Ricardo Ziviani int i; 2544a3d67f3eSLuis Pires int cr; 2545a406c058SJose Ricardo Ziviani uint64_t lo_value; 2546a406c058SJose Ricardo Ziviani uint64_t hi_value; 254740f3e79aSLuis Pires uint64_t rem; 2548a406c058SJose Ricardo Ziviani ppc_avr_t ret = { .u64 = { 0, 0 } }; 2549a406c058SJose Ricardo Ziviani 25503c385a93SMark Cave-Ayland if (b->VsrSD(0) < 0) { 25513c385a93SMark Cave-Ayland lo_value = -b->VsrSD(1); 25523c385a93SMark Cave-Ayland hi_value = ~b->VsrD(0) + !lo_value; 2553a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, 0xD, 0); 2554a3d67f3eSLuis Pires 2555a3d67f3eSLuis Pires cr = CRF_LT; 2556a406c058SJose Ricardo Ziviani } else { 25573c385a93SMark Cave-Ayland lo_value = b->VsrD(1); 25583c385a93SMark Cave-Ayland hi_value = b->VsrD(0); 2559a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0); 2560a3d67f3eSLuis Pires 2561a3d67f3eSLuis Pires if (hi_value == 0 && lo_value == 0) { 2562a3d67f3eSLuis Pires cr = CRF_EQ; 2563a3d67f3eSLuis Pires } else { 2564a3d67f3eSLuis Pires cr = CRF_GT; 2565a3d67f3eSLuis Pires } 2566a406c058SJose Ricardo Ziviani } 2567a406c058SJose Ricardo Ziviani 2568a3d67f3eSLuis Pires /* 2569a3d67f3eSLuis Pires * Check src limits: abs(src) <= 10^31 - 1 2570a3d67f3eSLuis Pires * 2571a3d67f3eSLuis Pires * 10^31 - 1 = 0x0000007e37be2022 c0914b267fffffff 2572a3d67f3eSLuis Pires */ 2573a3d67f3eSLuis Pires if (ucmp128(lo_value, hi_value, 2574a3d67f3eSLuis Pires 0xc0914b267fffffffULL, 0x7e37be2022ULL) > 0) { 2575a3d67f3eSLuis Pires cr |= CRF_SO; 2576a3d67f3eSLuis Pires 2577a3d67f3eSLuis Pires /* 2578a3d67f3eSLuis Pires * According to the ISA, if src wouldn't fit in the destination 2579a3d67f3eSLuis Pires * register, the result is undefined. 2580a3d67f3eSLuis Pires * In that case, we leave r unchanged. 2581a3d67f3eSLuis Pires */ 2582a3d67f3eSLuis Pires } else { 258340f3e79aSLuis Pires rem = divu128(&lo_value, &hi_value, 1000000000000000ULL); 2584a406c058SJose Ricardo Ziviani 258540f3e79aSLuis Pires for (i = 1; i < 16; rem /= 10, i++) { 258640f3e79aSLuis Pires bcd_put_digit(&ret, rem % 10, i); 2587a406c058SJose Ricardo Ziviani } 2588a406c058SJose Ricardo Ziviani 2589a406c058SJose Ricardo Ziviani for (; i < 32; lo_value /= 10, i++) { 2590a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, lo_value % 10, i); 2591a406c058SJose Ricardo Ziviani } 2592a406c058SJose Ricardo Ziviani 2593a406c058SJose Ricardo Ziviani *r = ret; 2594a3d67f3eSLuis Pires } 2595a406c058SJose Ricardo Ziviani 2596a406c058SJose Ricardo Ziviani return cr; 2597a406c058SJose Ricardo Ziviani } 2598a406c058SJose Ricardo Ziviani 2599c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2600c85bc7ddSJose Ricardo Ziviani { 2601c85bc7ddSJose Ricardo Ziviani uint8_t i; 2602c85bc7ddSJose Ricardo Ziviani int cr; 2603c85bc7ddSJose Ricardo Ziviani uint64_t carry; 2604c85bc7ddSJose Ricardo Ziviani uint64_t unused; 2605c85bc7ddSJose Ricardo Ziviani uint64_t lo_value; 2606c85bc7ddSJose Ricardo Ziviani uint64_t hi_value = 0; 2607c85bc7ddSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2608c85bc7ddSJose Ricardo Ziviani int invalid = (sgnb == 0); 2609c85bc7ddSJose Ricardo Ziviani 2610c85bc7ddSJose Ricardo Ziviani lo_value = bcd_get_digit(b, 31, &invalid); 2611c85bc7ddSJose Ricardo Ziviani for (i = 30; i > 0; i--) { 2612c85bc7ddSJose Ricardo Ziviani mulu64(&lo_value, &carry, lo_value, 10ULL); 2613c85bc7ddSJose Ricardo Ziviani mulu64(&hi_value, &unused, hi_value, 10ULL); 2614c85bc7ddSJose Ricardo Ziviani lo_value += bcd_get_digit(b, i, &invalid); 2615c85bc7ddSJose Ricardo Ziviani hi_value += carry; 2616c85bc7ddSJose Ricardo Ziviani 2617c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2618c85bc7ddSJose Ricardo Ziviani break; 2619c85bc7ddSJose Ricardo Ziviani } 2620c85bc7ddSJose Ricardo Ziviani } 2621c85bc7ddSJose Ricardo Ziviani 2622c85bc7ddSJose Ricardo Ziviani if (sgnb == -1) { 26233c385a93SMark Cave-Ayland r->VsrSD(1) = -lo_value; 26243c385a93SMark Cave-Ayland r->VsrSD(0) = ~hi_value + !r->VsrSD(1); 2625c85bc7ddSJose Ricardo Ziviani } else { 26263c385a93SMark Cave-Ayland r->VsrSD(1) = lo_value; 26273c385a93SMark Cave-Ayland r->VsrSD(0) = hi_value; 2628c85bc7ddSJose Ricardo Ziviani } 2629c85bc7ddSJose Ricardo Ziviani 2630c85bc7ddSJose Ricardo Ziviani cr = bcd_cmp_zero(b); 2631c85bc7ddSJose Ricardo Ziviani 2632c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2633c85bc7ddSJose Ricardo Ziviani cr = CRF_SO; 2634c85bc7ddSJose Ricardo Ziviani } 2635c85bc7ddSJose Ricardo Ziviani 2636c85bc7ddSJose Ricardo Ziviani return cr; 2637c85bc7ddSJose Ricardo Ziviani } 2638c85bc7ddSJose Ricardo Ziviani 2639c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2640c3025c3bSJose Ricardo Ziviani { 2641c3025c3bSJose Ricardo Ziviani int i; 2642c3025c3bSJose Ricardo Ziviani int invalid = 0; 2643c3025c3bSJose Ricardo Ziviani 2644c3025c3bSJose Ricardo Ziviani if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) { 2645c3025c3bSJose Ricardo Ziviani return CRF_SO; 2646c3025c3bSJose Ricardo Ziviani } 2647c3025c3bSJose Ricardo Ziviani 2648c3025c3bSJose Ricardo Ziviani *r = *a; 2649428115c3SMark Cave-Ayland bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0); 2650c3025c3bSJose Ricardo Ziviani 2651c3025c3bSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2652c3025c3bSJose Ricardo Ziviani bcd_get_digit(a, i, &invalid); 2653c3025c3bSJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2654c3025c3bSJose Ricardo Ziviani if (unlikely(invalid)) { 2655c3025c3bSJose Ricardo Ziviani return CRF_SO; 2656c3025c3bSJose Ricardo Ziviani } 2657c3025c3bSJose Ricardo Ziviani } 2658c3025c3bSJose Ricardo Ziviani 2659c3025c3bSJose Ricardo Ziviani return bcd_cmp_zero(r); 2660c3025c3bSJose Ricardo Ziviani } 2661c3025c3bSJose Ricardo Ziviani 2662466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2663466a3f9cSJose Ricardo Ziviani { 2664466a3f9cSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2665466a3f9cSJose Ricardo Ziviani 2666466a3f9cSJose Ricardo Ziviani *r = *b; 2667466a3f9cSJose Ricardo Ziviani bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0); 2668466a3f9cSJose Ricardo Ziviani 2669071663dfSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2670466a3f9cSJose Ricardo Ziviani return CRF_SO; 2671466a3f9cSJose Ricardo Ziviani } 2672466a3f9cSJose Ricardo Ziviani 2673466a3f9cSJose Ricardo Ziviani return bcd_cmp_zero(r); 2674466a3f9cSJose Ricardo Ziviani } 2675466a3f9cSJose Ricardo Ziviani 2676e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2677e04797f7SJose Ricardo Ziviani { 2678e04797f7SJose Ricardo Ziviani int cr; 2679428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2680e04797f7SJose Ricardo Ziviani bool ox_flag = false; 2681e04797f7SJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2682e04797f7SJose Ricardo Ziviani ppc_avr_t ret = *b; 26833c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2684e04797f7SJose Ricardo Ziviani 2685e04797f7SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2686e04797f7SJose Ricardo Ziviani return CRF_SO; 2687e04797f7SJose Ricardo Ziviani } 2688e04797f7SJose Ricardo Ziviani 2689e04797f7SJose Ricardo Ziviani if (unlikely(i > 31)) { 2690e04797f7SJose Ricardo Ziviani i = 31; 2691e04797f7SJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2692e04797f7SJose Ricardo Ziviani i = -31; 2693e04797f7SJose Ricardo Ziviani } 2694e04797f7SJose Ricardo Ziviani 2695e04797f7SJose Ricardo Ziviani if (i > 0) { 26963c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2697e04797f7SJose Ricardo Ziviani } else { 26983c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2699e04797f7SJose Ricardo Ziviani } 2700e04797f7SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2701e04797f7SJose Ricardo Ziviani 2702e04797f7SJose Ricardo Ziviani *r = ret; 2703e04797f7SJose Ricardo Ziviani 2704e04797f7SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2705e04797f7SJose Ricardo Ziviani if (ox_flag) { 2706e04797f7SJose Ricardo Ziviani cr |= CRF_SO; 2707e04797f7SJose Ricardo Ziviani } 2708e04797f7SJose Ricardo Ziviani 2709e04797f7SJose Ricardo Ziviani return cr; 2710e04797f7SJose Ricardo Ziviani } 2711e04797f7SJose Ricardo Ziviani 2712a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2713a49a95e9SJose Ricardo Ziviani { 2714a49a95e9SJose Ricardo Ziviani int cr; 2715a49a95e9SJose Ricardo Ziviani int i; 2716a49a95e9SJose Ricardo Ziviani int invalid = 0; 2717a49a95e9SJose Ricardo Ziviani bool ox_flag = false; 2718a49a95e9SJose Ricardo Ziviani ppc_avr_t ret = *b; 2719a49a95e9SJose Ricardo Ziviani 2720a49a95e9SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 2721a49a95e9SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2722a49a95e9SJose Ricardo Ziviani 2723a49a95e9SJose Ricardo Ziviani if (unlikely(invalid)) { 2724a49a95e9SJose Ricardo Ziviani return CRF_SO; 2725a49a95e9SJose Ricardo Ziviani } 2726a49a95e9SJose Ricardo Ziviani } 2727a49a95e9SJose Ricardo Ziviani 2728428115c3SMark Cave-Ayland i = a->VsrSB(7); 2729a49a95e9SJose Ricardo Ziviani if (i >= 32) { 2730a49a95e9SJose Ricardo Ziviani ox_flag = true; 27313c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2732a49a95e9SJose Ricardo Ziviani } else if (i <= -32) { 27333c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2734a49a95e9SJose Ricardo Ziviani } else if (i > 0) { 27353c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2736a49a95e9SJose Ricardo Ziviani } else { 27373c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2738a49a95e9SJose Ricardo Ziviani } 2739a49a95e9SJose Ricardo Ziviani *r = ret; 2740a49a95e9SJose Ricardo Ziviani 2741a49a95e9SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2742a49a95e9SJose Ricardo Ziviani if (ox_flag) { 2743a49a95e9SJose Ricardo Ziviani cr |= CRF_SO; 2744a49a95e9SJose Ricardo Ziviani } 2745a49a95e9SJose Ricardo Ziviani 2746a49a95e9SJose Ricardo Ziviani return cr; 2747a49a95e9SJose Ricardo Ziviani } 2748a49a95e9SJose Ricardo Ziviani 2749a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2750a54238adSJose Ricardo Ziviani { 2751a54238adSJose Ricardo Ziviani int cr; 2752a54238adSJose Ricardo Ziviani int unused = 0; 2753a54238adSJose Ricardo Ziviani int invalid = 0; 2754a54238adSJose Ricardo Ziviani bool ox_flag = false; 2755a54238adSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2756a54238adSJose Ricardo Ziviani ppc_avr_t ret = *b; 27573c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2758a54238adSJose Ricardo Ziviani 2759428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2760428115c3SMark Cave-Ayland ppc_avr_t bcd_one; 2761428115c3SMark Cave-Ayland 2762428115c3SMark Cave-Ayland bcd_one.VsrD(0) = 0; 2763428115c3SMark Cave-Ayland bcd_one.VsrD(1) = 0x10; 2764a54238adSJose Ricardo Ziviani 2765a54238adSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2766a54238adSJose Ricardo Ziviani return CRF_SO; 2767a54238adSJose Ricardo Ziviani } 2768a54238adSJose Ricardo Ziviani 2769a54238adSJose Ricardo Ziviani if (unlikely(i > 31)) { 2770a54238adSJose Ricardo Ziviani i = 31; 2771a54238adSJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2772a54238adSJose Ricardo Ziviani i = -31; 2773a54238adSJose Ricardo Ziviani } 2774a54238adSJose Ricardo Ziviani 2775a54238adSJose Ricardo Ziviani if (i > 0) { 27763c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2777a54238adSJose Ricardo Ziviani } else { 27783c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2779a54238adSJose Ricardo Ziviani 2780a54238adSJose Ricardo Ziviani if (bcd_get_digit(&ret, 0, &invalid) >= 5) { 2781a54238adSJose Ricardo Ziviani bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused); 2782a54238adSJose Ricardo Ziviani } 2783a54238adSJose Ricardo Ziviani } 2784a54238adSJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2785a54238adSJose Ricardo Ziviani 2786a54238adSJose Ricardo Ziviani cr = bcd_cmp_zero(&ret); 2787a54238adSJose Ricardo Ziviani if (ox_flag) { 2788a54238adSJose Ricardo Ziviani cr |= CRF_SO; 2789a54238adSJose Ricardo Ziviani } 2790a54238adSJose Ricardo Ziviani *r = ret; 2791a54238adSJose Ricardo Ziviani 2792a54238adSJose Ricardo Ziviani return cr; 2793a54238adSJose Ricardo Ziviani } 2794a54238adSJose Ricardo Ziviani 279531bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 279631bc4d11SJose Ricardo Ziviani { 279731bc4d11SJose Ricardo Ziviani uint64_t mask; 279831bc4d11SJose Ricardo Ziviani uint32_t ox_flag = 0; 2799428115c3SMark Cave-Ayland int i = a->VsrSH(3) + 1; 280031bc4d11SJose Ricardo Ziviani ppc_avr_t ret = *b; 280131bc4d11SJose Ricardo Ziviani 280231bc4d11SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 280331bc4d11SJose Ricardo Ziviani return CRF_SO; 280431bc4d11SJose Ricardo Ziviani } 280531bc4d11SJose Ricardo Ziviani 280631bc4d11SJose Ricardo Ziviani if (i > 16 && i < 32) { 280731bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 28083c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 280931bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 281031bc4d11SJose Ricardo Ziviani } 281131bc4d11SJose Ricardo Ziviani 28123c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 281331bc4d11SJose Ricardo Ziviani } else if (i >= 0 && i <= 16) { 281431bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 28153c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 281631bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 281731bc4d11SJose Ricardo Ziviani } 281831bc4d11SJose Ricardo Ziviani 28193c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 28203c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 282131bc4d11SJose Ricardo Ziviani } 282231bc4d11SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0); 282331bc4d11SJose Ricardo Ziviani *r = ret; 282431bc4d11SJose Ricardo Ziviani 282531bc4d11SJose Ricardo Ziviani return bcd_cmp_zero(&ret) | ox_flag; 282631bc4d11SJose Ricardo Ziviani } 282731bc4d11SJose Ricardo Ziviani 28285c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 28295c32e2e4SJose Ricardo Ziviani { 28305c32e2e4SJose Ricardo Ziviani int i; 28315c32e2e4SJose Ricardo Ziviani uint64_t mask; 28325c32e2e4SJose Ricardo Ziviani uint32_t ox_flag = 0; 28335c32e2e4SJose Ricardo Ziviani int invalid = 0; 28345c32e2e4SJose Ricardo Ziviani ppc_avr_t ret = *b; 28355c32e2e4SJose Ricardo Ziviani 28365c32e2e4SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 28375c32e2e4SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 28385c32e2e4SJose Ricardo Ziviani 28395c32e2e4SJose Ricardo Ziviani if (unlikely(invalid)) { 28405c32e2e4SJose Ricardo Ziviani return CRF_SO; 28415c32e2e4SJose Ricardo Ziviani } 28425c32e2e4SJose Ricardo Ziviani } 28435c32e2e4SJose Ricardo Ziviani 2844428115c3SMark Cave-Ayland i = a->VsrSH(3); 28455c32e2e4SJose Ricardo Ziviani if (i > 16 && i < 33) { 28465c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 28473c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 28485c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 28495c32e2e4SJose Ricardo Ziviani } 28505c32e2e4SJose Ricardo Ziviani 28513c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 28525c32e2e4SJose Ricardo Ziviani } else if (i > 0 && i <= 16) { 28535c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 28543c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 28555c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 28565c32e2e4SJose Ricardo Ziviani } 28575c32e2e4SJose Ricardo Ziviani 28583c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 28593c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 28605c32e2e4SJose Ricardo Ziviani } else if (i == 0) { 28613c385a93SMark Cave-Ayland if (ret.VsrD(0) || ret.VsrD(1)) { 28625c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 28635c32e2e4SJose Ricardo Ziviani } 28643c385a93SMark Cave-Ayland ret.VsrD(0) = ret.VsrD(1) = 0; 28655c32e2e4SJose Ricardo Ziviani } 28665c32e2e4SJose Ricardo Ziviani 28675c32e2e4SJose Ricardo Ziviani *r = ret; 28683c385a93SMark Cave-Ayland if (r->VsrD(0) == 0 && r->VsrD(1) == 0) { 28695c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_EQ; 28705c32e2e4SJose Ricardo Ziviani } 28715c32e2e4SJose Ricardo Ziviani 28725c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_GT; 28735c32e2e4SJose Ricardo Ziviani } 28745c32e2e4SJose Ricardo Ziviani 2875fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a) 2876fcf5ef2aSThomas Huth { 2877fcf5ef2aSThomas Huth int i; 2878fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 2879fcf5ef2aSThomas Huth r->u8[i] = AES_sbox[a->u8[i]]; 2880fcf5ef2aSThomas Huth } 2881fcf5ef2aSThomas Huth } 2882fcf5ef2aSThomas Huth 2883fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2884fcf5ef2aSThomas Huth { 2885fcf5ef2aSThomas Huth ppc_avr_t result; 2886fcf5ef2aSThomas Huth int i; 2887fcf5ef2aSThomas Huth 2888fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 28892dea57dbSMark Cave-Ayland result.VsrW(i) = b->VsrW(i) ^ 28902dea57dbSMark Cave-Ayland (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^ 28912dea57dbSMark Cave-Ayland AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^ 28922dea57dbSMark Cave-Ayland AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^ 28932dea57dbSMark Cave-Ayland AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]); 2894fcf5ef2aSThomas Huth } 2895fcf5ef2aSThomas Huth *r = result; 2896fcf5ef2aSThomas Huth } 2897fcf5ef2aSThomas Huth 2898fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2899fcf5ef2aSThomas Huth { 2900fcf5ef2aSThomas Huth ppc_avr_t result; 2901fcf5ef2aSThomas Huth int i; 2902fcf5ef2aSThomas Huth 2903fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 29042dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]); 2905fcf5ef2aSThomas Huth } 2906fcf5ef2aSThomas Huth *r = result; 2907fcf5ef2aSThomas Huth } 2908fcf5ef2aSThomas Huth 2909fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2910fcf5ef2aSThomas Huth { 2911fcf5ef2aSThomas Huth /* This differs from what is written in ISA V2.07. The RTL is */ 2912fcf5ef2aSThomas Huth /* incorrect and will be fixed in V2.07B. */ 2913fcf5ef2aSThomas Huth int i; 2914fcf5ef2aSThomas Huth ppc_avr_t tmp; 2915fcf5ef2aSThomas Huth 2916fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 29172dea57dbSMark Cave-Ayland tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])]; 2918fcf5ef2aSThomas Huth } 2919fcf5ef2aSThomas Huth 2920fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 29212dea57dbSMark Cave-Ayland r->VsrW(i) = 29222dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 0)][0] ^ 29232dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 1)][1] ^ 29242dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 2)][2] ^ 29252dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 3)][3]; 2926fcf5ef2aSThomas Huth } 2927fcf5ef2aSThomas Huth } 2928fcf5ef2aSThomas Huth 2929fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2930fcf5ef2aSThomas Huth { 2931fcf5ef2aSThomas Huth ppc_avr_t result; 2932fcf5ef2aSThomas Huth int i; 2933fcf5ef2aSThomas Huth 2934fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 29352dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]); 2936fcf5ef2aSThomas Huth } 2937fcf5ef2aSThomas Huth *r = result; 2938fcf5ef2aSThomas Huth } 2939fcf5ef2aSThomas Huth 2940fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 2941fcf5ef2aSThomas Huth { 2942fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 2943fcf5ef2aSThomas Huth int six = st_six & 0xF; 2944fcf5ef2aSThomas Huth int i; 2945fcf5ef2aSThomas Huth 2946730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 2947fcf5ef2aSThomas Huth if (st == 0) { 2948fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 29490ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 7) ^ 29500ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 18) ^ 2951730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 3); 2952fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 29530ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 17) ^ 29540ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 19) ^ 2955730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 10); 2956fcf5ef2aSThomas Huth } 2957fcf5ef2aSThomas Huth } else { /* st == 1 */ 2958fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 29590ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 2) ^ 29600ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 13) ^ 29610ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 22); 2962fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 29630ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 6) ^ 29640ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 11) ^ 29650ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 25); 2966fcf5ef2aSThomas Huth } 2967fcf5ef2aSThomas Huth } 2968fcf5ef2aSThomas Huth } 2969fcf5ef2aSThomas Huth } 2970fcf5ef2aSThomas Huth 2971fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 2972fcf5ef2aSThomas Huth { 2973fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 2974fcf5ef2aSThomas Huth int six = st_six & 0xF; 2975fcf5ef2aSThomas Huth int i; 2976fcf5ef2aSThomas Huth 2977730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 2978fcf5ef2aSThomas Huth if (st == 0) { 2979fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 29800ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 1) ^ 29810ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 8) ^ 2982730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 7); 2983fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 29840ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 19) ^ 29850ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 61) ^ 2986730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 6); 2987fcf5ef2aSThomas Huth } 2988fcf5ef2aSThomas Huth } else { /* st == 1 */ 2989fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 29900ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 28) ^ 29910ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 34) ^ 29920ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 39); 2993fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 29940ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 14) ^ 29950ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 18) ^ 29960ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 41); 2997fcf5ef2aSThomas Huth } 2998fcf5ef2aSThomas Huth } 2999fcf5ef2aSThomas Huth } 3000fcf5ef2aSThomas Huth } 3001fcf5ef2aSThomas Huth 3002fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 3003fcf5ef2aSThomas Huth { 3004fcf5ef2aSThomas Huth ppc_avr_t result; 3005fcf5ef2aSThomas Huth int i; 3006fcf5ef2aSThomas Huth 300760594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 300860594feaSMark Cave-Ayland int indexA = c->VsrB(i) >> 4; 300960594feaSMark Cave-Ayland int indexB = c->VsrB(i) & 0xF; 301060594feaSMark Cave-Ayland 301160594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB); 3012fcf5ef2aSThomas Huth } 3013fcf5ef2aSThomas Huth *r = result; 3014fcf5ef2aSThomas Huth } 3015fcf5ef2aSThomas Huth 3016fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I 3017fcf5ef2aSThomas Huth 3018fcf5ef2aSThomas Huth /*****************************************************************************/ 3019fcf5ef2aSThomas Huth /* SPE extension helpers */ 3020fcf5ef2aSThomas Huth /* Use a table to make this quicker */ 3021fcf5ef2aSThomas Huth static const uint8_t hbrev[16] = { 3022fcf5ef2aSThomas Huth 0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE, 3023fcf5ef2aSThomas Huth 0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF, 3024fcf5ef2aSThomas Huth }; 3025fcf5ef2aSThomas Huth 3026fcf5ef2aSThomas Huth static inline uint8_t byte_reverse(uint8_t val) 3027fcf5ef2aSThomas Huth { 3028fcf5ef2aSThomas Huth return hbrev[val >> 4] | (hbrev[val & 0xF] << 4); 3029fcf5ef2aSThomas Huth } 3030fcf5ef2aSThomas Huth 3031fcf5ef2aSThomas Huth static inline uint32_t word_reverse(uint32_t val) 3032fcf5ef2aSThomas Huth { 3033fcf5ef2aSThomas Huth return byte_reverse(val >> 24) | (byte_reverse(val >> 16) << 8) | 3034fcf5ef2aSThomas Huth (byte_reverse(val >> 8) << 16) | (byte_reverse(val) << 24); 3035fcf5ef2aSThomas Huth } 3036fcf5ef2aSThomas Huth 3037fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */ 3038fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2) 3039fcf5ef2aSThomas Huth { 3040fcf5ef2aSThomas Huth uint32_t a, b, d, mask; 3041fcf5ef2aSThomas Huth 3042fcf5ef2aSThomas Huth mask = UINT32_MAX >> (32 - MASKBITS); 3043fcf5ef2aSThomas Huth a = arg1 & mask; 3044fcf5ef2aSThomas Huth b = arg2 & mask; 3045fcf5ef2aSThomas Huth d = word_reverse(1 + word_reverse(a | ~b)); 3046fcf5ef2aSThomas Huth return (arg1 & ~mask) | (d & b); 3047fcf5ef2aSThomas Huth } 3048fcf5ef2aSThomas Huth 3049fcf5ef2aSThomas Huth uint32_t helper_cntlsw32(uint32_t val) 3050fcf5ef2aSThomas Huth { 3051fcf5ef2aSThomas Huth if (val & 0x80000000) { 3052fcf5ef2aSThomas Huth return clz32(~val); 3053fcf5ef2aSThomas Huth } else { 3054fcf5ef2aSThomas Huth return clz32(val); 3055fcf5ef2aSThomas Huth } 3056fcf5ef2aSThomas Huth } 3057fcf5ef2aSThomas Huth 3058fcf5ef2aSThomas Huth uint32_t helper_cntlzw32(uint32_t val) 3059fcf5ef2aSThomas Huth { 3060fcf5ef2aSThomas Huth return clz32(val); 3061fcf5ef2aSThomas Huth } 3062fcf5ef2aSThomas Huth 3063fcf5ef2aSThomas Huth /* 440 specific */ 3064fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high, 3065fcf5ef2aSThomas Huth target_ulong low, uint32_t update_Rc) 3066fcf5ef2aSThomas Huth { 3067fcf5ef2aSThomas Huth target_ulong mask; 3068fcf5ef2aSThomas Huth int i; 3069fcf5ef2aSThomas Huth 3070fcf5ef2aSThomas Huth i = 1; 3071fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3072fcf5ef2aSThomas Huth if ((high & mask) == 0) { 3073fcf5ef2aSThomas Huth if (update_Rc) { 3074fcf5ef2aSThomas Huth env->crf[0] = 0x4; 3075fcf5ef2aSThomas Huth } 3076fcf5ef2aSThomas Huth goto done; 3077fcf5ef2aSThomas Huth } 3078fcf5ef2aSThomas Huth i++; 3079fcf5ef2aSThomas Huth } 3080fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3081fcf5ef2aSThomas Huth if ((low & mask) == 0) { 3082fcf5ef2aSThomas Huth if (update_Rc) { 3083fcf5ef2aSThomas Huth env->crf[0] = 0x8; 3084fcf5ef2aSThomas Huth } 3085fcf5ef2aSThomas Huth goto done; 3086fcf5ef2aSThomas Huth } 3087fcf5ef2aSThomas Huth i++; 3088fcf5ef2aSThomas Huth } 3089fcf5ef2aSThomas Huth i = 8; 3090fcf5ef2aSThomas Huth if (update_Rc) { 3091fcf5ef2aSThomas Huth env->crf[0] = 0x2; 3092fcf5ef2aSThomas Huth } 3093fcf5ef2aSThomas Huth done: 3094fcf5ef2aSThomas Huth env->xer = (env->xer & ~0x7F) | i; 3095fcf5ef2aSThomas Huth if (update_Rc) { 3096fcf5ef2aSThomas Huth env->crf[0] |= xer_so; 3097fcf5ef2aSThomas Huth } 3098fcf5ef2aSThomas Huth return i; 3099fcf5ef2aSThomas Huth } 3100