1fcf5ef2aSThomas Huth /* 2fcf5ef2aSThomas Huth * PowerPC integer and vector emulation helpers for QEMU. 3fcf5ef2aSThomas Huth * 4fcf5ef2aSThomas Huth * Copyright (c) 2003-2007 Jocelyn Mayer 5fcf5ef2aSThomas Huth * 6fcf5ef2aSThomas Huth * This library is free software; you can redistribute it and/or 7fcf5ef2aSThomas Huth * modify it under the terms of the GNU Lesser General Public 8fcf5ef2aSThomas Huth * License as published by the Free Software Foundation; either 96bd039cdSChetan Pant * version 2.1 of the License, or (at your option) any later version. 10fcf5ef2aSThomas Huth * 11fcf5ef2aSThomas Huth * This library is distributed in the hope that it will be useful, 12fcf5ef2aSThomas Huth * but WITHOUT ANY WARRANTY; without even the implied warranty of 13fcf5ef2aSThomas Huth * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14fcf5ef2aSThomas Huth * Lesser General Public License for more details. 15fcf5ef2aSThomas Huth * 16fcf5ef2aSThomas Huth * You should have received a copy of the GNU Lesser General Public 17fcf5ef2aSThomas Huth * License along with this library; if not, see <http://www.gnu.org/licenses/>. 18fcf5ef2aSThomas Huth */ 19db725815SMarkus Armbruster 20fcf5ef2aSThomas Huth #include "qemu/osdep.h" 21fcf5ef2aSThomas Huth #include "cpu.h" 22fcf5ef2aSThomas Huth #include "internal.h" 23fcf5ef2aSThomas Huth #include "qemu/host-utils.h" 24db725815SMarkus Armbruster #include "qemu/main-loop.h" 258a05fd9aSRichard Henderson #include "qemu/log.h" 26fcf5ef2aSThomas Huth #include "exec/helper-proto.h" 27fcf5ef2aSThomas Huth #include "crypto/aes.h" 2824f91e81SAlex Bennée #include "fpu/softfloat.h" 293f74b632SRichard Henderson #include "qapi/error.h" 303f74b632SRichard Henderson #include "qemu/guest-random.h" 31fcf5ef2aSThomas Huth 32fcf5ef2aSThomas Huth #include "helper_regs.h" 33fcf5ef2aSThomas Huth /*****************************************************************************/ 34fcf5ef2aSThomas Huth /* Fixed point operations helpers */ 35fcf5ef2aSThomas Huth 36f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov) 37f32899deSNikunj A Dadhania { 38f32899deSNikunj A Dadhania if (unlikely(ov)) { 39f32899deSNikunj A Dadhania env->so = env->ov = 1; 40f32899deSNikunj A Dadhania } else { 41f32899deSNikunj A Dadhania env->ov = 0; 42f32899deSNikunj A Dadhania } 43f32899deSNikunj A Dadhania } 44f32899deSNikunj A Dadhania 45fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb, 46fcf5ef2aSThomas Huth uint32_t oe) 47fcf5ef2aSThomas Huth { 48fcf5ef2aSThomas Huth uint64_t rt = 0; 49fcf5ef2aSThomas Huth int overflow = 0; 50fcf5ef2aSThomas Huth 51fcf5ef2aSThomas Huth uint64_t dividend = (uint64_t)ra << 32; 52fcf5ef2aSThomas Huth uint64_t divisor = (uint32_t)rb; 53fcf5ef2aSThomas Huth 54fcf5ef2aSThomas Huth if (unlikely(divisor == 0)) { 55fcf5ef2aSThomas Huth overflow = 1; 56fcf5ef2aSThomas Huth } else { 57fcf5ef2aSThomas Huth rt = dividend / divisor; 58fcf5ef2aSThomas Huth overflow = rt > UINT32_MAX; 59fcf5ef2aSThomas Huth } 60fcf5ef2aSThomas Huth 61fcf5ef2aSThomas Huth if (unlikely(overflow)) { 62fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 63fcf5ef2aSThomas Huth } 64fcf5ef2aSThomas Huth 65fcf5ef2aSThomas Huth if (oe) { 66f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 67fcf5ef2aSThomas Huth } 68fcf5ef2aSThomas Huth 69fcf5ef2aSThomas Huth return (target_ulong)rt; 70fcf5ef2aSThomas Huth } 71fcf5ef2aSThomas Huth 72fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb, 73fcf5ef2aSThomas Huth uint32_t oe) 74fcf5ef2aSThomas Huth { 75fcf5ef2aSThomas Huth int64_t rt = 0; 76fcf5ef2aSThomas Huth int overflow = 0; 77fcf5ef2aSThomas Huth 78fcf5ef2aSThomas Huth int64_t dividend = (int64_t)ra << 32; 79fcf5ef2aSThomas Huth int64_t divisor = (int64_t)((int32_t)rb); 80fcf5ef2aSThomas Huth 81fcf5ef2aSThomas Huth if (unlikely((divisor == 0) || 82fcf5ef2aSThomas Huth ((divisor == -1ull) && (dividend == INT64_MIN)))) { 83fcf5ef2aSThomas Huth overflow = 1; 84fcf5ef2aSThomas Huth } else { 85fcf5ef2aSThomas Huth rt = dividend / divisor; 86fcf5ef2aSThomas Huth overflow = rt != (int32_t)rt; 87fcf5ef2aSThomas Huth } 88fcf5ef2aSThomas Huth 89fcf5ef2aSThomas Huth if (unlikely(overflow)) { 90fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 91fcf5ef2aSThomas Huth } 92fcf5ef2aSThomas Huth 93fcf5ef2aSThomas Huth if (oe) { 94f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 95fcf5ef2aSThomas Huth } 96fcf5ef2aSThomas Huth 97fcf5ef2aSThomas Huth return (target_ulong)rt; 98fcf5ef2aSThomas Huth } 99fcf5ef2aSThomas Huth 100fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 101fcf5ef2aSThomas Huth 102fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe) 103fcf5ef2aSThomas Huth { 104fcf5ef2aSThomas Huth uint64_t rt = 0; 105fcf5ef2aSThomas Huth int overflow = 0; 106fcf5ef2aSThomas Huth 107fcf5ef2aSThomas Huth overflow = divu128(&rt, &ra, rb); 108fcf5ef2aSThomas Huth 109fcf5ef2aSThomas Huth if (unlikely(overflow)) { 110fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 111fcf5ef2aSThomas Huth } 112fcf5ef2aSThomas Huth 113fcf5ef2aSThomas Huth if (oe) { 114f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 115fcf5ef2aSThomas Huth } 116fcf5ef2aSThomas Huth 117fcf5ef2aSThomas Huth return rt; 118fcf5ef2aSThomas Huth } 119fcf5ef2aSThomas Huth 120fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe) 121fcf5ef2aSThomas Huth { 122fcf5ef2aSThomas Huth int64_t rt = 0; 123fcf5ef2aSThomas Huth int64_t ra = (int64_t)rau; 124fcf5ef2aSThomas Huth int64_t rb = (int64_t)rbu; 125fcf5ef2aSThomas Huth int overflow = divs128(&rt, &ra, rb); 126fcf5ef2aSThomas Huth 127fcf5ef2aSThomas Huth if (unlikely(overflow)) { 128fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 129fcf5ef2aSThomas Huth } 130fcf5ef2aSThomas Huth 131fcf5ef2aSThomas Huth if (oe) { 132f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 133fcf5ef2aSThomas Huth } 134fcf5ef2aSThomas Huth 135fcf5ef2aSThomas Huth return rt; 136fcf5ef2aSThomas Huth } 137fcf5ef2aSThomas Huth 138fcf5ef2aSThomas Huth #endif 139fcf5ef2aSThomas Huth 140fcf5ef2aSThomas Huth 141fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 142fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */ 143fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff)) 144fcf5ef2aSThomas Huth 145b6cb41b2SDavid Gibson /* 146b6cb41b2SDavid Gibson * subtract 1 from each byte, and with inverse, check if MSB is set at each 147fcf5ef2aSThomas Huth * byte. 148fcf5ef2aSThomas Huth * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80 149fcf5ef2aSThomas Huth * (0xFF & 0xFF) & 0x80 = 0x80 (zero found) 150fcf5ef2aSThomas Huth */ 151fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80)) 152fcf5ef2aSThomas Huth 153fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */ 154fcf5ef2aSThomas Huth #define hasvalue(x, n) (haszero((x) ^ pattern(n))) 155fcf5ef2aSThomas Huth 156fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb) 157fcf5ef2aSThomas Huth { 158efa73196SNikunj A Dadhania return hasvalue(rb, ra) ? CRF_GT : 0; 159fcf5ef2aSThomas Huth } 160fcf5ef2aSThomas Huth 161fcf5ef2aSThomas Huth #undef pattern 162fcf5ef2aSThomas Huth #undef haszero 163fcf5ef2aSThomas Huth #undef hasvalue 164fcf5ef2aSThomas Huth 165b6cb41b2SDavid Gibson /* 1663f74b632SRichard Henderson * Return a random number. 167fcf5ef2aSThomas Huth */ 1683f74b632SRichard Henderson uint64_t helper_darn32(void) 169fcf5ef2aSThomas Huth { 1703f74b632SRichard Henderson Error *err = NULL; 1713f74b632SRichard Henderson uint32_t ret; 1723f74b632SRichard Henderson 1733f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1743f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1753f74b632SRichard Henderson error_get_pretty(err)); 1763f74b632SRichard Henderson error_free(err); 177fcf5ef2aSThomas Huth return -1; 178fcf5ef2aSThomas Huth } 179fcf5ef2aSThomas Huth 1803f74b632SRichard Henderson return ret; 1813f74b632SRichard Henderson } 1823f74b632SRichard Henderson 1833f74b632SRichard Henderson uint64_t helper_darn64(void) 184fcf5ef2aSThomas Huth { 1853f74b632SRichard Henderson Error *err = NULL; 1863f74b632SRichard Henderson uint64_t ret; 1873f74b632SRichard Henderson 1883f74b632SRichard Henderson if (qemu_guest_getrandom(&ret, sizeof(ret), &err) < 0) { 1893f74b632SRichard Henderson qemu_log_mask(LOG_UNIMP, "darn: Crypto failure: %s", 1903f74b632SRichard Henderson error_get_pretty(err)); 1913f74b632SRichard Henderson error_free(err); 192fcf5ef2aSThomas Huth return -1; 193fcf5ef2aSThomas Huth } 194fcf5ef2aSThomas Huth 1953f74b632SRichard Henderson return ret; 1963f74b632SRichard Henderson } 197fcf5ef2aSThomas Huth 198fcf5ef2aSThomas Huth uint64_t helper_bpermd(uint64_t rs, uint64_t rb) 199fcf5ef2aSThomas Huth { 200fcf5ef2aSThomas Huth int i; 201fcf5ef2aSThomas Huth uint64_t ra = 0; 202fcf5ef2aSThomas Huth 203fcf5ef2aSThomas Huth for (i = 0; i < 8; i++) { 204fcf5ef2aSThomas Huth int index = (rs >> (i * 8)) & 0xFF; 205fcf5ef2aSThomas Huth if (index < 64) { 206a6a444a8SCédric Le Goater if (rb & PPC_BIT(index)) { 207fcf5ef2aSThomas Huth ra |= 1 << i; 208fcf5ef2aSThomas Huth } 209fcf5ef2aSThomas Huth } 210fcf5ef2aSThomas Huth } 211fcf5ef2aSThomas Huth return ra; 212fcf5ef2aSThomas Huth } 213fcf5ef2aSThomas Huth 214fcf5ef2aSThomas Huth #endif 215fcf5ef2aSThomas Huth 216fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb) 217fcf5ef2aSThomas Huth { 218fcf5ef2aSThomas Huth target_ulong mask = 0xff; 219fcf5ef2aSThomas Huth target_ulong ra = 0; 220fcf5ef2aSThomas Huth int i; 221fcf5ef2aSThomas Huth 222fcf5ef2aSThomas Huth for (i = 0; i < sizeof(target_ulong); i++) { 223fcf5ef2aSThomas Huth if ((rs & mask) == (rb & mask)) { 224fcf5ef2aSThomas Huth ra |= mask; 225fcf5ef2aSThomas Huth } 226fcf5ef2aSThomas Huth mask <<= 8; 227fcf5ef2aSThomas Huth } 228fcf5ef2aSThomas Huth return ra; 229fcf5ef2aSThomas Huth } 230fcf5ef2aSThomas Huth 231fcf5ef2aSThomas Huth /* shift right arithmetic helper */ 232fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value, 233fcf5ef2aSThomas Huth target_ulong shift) 234fcf5ef2aSThomas Huth { 235fcf5ef2aSThomas Huth int32_t ret; 236fcf5ef2aSThomas Huth 237fcf5ef2aSThomas Huth if (likely(!(shift & 0x20))) { 238fcf5ef2aSThomas Huth if (likely((uint32_t)shift != 0)) { 239fcf5ef2aSThomas Huth shift &= 0x1f; 240fcf5ef2aSThomas Huth ret = (int32_t)value >> shift; 241fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) { 242af1c259fSSandipan Das env->ca32 = env->ca = 0; 243fcf5ef2aSThomas Huth } else { 244af1c259fSSandipan Das env->ca32 = env->ca = 1; 245fcf5ef2aSThomas Huth } 246fcf5ef2aSThomas Huth } else { 247fcf5ef2aSThomas Huth ret = (int32_t)value; 248af1c259fSSandipan Das env->ca32 = env->ca = 0; 249fcf5ef2aSThomas Huth } 250fcf5ef2aSThomas Huth } else { 251fcf5ef2aSThomas Huth ret = (int32_t)value >> 31; 252af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 253fcf5ef2aSThomas Huth } 254fcf5ef2aSThomas Huth return (target_long)ret; 255fcf5ef2aSThomas Huth } 256fcf5ef2aSThomas Huth 257fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 258fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value, 259fcf5ef2aSThomas Huth target_ulong shift) 260fcf5ef2aSThomas Huth { 261fcf5ef2aSThomas Huth int64_t ret; 262fcf5ef2aSThomas Huth 263fcf5ef2aSThomas Huth if (likely(!(shift & 0x40))) { 264fcf5ef2aSThomas Huth if (likely((uint64_t)shift != 0)) { 265fcf5ef2aSThomas Huth shift &= 0x3f; 266fcf5ef2aSThomas Huth ret = (int64_t)value >> shift; 267fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) { 268af1c259fSSandipan Das env->ca32 = env->ca = 0; 269fcf5ef2aSThomas Huth } else { 270af1c259fSSandipan Das env->ca32 = env->ca = 1; 271fcf5ef2aSThomas Huth } 272fcf5ef2aSThomas Huth } else { 273fcf5ef2aSThomas Huth ret = (int64_t)value; 274af1c259fSSandipan Das env->ca32 = env->ca = 0; 275fcf5ef2aSThomas Huth } 276fcf5ef2aSThomas Huth } else { 277fcf5ef2aSThomas Huth ret = (int64_t)value >> 63; 278af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 279fcf5ef2aSThomas Huth } 280fcf5ef2aSThomas Huth return ret; 281fcf5ef2aSThomas Huth } 282fcf5ef2aSThomas Huth #endif 283fcf5ef2aSThomas Huth 284fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 285fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 286fcf5ef2aSThomas Huth { 28779770002SRichard Henderson /* Note that we don't fold past bytes */ 288fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 289fcf5ef2aSThomas Huth 0x5555555555555555ULL); 290fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 291fcf5ef2aSThomas Huth 0x3333333333333333ULL); 292fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 293fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 294fcf5ef2aSThomas Huth return val; 295fcf5ef2aSThomas Huth } 296fcf5ef2aSThomas Huth 297fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val) 298fcf5ef2aSThomas Huth { 29979770002SRichard Henderson /* Note that we don't fold past words. */ 300fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 301fcf5ef2aSThomas Huth 0x5555555555555555ULL); 302fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 303fcf5ef2aSThomas Huth 0x3333333333333333ULL); 304fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 305fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 306fcf5ef2aSThomas Huth val = (val & 0x00ff00ff00ff00ffULL) + ((val >> 8) & 307fcf5ef2aSThomas Huth 0x00ff00ff00ff00ffULL); 308fcf5ef2aSThomas Huth val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) & 309fcf5ef2aSThomas Huth 0x0000ffff0000ffffULL); 310fcf5ef2aSThomas Huth return val; 311fcf5ef2aSThomas Huth } 312fcf5ef2aSThomas Huth #else 313fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 314fcf5ef2aSThomas Huth { 31579770002SRichard Henderson /* Note that we don't fold past bytes */ 316fcf5ef2aSThomas Huth val = (val & 0x55555555) + ((val >> 1) & 0x55555555); 317fcf5ef2aSThomas Huth val = (val & 0x33333333) + ((val >> 2) & 0x33333333); 318fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f) + ((val >> 4) & 0x0f0f0f0f); 319fcf5ef2aSThomas Huth return val; 320fcf5ef2aSThomas Huth } 321fcf5ef2aSThomas Huth #endif 322fcf5ef2aSThomas Huth 323fcf5ef2aSThomas Huth /*****************************************************************************/ 324fcf5ef2aSThomas Huth /* PowerPC 601 specific instructions (POWER bridge) */ 325fcf5ef2aSThomas Huth target_ulong helper_div(CPUPPCState *env, target_ulong arg1, target_ulong arg2) 326fcf5ef2aSThomas Huth { 327fcf5ef2aSThomas Huth uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ]; 328fcf5ef2aSThomas Huth 329fcf5ef2aSThomas Huth if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 330fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 331fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 332fcf5ef2aSThomas Huth return INT32_MIN; 333fcf5ef2aSThomas Huth } else { 334fcf5ef2aSThomas Huth env->spr[SPR_MQ] = tmp % arg2; 335fcf5ef2aSThomas Huth return tmp / (int32_t)arg2; 336fcf5ef2aSThomas Huth } 337fcf5ef2aSThomas Huth } 338fcf5ef2aSThomas Huth 339fcf5ef2aSThomas Huth target_ulong helper_divo(CPUPPCState *env, target_ulong arg1, 340fcf5ef2aSThomas Huth target_ulong arg2) 341fcf5ef2aSThomas Huth { 342fcf5ef2aSThomas Huth uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ]; 343fcf5ef2aSThomas Huth 344fcf5ef2aSThomas Huth if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 345fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 346fcf5ef2aSThomas Huth env->so = env->ov = 1; 347fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 348fcf5ef2aSThomas Huth return INT32_MIN; 349fcf5ef2aSThomas Huth } else { 350fcf5ef2aSThomas Huth env->spr[SPR_MQ] = tmp % arg2; 351fcf5ef2aSThomas Huth tmp /= (int32_t)arg2; 352fcf5ef2aSThomas Huth if ((int32_t)tmp != tmp) { 353fcf5ef2aSThomas Huth env->so = env->ov = 1; 354fcf5ef2aSThomas Huth } else { 355fcf5ef2aSThomas Huth env->ov = 0; 356fcf5ef2aSThomas Huth } 357fcf5ef2aSThomas Huth return tmp; 358fcf5ef2aSThomas Huth } 359fcf5ef2aSThomas Huth } 360fcf5ef2aSThomas Huth 361fcf5ef2aSThomas Huth target_ulong helper_divs(CPUPPCState *env, target_ulong arg1, 362fcf5ef2aSThomas Huth target_ulong arg2) 363fcf5ef2aSThomas Huth { 364fcf5ef2aSThomas Huth if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 365fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 366fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 367fcf5ef2aSThomas Huth return INT32_MIN; 368fcf5ef2aSThomas Huth } else { 369fcf5ef2aSThomas Huth env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2; 370fcf5ef2aSThomas Huth return (int32_t)arg1 / (int32_t)arg2; 371fcf5ef2aSThomas Huth } 372fcf5ef2aSThomas Huth } 373fcf5ef2aSThomas Huth 374fcf5ef2aSThomas Huth target_ulong helper_divso(CPUPPCState *env, target_ulong arg1, 375fcf5ef2aSThomas Huth target_ulong arg2) 376fcf5ef2aSThomas Huth { 377fcf5ef2aSThomas Huth if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 378fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 379fcf5ef2aSThomas Huth env->so = env->ov = 1; 380fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 381fcf5ef2aSThomas Huth return INT32_MIN; 382fcf5ef2aSThomas Huth } else { 383fcf5ef2aSThomas Huth env->ov = 0; 384fcf5ef2aSThomas Huth env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2; 385fcf5ef2aSThomas Huth return (int32_t)arg1 / (int32_t)arg2; 386fcf5ef2aSThomas Huth } 387fcf5ef2aSThomas Huth } 388fcf5ef2aSThomas Huth 389fcf5ef2aSThomas Huth /*****************************************************************************/ 390fcf5ef2aSThomas Huth /* 602 specific instructions */ 391fcf5ef2aSThomas Huth /* mfrom is the most crazy instruction ever seen, imho ! */ 392fcf5ef2aSThomas Huth /* Real implementation uses a ROM table. Do the same */ 393b6cb41b2SDavid Gibson /* 394b6cb41b2SDavid Gibson * Extremely decomposed: 395fcf5ef2aSThomas Huth * -arg / 256 396fcf5ef2aSThomas Huth * return 256 * log10(10 + 1.0) + 0.5 397fcf5ef2aSThomas Huth */ 398fcf5ef2aSThomas Huth #if !defined(CONFIG_USER_ONLY) 399fcf5ef2aSThomas Huth target_ulong helper_602_mfrom(target_ulong arg) 400fcf5ef2aSThomas Huth { 401fcf5ef2aSThomas Huth if (likely(arg < 602)) { 402139c1837SPaolo Bonzini #include "mfrom_table.c.inc" 403fcf5ef2aSThomas Huth return mfrom_ROM_table[arg]; 404fcf5ef2aSThomas Huth } else { 405fcf5ef2aSThomas Huth return 0; 406fcf5ef2aSThomas Huth } 407fcf5ef2aSThomas Huth } 408fcf5ef2aSThomas Huth #endif 409fcf5ef2aSThomas Huth 410fcf5ef2aSThomas Huth /*****************************************************************************/ 411fcf5ef2aSThomas Huth /* Altivec extension helpers */ 412fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 413fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 414fcf5ef2aSThomas Huth for (index = 0; index < ARRAY_SIZE(r->element); index++) 415fcf5ef2aSThomas Huth #else 416fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 417fcf5ef2aSThomas Huth for (index = ARRAY_SIZE(r->element) - 1; index >= 0; index--) 418fcf5ef2aSThomas Huth #endif 419fcf5ef2aSThomas Huth 420fcf5ef2aSThomas Huth /* Saturating arithmetic helpers. */ 421fcf5ef2aSThomas Huth #define SATCVT(from, to, from_type, to_type, min, max) \ 422fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 423fcf5ef2aSThomas Huth { \ 424fcf5ef2aSThomas Huth to_type r; \ 425fcf5ef2aSThomas Huth \ 426fcf5ef2aSThomas Huth if (x < (from_type)min) { \ 427fcf5ef2aSThomas Huth r = min; \ 428fcf5ef2aSThomas Huth *sat = 1; \ 429fcf5ef2aSThomas Huth } else if (x > (from_type)max) { \ 430fcf5ef2aSThomas Huth r = max; \ 431fcf5ef2aSThomas Huth *sat = 1; \ 432fcf5ef2aSThomas Huth } else { \ 433fcf5ef2aSThomas Huth r = x; \ 434fcf5ef2aSThomas Huth } \ 435fcf5ef2aSThomas Huth return r; \ 436fcf5ef2aSThomas Huth } 437fcf5ef2aSThomas Huth #define SATCVTU(from, to, from_type, to_type, min, max) \ 438fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 439fcf5ef2aSThomas Huth { \ 440fcf5ef2aSThomas Huth to_type r; \ 441fcf5ef2aSThomas Huth \ 442fcf5ef2aSThomas Huth if (x > (from_type)max) { \ 443fcf5ef2aSThomas Huth r = max; \ 444fcf5ef2aSThomas Huth *sat = 1; \ 445fcf5ef2aSThomas Huth } else { \ 446fcf5ef2aSThomas Huth r = x; \ 447fcf5ef2aSThomas Huth } \ 448fcf5ef2aSThomas Huth return r; \ 449fcf5ef2aSThomas Huth } 450fcf5ef2aSThomas Huth SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX) 451fcf5ef2aSThomas Huth SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX) 452fcf5ef2aSThomas Huth SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX) 453fcf5ef2aSThomas Huth 454fcf5ef2aSThomas Huth SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX) 455fcf5ef2aSThomas Huth SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX) 456fcf5ef2aSThomas Huth SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX) 457fcf5ef2aSThomas Huth SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX) 458fcf5ef2aSThomas Huth SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX) 459fcf5ef2aSThomas Huth SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX) 460fcf5ef2aSThomas Huth #undef SATCVT 461fcf5ef2aSThomas Huth #undef SATCVTU 462fcf5ef2aSThomas Huth 463dedfaac7SRichard Henderson void helper_mtvscr(CPUPPCState *env, uint32_t vscr) 464fcf5ef2aSThomas Huth { 465*c19940dbSBruno Larsen (billionai) ppc_store_vscr(env, vscr); 466fcf5ef2aSThomas Huth } 467fcf5ef2aSThomas Huth 468cc2b90d7SRichard Henderson uint32_t helper_mfvscr(CPUPPCState *env) 469cc2b90d7SRichard Henderson { 470*c19940dbSBruno Larsen (billionai) return ppc_get_vscr(env); 471cc2b90d7SRichard Henderson } 472cc2b90d7SRichard Henderson 4736175f5a0SRichard Henderson static inline void set_vscr_sat(CPUPPCState *env) 4746175f5a0SRichard Henderson { 4759b5b74daSRichard Henderson /* The choice of non-zero value is arbitrary. */ 4769b5b74daSRichard Henderson env->vscr_sat.u32[0] = 1; 4776175f5a0SRichard Henderson } 4786175f5a0SRichard Henderson 479fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 480fcf5ef2aSThomas Huth { 481fcf5ef2aSThomas Huth int i; 482fcf5ef2aSThomas Huth 483fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 484fcf5ef2aSThomas Huth r->u32[i] = ~a->u32[i] < b->u32[i]; 485fcf5ef2aSThomas Huth } 486fcf5ef2aSThomas Huth } 487fcf5ef2aSThomas Huth 488fcf5ef2aSThomas Huth /* vprtybw */ 489fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b) 490fcf5ef2aSThomas Huth { 491fcf5ef2aSThomas Huth int i; 492fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 493fcf5ef2aSThomas Huth uint64_t res = b->u32[i] ^ (b->u32[i] >> 16); 494fcf5ef2aSThomas Huth res ^= res >> 8; 495fcf5ef2aSThomas Huth r->u32[i] = res & 1; 496fcf5ef2aSThomas Huth } 497fcf5ef2aSThomas Huth } 498fcf5ef2aSThomas Huth 499fcf5ef2aSThomas Huth /* vprtybd */ 500fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b) 501fcf5ef2aSThomas Huth { 502fcf5ef2aSThomas Huth int i; 503fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 504fcf5ef2aSThomas Huth uint64_t res = b->u64[i] ^ (b->u64[i] >> 32); 505fcf5ef2aSThomas Huth res ^= res >> 16; 506fcf5ef2aSThomas Huth res ^= res >> 8; 507fcf5ef2aSThomas Huth r->u64[i] = res & 1; 508fcf5ef2aSThomas Huth } 509fcf5ef2aSThomas Huth } 510fcf5ef2aSThomas Huth 511fcf5ef2aSThomas Huth /* vprtybq */ 512fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b) 513fcf5ef2aSThomas Huth { 514fcf5ef2aSThomas Huth uint64_t res = b->u64[0] ^ b->u64[1]; 515fcf5ef2aSThomas Huth res ^= res >> 32; 516fcf5ef2aSThomas Huth res ^= res >> 16; 517fcf5ef2aSThomas Huth res ^= res >> 8; 5183c385a93SMark Cave-Ayland r->VsrD(1) = res & 1; 5193c385a93SMark Cave-Ayland r->VsrD(0) = 0; 520fcf5ef2aSThomas Huth } 521fcf5ef2aSThomas Huth 522fcf5ef2aSThomas Huth #define VARITHFP(suffix, func) \ 523fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 524fcf5ef2aSThomas Huth ppc_avr_t *b) \ 525fcf5ef2aSThomas Huth { \ 526fcf5ef2aSThomas Huth int i; \ 527fcf5ef2aSThomas Huth \ 52805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 52905ee3e8aSMark Cave-Ayland r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status); \ 530fcf5ef2aSThomas Huth } \ 531fcf5ef2aSThomas Huth } 532fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add) 533fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub) 534fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min) 535fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max) 536fcf5ef2aSThomas Huth #undef VARITHFP 537fcf5ef2aSThomas Huth 538fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type) \ 539fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 540fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) \ 541fcf5ef2aSThomas Huth { \ 542fcf5ef2aSThomas Huth int i; \ 54305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 54405ee3e8aSMark Cave-Ayland r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \ 545fcf5ef2aSThomas Huth type, &env->vec_status); \ 546fcf5ef2aSThomas Huth } \ 547fcf5ef2aSThomas Huth } 548fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0); 549fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c); 550fcf5ef2aSThomas Huth #undef VARITHFPFMA 551fcf5ef2aSThomas Huth 552fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element) \ 553fcf5ef2aSThomas Huth { \ 554fcf5ef2aSThomas Huth type result = (type)a->element[i] op (type)b->element[i]; \ 555fcf5ef2aSThomas Huth r->element[i] = cvt(result, &sat); \ 556fcf5ef2aSThomas Huth } 557fcf5ef2aSThomas Huth 558fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element) \ 559fb11ae7dSRichard Henderson void helper_v##name(ppc_avr_t *r, ppc_avr_t *vscr_sat, \ 560fb11ae7dSRichard Henderson ppc_avr_t *a, ppc_avr_t *b, uint32_t desc) \ 561fcf5ef2aSThomas Huth { \ 562fcf5ef2aSThomas Huth int sat = 0; \ 563fcf5ef2aSThomas Huth int i; \ 564fcf5ef2aSThomas Huth \ 565fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 566fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 567fcf5ef2aSThomas Huth } \ 568fcf5ef2aSThomas Huth if (sat) { \ 569fb11ae7dSRichard Henderson vscr_sat->u32[0] = 1; \ 570fcf5ef2aSThomas Huth } \ 571fcf5ef2aSThomas Huth } 572fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt) \ 573fcf5ef2aSThomas Huth VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element) \ 574fcf5ef2aSThomas Huth VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element) 575fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt) \ 576fcf5ef2aSThomas Huth VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element) \ 577fcf5ef2aSThomas Huth VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element) 578fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb) 579fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh) 580fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw) 581fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub) 582fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh) 583fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw) 584fcf5ef2aSThomas Huth #undef VARITHSAT_CASE 585fcf5ef2aSThomas Huth #undef VARITHSAT_DO 586fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED 587fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED 588fcf5ef2aSThomas Huth 589fcf5ef2aSThomas Huth #define VAVG_DO(name, element, etype) \ 590fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 591fcf5ef2aSThomas Huth { \ 592fcf5ef2aSThomas Huth int i; \ 593fcf5ef2aSThomas Huth \ 594fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 595fcf5ef2aSThomas Huth etype x = (etype)a->element[i] + (etype)b->element[i] + 1; \ 596fcf5ef2aSThomas Huth r->element[i] = x >> 1; \ 597fcf5ef2aSThomas Huth } \ 598fcf5ef2aSThomas Huth } 599fcf5ef2aSThomas Huth 600fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element, \ 601fcf5ef2aSThomas Huth unsigned_type) \ 602fcf5ef2aSThomas Huth VAVG_DO(avgs##type, signed_element, signed_type) \ 603fcf5ef2aSThomas Huth VAVG_DO(avgu##type, unsigned_element, unsigned_type) 604fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t) 605fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t) 606fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t) 607fcf5ef2aSThomas Huth #undef VAVG_DO 608fcf5ef2aSThomas Huth #undef VAVG 609fcf5ef2aSThomas Huth 610fcf5ef2aSThomas Huth #define VABSDU_DO(name, element) \ 611fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 612fcf5ef2aSThomas Huth { \ 613fcf5ef2aSThomas Huth int i; \ 614fcf5ef2aSThomas Huth \ 615fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 616fcf5ef2aSThomas Huth r->element[i] = (a->element[i] > b->element[i]) ? \ 617fcf5ef2aSThomas Huth (a->element[i] - b->element[i]) : \ 618fcf5ef2aSThomas Huth (b->element[i] - a->element[i]); \ 619fcf5ef2aSThomas Huth } \ 620fcf5ef2aSThomas Huth } 621fcf5ef2aSThomas Huth 622b6cb41b2SDavid Gibson /* 623b6cb41b2SDavid Gibson * VABSDU - Vector absolute difference unsigned 624fcf5ef2aSThomas Huth * name - instruction mnemonic suffix (b: byte, h: halfword, w: word) 625fcf5ef2aSThomas Huth * element - element type to access from vector 626fcf5ef2aSThomas Huth */ 627fcf5ef2aSThomas Huth #define VABSDU(type, element) \ 628fcf5ef2aSThomas Huth VABSDU_DO(absdu##type, element) 629fcf5ef2aSThomas Huth VABSDU(b, u8) 630fcf5ef2aSThomas Huth VABSDU(h, u16) 631fcf5ef2aSThomas Huth VABSDU(w, u32) 632fcf5ef2aSThomas Huth #undef VABSDU_DO 633fcf5ef2aSThomas Huth #undef VABSDU 634fcf5ef2aSThomas Huth 635fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element) \ 636fcf5ef2aSThomas Huth void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r, \ 637fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 638fcf5ef2aSThomas Huth { \ 639fcf5ef2aSThomas Huth int i; \ 640fcf5ef2aSThomas Huth \ 64105ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 642fcf5ef2aSThomas Huth float32 t = cvt(b->element[i], &env->vec_status); \ 64305ee3e8aSMark Cave-Ayland r->f32[i] = float32_scalbn(t, -uim, &env->vec_status); \ 644fcf5ef2aSThomas Huth } \ 645fcf5ef2aSThomas Huth } 646fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32) 647fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32) 648fcf5ef2aSThomas Huth #undef VCF 649fcf5ef2aSThomas Huth 650fcf5ef2aSThomas Huth #define VCMP_DO(suffix, compare, element, record) \ 651fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 652fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 653fcf5ef2aSThomas Huth { \ 654fcf5ef2aSThomas Huth uint64_t ones = (uint64_t)-1; \ 655fcf5ef2aSThomas Huth uint64_t all = ones; \ 656fcf5ef2aSThomas Huth uint64_t none = 0; \ 657fcf5ef2aSThomas Huth int i; \ 658fcf5ef2aSThomas Huth \ 659fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 660fcf5ef2aSThomas Huth uint64_t result = (a->element[i] compare b->element[i] ? \ 661fcf5ef2aSThomas Huth ones : 0x0); \ 662fcf5ef2aSThomas Huth switch (sizeof(a->element[0])) { \ 663fcf5ef2aSThomas Huth case 8: \ 664fcf5ef2aSThomas Huth r->u64[i] = result; \ 665fcf5ef2aSThomas Huth break; \ 666fcf5ef2aSThomas Huth case 4: \ 667fcf5ef2aSThomas Huth r->u32[i] = result; \ 668fcf5ef2aSThomas Huth break; \ 669fcf5ef2aSThomas Huth case 2: \ 670fcf5ef2aSThomas Huth r->u16[i] = result; \ 671fcf5ef2aSThomas Huth break; \ 672fcf5ef2aSThomas Huth case 1: \ 673fcf5ef2aSThomas Huth r->u8[i] = result; \ 674fcf5ef2aSThomas Huth break; \ 675fcf5ef2aSThomas Huth } \ 676fcf5ef2aSThomas Huth all &= result; \ 677fcf5ef2aSThomas Huth none |= result; \ 678fcf5ef2aSThomas Huth } \ 679fcf5ef2aSThomas Huth if (record) { \ 680fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 681fcf5ef2aSThomas Huth } \ 682fcf5ef2aSThomas Huth } 683fcf5ef2aSThomas Huth #define VCMP(suffix, compare, element) \ 684fcf5ef2aSThomas Huth VCMP_DO(suffix, compare, element, 0) \ 685fcf5ef2aSThomas Huth VCMP_DO(suffix##_dot, compare, element, 1) 686fcf5ef2aSThomas Huth VCMP(equb, ==, u8) 687fcf5ef2aSThomas Huth VCMP(equh, ==, u16) 688fcf5ef2aSThomas Huth VCMP(equw, ==, u32) 689fcf5ef2aSThomas Huth VCMP(equd, ==, u64) 690fcf5ef2aSThomas Huth VCMP(gtub, >, u8) 691fcf5ef2aSThomas Huth VCMP(gtuh, >, u16) 692fcf5ef2aSThomas Huth VCMP(gtuw, >, u32) 693fcf5ef2aSThomas Huth VCMP(gtud, >, u64) 694fcf5ef2aSThomas Huth VCMP(gtsb, >, s8) 695fcf5ef2aSThomas Huth VCMP(gtsh, >, s16) 696fcf5ef2aSThomas Huth VCMP(gtsw, >, s32) 697fcf5ef2aSThomas Huth VCMP(gtsd, >, s64) 698fcf5ef2aSThomas Huth #undef VCMP_DO 699fcf5ef2aSThomas Huth #undef VCMP 700fcf5ef2aSThomas Huth 701fcf5ef2aSThomas Huth #define VCMPNE_DO(suffix, element, etype, cmpzero, record) \ 702fcf5ef2aSThomas Huth void helper_vcmpne##suffix(CPUPPCState *env, ppc_avr_t *r, \ 703fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 704fcf5ef2aSThomas Huth { \ 705fcf5ef2aSThomas Huth etype ones = (etype)-1; \ 706fcf5ef2aSThomas Huth etype all = ones; \ 707fcf5ef2aSThomas Huth etype result, none = 0; \ 708fcf5ef2aSThomas Huth int i; \ 709fcf5ef2aSThomas Huth \ 710fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 711fcf5ef2aSThomas Huth if (cmpzero) { \ 712fcf5ef2aSThomas Huth result = ((a->element[i] == 0) \ 713fcf5ef2aSThomas Huth || (b->element[i] == 0) \ 714fcf5ef2aSThomas Huth || (a->element[i] != b->element[i]) ? \ 715fcf5ef2aSThomas Huth ones : 0x0); \ 716fcf5ef2aSThomas Huth } else { \ 717fcf5ef2aSThomas Huth result = (a->element[i] != b->element[i]) ? ones : 0x0; \ 718fcf5ef2aSThomas Huth } \ 719fcf5ef2aSThomas Huth r->element[i] = result; \ 720fcf5ef2aSThomas Huth all &= result; \ 721fcf5ef2aSThomas Huth none |= result; \ 722fcf5ef2aSThomas Huth } \ 723fcf5ef2aSThomas Huth if (record) { \ 724fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 725fcf5ef2aSThomas Huth } \ 726fcf5ef2aSThomas Huth } 727fcf5ef2aSThomas Huth 728b6cb41b2SDavid Gibson /* 729b6cb41b2SDavid Gibson * VCMPNEZ - Vector compare not equal to zero 730fcf5ef2aSThomas Huth * suffix - instruction mnemonic suffix (b: byte, h: halfword, w: word) 731fcf5ef2aSThomas Huth * element - element type to access from vector 732fcf5ef2aSThomas Huth */ 733fcf5ef2aSThomas Huth #define VCMPNE(suffix, element, etype, cmpzero) \ 734fcf5ef2aSThomas Huth VCMPNE_DO(suffix, element, etype, cmpzero, 0) \ 735fcf5ef2aSThomas Huth VCMPNE_DO(suffix##_dot, element, etype, cmpzero, 1) 736fcf5ef2aSThomas Huth VCMPNE(zb, u8, uint8_t, 1) 737fcf5ef2aSThomas Huth VCMPNE(zh, u16, uint16_t, 1) 738fcf5ef2aSThomas Huth VCMPNE(zw, u32, uint32_t, 1) 739fcf5ef2aSThomas Huth VCMPNE(b, u8, uint8_t, 0) 740fcf5ef2aSThomas Huth VCMPNE(h, u16, uint16_t, 0) 741fcf5ef2aSThomas Huth VCMPNE(w, u32, uint32_t, 0) 742fcf5ef2aSThomas Huth #undef VCMPNE_DO 743fcf5ef2aSThomas Huth #undef VCMPNE 744fcf5ef2aSThomas Huth 745fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record) \ 746fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 747fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 748fcf5ef2aSThomas Huth { \ 749fcf5ef2aSThomas Huth uint32_t ones = (uint32_t)-1; \ 750fcf5ef2aSThomas Huth uint32_t all = ones; \ 751fcf5ef2aSThomas Huth uint32_t none = 0; \ 752fcf5ef2aSThomas Huth int i; \ 753fcf5ef2aSThomas Huth \ 75405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 755fcf5ef2aSThomas Huth uint32_t result; \ 75671bfd65cSRichard Henderson FloatRelation rel = \ 75771bfd65cSRichard Henderson float32_compare_quiet(a->f32[i], b->f32[i], \ 758fcf5ef2aSThomas Huth &env->vec_status); \ 759fcf5ef2aSThomas Huth if (rel == float_relation_unordered) { \ 760fcf5ef2aSThomas Huth result = 0; \ 761fcf5ef2aSThomas Huth } else if (rel compare order) { \ 762fcf5ef2aSThomas Huth result = ones; \ 763fcf5ef2aSThomas Huth } else { \ 764fcf5ef2aSThomas Huth result = 0; \ 765fcf5ef2aSThomas Huth } \ 766fcf5ef2aSThomas Huth r->u32[i] = result; \ 767fcf5ef2aSThomas Huth all &= result; \ 768fcf5ef2aSThomas Huth none |= result; \ 769fcf5ef2aSThomas Huth } \ 770fcf5ef2aSThomas Huth if (record) { \ 771fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 772fcf5ef2aSThomas Huth } \ 773fcf5ef2aSThomas Huth } 774fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order) \ 775fcf5ef2aSThomas Huth VCMPFP_DO(suffix, compare, order, 0) \ 776fcf5ef2aSThomas Huth VCMPFP_DO(suffix##_dot, compare, order, 1) 777fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal) 778fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less) 779fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater) 780fcf5ef2aSThomas Huth #undef VCMPFP_DO 781fcf5ef2aSThomas Huth #undef VCMPFP 782fcf5ef2aSThomas Huth 783fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r, 784fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b, int record) 785fcf5ef2aSThomas Huth { 786fcf5ef2aSThomas Huth int i; 787fcf5ef2aSThomas Huth int all_in = 0; 788fcf5ef2aSThomas Huth 78905ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 79071bfd65cSRichard Henderson FloatRelation le_rel = float32_compare_quiet(a->f32[i], b->f32[i], 79105ee3e8aSMark Cave-Ayland &env->vec_status); 792fcf5ef2aSThomas Huth if (le_rel == float_relation_unordered) { 793fcf5ef2aSThomas Huth r->u32[i] = 0xc0000000; 794fcf5ef2aSThomas Huth all_in = 1; 795fcf5ef2aSThomas Huth } else { 79605ee3e8aSMark Cave-Ayland float32 bneg = float32_chs(b->f32[i]); 79771bfd65cSRichard Henderson FloatRelation ge_rel = float32_compare_quiet(a->f32[i], bneg, 79805ee3e8aSMark Cave-Ayland &env->vec_status); 799fcf5ef2aSThomas Huth int le = le_rel != float_relation_greater; 800fcf5ef2aSThomas Huth int ge = ge_rel != float_relation_less; 801fcf5ef2aSThomas Huth 802fcf5ef2aSThomas Huth r->u32[i] = ((!le) << 31) | ((!ge) << 30); 803fcf5ef2aSThomas Huth all_in |= (!le | !ge); 804fcf5ef2aSThomas Huth } 805fcf5ef2aSThomas Huth } 806fcf5ef2aSThomas Huth if (record) { 807fcf5ef2aSThomas Huth env->crf[6] = (all_in == 0) << 1; 808fcf5ef2aSThomas Huth } 809fcf5ef2aSThomas Huth } 810fcf5ef2aSThomas Huth 811fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 812fcf5ef2aSThomas Huth { 813fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 0); 814fcf5ef2aSThomas Huth } 815fcf5ef2aSThomas Huth 816fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 817fcf5ef2aSThomas Huth ppc_avr_t *b) 818fcf5ef2aSThomas Huth { 819fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 1); 820fcf5ef2aSThomas Huth } 821fcf5ef2aSThomas Huth 822fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element) \ 823fcf5ef2aSThomas Huth void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r, \ 824fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 825fcf5ef2aSThomas Huth { \ 826fcf5ef2aSThomas Huth int i; \ 827fcf5ef2aSThomas Huth int sat = 0; \ 828fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 829fcf5ef2aSThomas Huth \ 830fcf5ef2aSThomas Huth set_float_rounding_mode(float_round_to_zero, &s); \ 83105ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 83205ee3e8aSMark Cave-Ayland if (float32_is_any_nan(b->f32[i])) { \ 833fcf5ef2aSThomas Huth r->element[i] = 0; \ 834fcf5ef2aSThomas Huth } else { \ 83505ee3e8aSMark Cave-Ayland float64 t = float32_to_float64(b->f32[i], &s); \ 836fcf5ef2aSThomas Huth int64_t j; \ 837fcf5ef2aSThomas Huth \ 838fcf5ef2aSThomas Huth t = float64_scalbn(t, uim, &s); \ 839fcf5ef2aSThomas Huth j = float64_to_int64(t, &s); \ 840fcf5ef2aSThomas Huth r->element[i] = satcvt(j, &sat); \ 841fcf5ef2aSThomas Huth } \ 842fcf5ef2aSThomas Huth } \ 843fcf5ef2aSThomas Huth if (sat) { \ 8446175f5a0SRichard Henderson set_vscr_sat(env); \ 845fcf5ef2aSThomas Huth } \ 846fcf5ef2aSThomas Huth } 847fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32) 848fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32) 849fcf5ef2aSThomas Huth #undef VCT 850fcf5ef2aSThomas Huth 851fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r) 852fcf5ef2aSThomas Huth { 853fcf5ef2aSThomas Huth target_ulong count = 0; 854fcf5ef2aSThomas Huth int i; 85560594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 85660594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 857fcf5ef2aSThomas Huth break; 858fcf5ef2aSThomas Huth } 859fcf5ef2aSThomas Huth count++; 860fcf5ef2aSThomas Huth } 861fcf5ef2aSThomas Huth return count; 862fcf5ef2aSThomas Huth } 863fcf5ef2aSThomas Huth 864fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r) 865fcf5ef2aSThomas Huth { 866fcf5ef2aSThomas Huth target_ulong count = 0; 867fcf5ef2aSThomas Huth int i; 868fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 86960594feaSMark Cave-Ayland if (r->VsrB(i) & 0x01) { 870fcf5ef2aSThomas Huth break; 871fcf5ef2aSThomas Huth } 872fcf5ef2aSThomas Huth count++; 873fcf5ef2aSThomas Huth } 874fcf5ef2aSThomas Huth return count; 875fcf5ef2aSThomas Huth } 876fcf5ef2aSThomas Huth 877fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 878fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 879fcf5ef2aSThomas Huth { 880fcf5ef2aSThomas Huth int sat = 0; 881fcf5ef2aSThomas Huth int i; 882fcf5ef2aSThomas Huth 883fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 884fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 885fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 886fcf5ef2aSThomas Huth 887fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 888fcf5ef2aSThomas Huth } 889fcf5ef2aSThomas Huth 890fcf5ef2aSThomas Huth if (sat) { 8916175f5a0SRichard Henderson set_vscr_sat(env); 892fcf5ef2aSThomas Huth } 893fcf5ef2aSThomas Huth } 894fcf5ef2aSThomas Huth 895fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 896fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 897fcf5ef2aSThomas Huth { 898fcf5ef2aSThomas Huth int sat = 0; 899fcf5ef2aSThomas Huth int i; 900fcf5ef2aSThomas Huth 901fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 902fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i] + 0x00004000; 903fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 904fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 905fcf5ef2aSThomas Huth } 906fcf5ef2aSThomas Huth 907fcf5ef2aSThomas Huth if (sat) { 9086175f5a0SRichard Henderson set_vscr_sat(env); 909fcf5ef2aSThomas Huth } 910fcf5ef2aSThomas Huth } 911fcf5ef2aSThomas Huth 912fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 913fcf5ef2aSThomas Huth { 914fcf5ef2aSThomas Huth int i; 915fcf5ef2aSThomas Huth 916fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 917fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 918fcf5ef2aSThomas Huth r->s16[i] = (int16_t) (prod + c->s16[i]); 919fcf5ef2aSThomas Huth } 920fcf5ef2aSThomas Huth } 921fcf5ef2aSThomas Huth 922d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs) \ 923fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 924fcf5ef2aSThomas Huth { \ 925fcf5ef2aSThomas Huth ppc_avr_t result; \ 926d81c2040SMark Cave-Ayland int i, half = ARRAY_SIZE(r->element) / 2; \ 927fcf5ef2aSThomas Huth \ 928d81c2040SMark Cave-Ayland for (i = 0; i < half; i++) { \ 929d81c2040SMark Cave-Ayland result.access(i * 2 + 0) = a->access(i + ofs); \ 930d81c2040SMark Cave-Ayland result.access(i * 2 + 1) = b->access(i + ofs); \ 931fcf5ef2aSThomas Huth } \ 932fcf5ef2aSThomas Huth *r = result; \ 933fcf5ef2aSThomas Huth } 934d81c2040SMark Cave-Ayland 935d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access) \ 936d81c2040SMark Cave-Ayland VMRG_DO(mrgl##suffix, element, access, half) \ 937d81c2040SMark Cave-Ayland VMRG_DO(mrgh##suffix, element, access, 0) 938d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB) 939d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH) 940d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW) 941fcf5ef2aSThomas Huth #undef VMRG_DO 942fcf5ef2aSThomas Huth #undef VMRG 943fcf5ef2aSThomas Huth 944fcf5ef2aSThomas Huth void helper_vmsummbm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 945fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 946fcf5ef2aSThomas Huth { 947fcf5ef2aSThomas Huth int32_t prod[16]; 948fcf5ef2aSThomas Huth int i; 949fcf5ef2aSThomas Huth 950fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s8); i++) { 951fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s8[i] * b->u8[i]; 952fcf5ef2aSThomas Huth } 953fcf5ef2aSThomas Huth 954fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 955fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] + 956fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 957fcf5ef2aSThomas Huth } 958fcf5ef2aSThomas Huth } 959fcf5ef2aSThomas Huth 960fcf5ef2aSThomas Huth void helper_vmsumshm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 961fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 962fcf5ef2aSThomas Huth { 963fcf5ef2aSThomas Huth int32_t prod[8]; 964fcf5ef2aSThomas Huth int i; 965fcf5ef2aSThomas Huth 966fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 967fcf5ef2aSThomas Huth prod[i] = a->s16[i] * b->s16[i]; 968fcf5ef2aSThomas Huth } 969fcf5ef2aSThomas Huth 970fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 971fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 972fcf5ef2aSThomas Huth } 973fcf5ef2aSThomas Huth } 974fcf5ef2aSThomas Huth 975fcf5ef2aSThomas Huth void helper_vmsumshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 976fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 977fcf5ef2aSThomas Huth { 978fcf5ef2aSThomas Huth int32_t prod[8]; 979fcf5ef2aSThomas Huth int i; 980fcf5ef2aSThomas Huth int sat = 0; 981fcf5ef2aSThomas Huth 982fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 983fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s16[i] * b->s16[i]; 984fcf5ef2aSThomas Huth } 985fcf5ef2aSThomas Huth 986fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 987fcf5ef2aSThomas Huth int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 988fcf5ef2aSThomas Huth 989fcf5ef2aSThomas Huth r->u32[i] = cvtsdsw(t, &sat); 990fcf5ef2aSThomas Huth } 991fcf5ef2aSThomas Huth 992fcf5ef2aSThomas Huth if (sat) { 9936175f5a0SRichard Henderson set_vscr_sat(env); 994fcf5ef2aSThomas Huth } 995fcf5ef2aSThomas Huth } 996fcf5ef2aSThomas Huth 997fcf5ef2aSThomas Huth void helper_vmsumubm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 998fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 999fcf5ef2aSThomas Huth { 1000fcf5ef2aSThomas Huth uint16_t prod[16]; 1001fcf5ef2aSThomas Huth int i; 1002fcf5ef2aSThomas Huth 1003fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1004fcf5ef2aSThomas Huth prod[i] = a->u8[i] * b->u8[i]; 1005fcf5ef2aSThomas Huth } 1006fcf5ef2aSThomas Huth 1007fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1008fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] + 1009fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1010fcf5ef2aSThomas Huth } 1011fcf5ef2aSThomas Huth } 1012fcf5ef2aSThomas Huth 1013fcf5ef2aSThomas Huth void helper_vmsumuhm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1014fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1015fcf5ef2aSThomas Huth { 1016fcf5ef2aSThomas Huth uint32_t prod[8]; 1017fcf5ef2aSThomas Huth int i; 1018fcf5ef2aSThomas Huth 1019fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1020fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1021fcf5ef2aSThomas Huth } 1022fcf5ef2aSThomas Huth 1023fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1024fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1025fcf5ef2aSThomas Huth } 1026fcf5ef2aSThomas Huth } 1027fcf5ef2aSThomas Huth 1028fcf5ef2aSThomas Huth void helper_vmsumuhs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1029fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1030fcf5ef2aSThomas Huth { 1031fcf5ef2aSThomas Huth uint32_t prod[8]; 1032fcf5ef2aSThomas Huth int i; 1033fcf5ef2aSThomas Huth int sat = 0; 1034fcf5ef2aSThomas Huth 1035fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1036fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1037fcf5ef2aSThomas Huth } 1038fcf5ef2aSThomas Huth 1039fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1040fcf5ef2aSThomas Huth uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1041fcf5ef2aSThomas Huth 1042fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1043fcf5ef2aSThomas Huth } 1044fcf5ef2aSThomas Huth 1045fcf5ef2aSThomas Huth if (sat) { 10466175f5a0SRichard Henderson set_vscr_sat(env); 1047fcf5ef2aSThomas Huth } 1048fcf5ef2aSThomas Huth } 1049fcf5ef2aSThomas Huth 10504fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast) \ 1051fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1052fcf5ef2aSThomas Huth { \ 1053fcf5ef2aSThomas Huth int i; \ 1054fcf5ef2aSThomas Huth \ 10554fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 10564fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i) * \ 10574fbc89edSMark Cave-Ayland (cast)b->mul_access(i); \ 1058fcf5ef2aSThomas Huth } \ 1059fcf5ef2aSThomas Huth } 10604fbc89edSMark Cave-Ayland 10614fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast) \ 10624fbc89edSMark Cave-Ayland void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 10634fbc89edSMark Cave-Ayland { \ 10644fbc89edSMark Cave-Ayland int i; \ 10654fbc89edSMark Cave-Ayland \ 10664fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 10674fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) * \ 10684fbc89edSMark Cave-Ayland (cast)b->mul_access(i + 1); \ 10694fbc89edSMark Cave-Ayland } \ 10704fbc89edSMark Cave-Ayland } 10714fbc89edSMark Cave-Ayland 10724fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast) \ 10734fbc89edSMark Cave-Ayland VMUL_DO_EVN(mule##suffix, mul_element, mul_access, prod_access, cast) \ 10744fbc89edSMark Cave-Ayland VMUL_DO_ODD(mulo##suffix, mul_element, mul_access, prod_access, cast) 10754fbc89edSMark Cave-Ayland VMUL(sb, s8, VsrSB, VsrSH, int16_t) 10764fbc89edSMark Cave-Ayland VMUL(sh, s16, VsrSH, VsrSW, int32_t) 10774fbc89edSMark Cave-Ayland VMUL(sw, s32, VsrSW, VsrSD, int64_t) 10784fbc89edSMark Cave-Ayland VMUL(ub, u8, VsrB, VsrH, uint16_t) 10794fbc89edSMark Cave-Ayland VMUL(uh, u16, VsrH, VsrW, uint32_t) 10804fbc89edSMark Cave-Ayland VMUL(uw, u32, VsrW, VsrD, uint64_t) 10814fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN 10824fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD 1083fcf5ef2aSThomas Huth #undef VMUL 1084fcf5ef2aSThomas Huth 1085f3e0d864SLijun Pan void helper_vmulhsw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1086f3e0d864SLijun Pan { 1087f3e0d864SLijun Pan int i; 1088f3e0d864SLijun Pan 1089f3e0d864SLijun Pan for (i = 0; i < 4; i++) { 1090f3e0d864SLijun Pan r->s32[i] = (int32_t)(((int64_t)a->s32[i] * (int64_t)b->s32[i]) >> 32); 1091f3e0d864SLijun Pan } 1092f3e0d864SLijun Pan } 1093f3e0d864SLijun Pan 1094f3e0d864SLijun Pan void helper_vmulhuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1095f3e0d864SLijun Pan { 1096f3e0d864SLijun Pan int i; 1097f3e0d864SLijun Pan 1098f3e0d864SLijun Pan for (i = 0; i < 4; i++) { 1099f3e0d864SLijun Pan r->u32[i] = (uint32_t)(((uint64_t)a->u32[i] * 1100f3e0d864SLijun Pan (uint64_t)b->u32[i]) >> 32); 1101f3e0d864SLijun Pan } 1102f3e0d864SLijun Pan } 1103f3e0d864SLijun Pan 1104c4b8b49dSLijun Pan void helper_vmulhsd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1105c4b8b49dSLijun Pan { 1106c4b8b49dSLijun Pan uint64_t discard; 1107c4b8b49dSLijun Pan 1108c4b8b49dSLijun Pan muls64(&discard, &r->u64[0], a->s64[0], b->s64[0]); 1109c4b8b49dSLijun Pan muls64(&discard, &r->u64[1], a->s64[1], b->s64[1]); 1110c4b8b49dSLijun Pan } 1111c4b8b49dSLijun Pan 1112c4b8b49dSLijun Pan void helper_vmulhud(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1113c4b8b49dSLijun Pan { 1114c4b8b49dSLijun Pan uint64_t discard; 1115c4b8b49dSLijun Pan 1116c4b8b49dSLijun Pan mulu64(&discard, &r->u64[0], a->u64[0], b->u64[0]); 1117c4b8b49dSLijun Pan mulu64(&discard, &r->u64[1], a->u64[1], b->u64[1]); 1118c4b8b49dSLijun Pan } 1119c4b8b49dSLijun Pan 1120fcf5ef2aSThomas Huth void helper_vperm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1121fcf5ef2aSThomas Huth ppc_avr_t *c) 1122fcf5ef2aSThomas Huth { 1123fcf5ef2aSThomas Huth ppc_avr_t result; 1124fcf5ef2aSThomas Huth int i; 1125fcf5ef2aSThomas Huth 112660594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 112760594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1128fcf5ef2aSThomas Huth int index = s & 0xf; 1129fcf5ef2aSThomas Huth 1130fcf5ef2aSThomas Huth if (s & 0x10) { 113160594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1132fcf5ef2aSThomas Huth } else { 113360594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1134fcf5ef2aSThomas Huth } 1135fcf5ef2aSThomas Huth } 1136fcf5ef2aSThomas Huth *r = result; 1137fcf5ef2aSThomas Huth } 1138fcf5ef2aSThomas Huth 1139fcf5ef2aSThomas Huth void helper_vpermr(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1140fcf5ef2aSThomas Huth ppc_avr_t *c) 1141fcf5ef2aSThomas Huth { 1142fcf5ef2aSThomas Huth ppc_avr_t result; 1143fcf5ef2aSThomas Huth int i; 1144fcf5ef2aSThomas Huth 114560594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 114660594feaSMark Cave-Ayland int s = c->VsrB(i) & 0x1f; 1147fcf5ef2aSThomas Huth int index = 15 - (s & 0xf); 1148fcf5ef2aSThomas Huth 1149fcf5ef2aSThomas Huth if (s & 0x10) { 115060594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1151fcf5ef2aSThomas Huth } else { 115260594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index); 1153fcf5ef2aSThomas Huth } 1154fcf5ef2aSThomas Huth } 1155fcf5ef2aSThomas Huth *r = result; 1156fcf5ef2aSThomas Huth } 1157fcf5ef2aSThomas Huth 1158fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1159fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)]) 1160fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (i) 1161fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) != 0) 1162fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) (extract64((avr)->u64[i], index, 1)) 1163fcf5ef2aSThomas Huth #else 1164fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[15 - (i)]) 1165fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (1 - i) 1166fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) == 0) 1167fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) \ 1168fcf5ef2aSThomas Huth (extract64((avr)->u64[1 - i], 63 - index, 1)) 1169fcf5ef2aSThomas Huth #endif 1170fcf5ef2aSThomas Huth 1171fcf5ef2aSThomas Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1172fcf5ef2aSThomas Huth { 1173fcf5ef2aSThomas Huth int i, j; 1174fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 1175fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1176fcf5ef2aSThomas Huth for (j = 0; j < 8; j++) { 1177fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, (i * 8) + j); 1178fcf5ef2aSThomas Huth if (index < 64 && EXTRACT_BIT(a, i, index)) { 1179fcf5ef2aSThomas Huth result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j); 1180fcf5ef2aSThomas Huth } 1181fcf5ef2aSThomas Huth } 1182fcf5ef2aSThomas Huth } 1183fcf5ef2aSThomas Huth *r = result; 1184fcf5ef2aSThomas Huth } 1185fcf5ef2aSThomas Huth 1186fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1187fcf5ef2aSThomas Huth { 1188fcf5ef2aSThomas Huth int i; 1189fcf5ef2aSThomas Huth uint64_t perm = 0; 1190fcf5ef2aSThomas Huth 1191fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1192fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, i); 1193fcf5ef2aSThomas Huth 1194fcf5ef2aSThomas Huth if (index < 128) { 1195fcf5ef2aSThomas Huth uint64_t mask = (1ull << (63 - (index & 0x3F))); 1196fcf5ef2aSThomas Huth if (a->u64[VBPERMQ_DW(index)] & mask) { 1197fcf5ef2aSThomas Huth perm |= (0x8000 >> i); 1198fcf5ef2aSThomas Huth } 1199fcf5ef2aSThomas Huth } 1200fcf5ef2aSThomas Huth } 1201fcf5ef2aSThomas Huth 12023c385a93SMark Cave-Ayland r->VsrD(0) = perm; 12033c385a93SMark Cave-Ayland r->VsrD(1) = 0; 1204fcf5ef2aSThomas Huth } 1205fcf5ef2aSThomas Huth 1206fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX 1207fcf5ef2aSThomas Huth #undef VBPERMQ_DW 1208fcf5ef2aSThomas Huth 1209fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp) \ 1210fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1211fcf5ef2aSThomas Huth { \ 1212fcf5ef2aSThomas Huth int i, j; \ 1213fcf5ef2aSThomas Huth trgtyp prod[sizeof(ppc_avr_t) / sizeof(a->srcfld[0])]; \ 1214fcf5ef2aSThomas Huth \ 1215fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, srcfld) { \ 1216fcf5ef2aSThomas Huth prod[i] = 0; \ 1217fcf5ef2aSThomas Huth for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) { \ 1218fcf5ef2aSThomas Huth if (a->srcfld[i] & (1ull << j)) { \ 1219fcf5ef2aSThomas Huth prod[i] ^= ((trgtyp)b->srcfld[i] << j); \ 1220fcf5ef2aSThomas Huth } \ 1221fcf5ef2aSThomas Huth } \ 1222fcf5ef2aSThomas Huth } \ 1223fcf5ef2aSThomas Huth \ 1224fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, trgfld) { \ 1225fcf5ef2aSThomas Huth r->trgfld[i] = prod[2 * i] ^ prod[2 * i + 1]; \ 1226fcf5ef2aSThomas Huth } \ 1227fcf5ef2aSThomas Huth } 1228fcf5ef2aSThomas Huth 1229fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t) 1230fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t) 1231fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t) 1232fcf5ef2aSThomas Huth 1233fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1234fcf5ef2aSThomas Huth { 1235fcf5ef2aSThomas Huth 1236fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1237fcf5ef2aSThomas Huth int i, j; 1238fcf5ef2aSThomas Huth __uint128_t prod[2]; 1239fcf5ef2aSThomas Huth 1240fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1241fcf5ef2aSThomas Huth prod[i] = 0; 1242fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1243fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1244fcf5ef2aSThomas Huth prod[i] ^= (((__uint128_t)b->u64[i]) << j); 1245fcf5ef2aSThomas Huth } 1246fcf5ef2aSThomas Huth } 1247fcf5ef2aSThomas Huth } 1248fcf5ef2aSThomas Huth 1249fcf5ef2aSThomas Huth r->u128 = prod[0] ^ prod[1]; 1250fcf5ef2aSThomas Huth 1251fcf5ef2aSThomas Huth #else 1252fcf5ef2aSThomas Huth int i, j; 1253fcf5ef2aSThomas Huth ppc_avr_t prod[2]; 1254fcf5ef2aSThomas Huth 1255fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 12563c385a93SMark Cave-Ayland prod[i].VsrD(1) = prod[i].VsrD(0) = 0; 1257fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1258fcf5ef2aSThomas Huth if (a->u64[i] & (1ull << j)) { 1259fcf5ef2aSThomas Huth ppc_avr_t bshift; 1260fcf5ef2aSThomas Huth if (j == 0) { 12613c385a93SMark Cave-Ayland bshift.VsrD(0) = 0; 12623c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i]; 1263fcf5ef2aSThomas Huth } else { 12643c385a93SMark Cave-Ayland bshift.VsrD(0) = b->u64[i] >> (64 - j); 12653c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i] << j; 1266fcf5ef2aSThomas Huth } 12673c385a93SMark Cave-Ayland prod[i].VsrD(1) ^= bshift.VsrD(1); 12683c385a93SMark Cave-Ayland prod[i].VsrD(0) ^= bshift.VsrD(0); 1269fcf5ef2aSThomas Huth } 1270fcf5ef2aSThomas Huth } 1271fcf5ef2aSThomas Huth } 1272fcf5ef2aSThomas Huth 12733c385a93SMark Cave-Ayland r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1); 12743c385a93SMark Cave-Ayland r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0); 1275fcf5ef2aSThomas Huth #endif 1276fcf5ef2aSThomas Huth } 1277fcf5ef2aSThomas Huth 1278fcf5ef2aSThomas Huth 1279fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1280fcf5ef2aSThomas Huth #define PKBIG 1 1281fcf5ef2aSThomas Huth #else 1282fcf5ef2aSThomas Huth #define PKBIG 0 1283fcf5ef2aSThomas Huth #endif 1284fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1285fcf5ef2aSThomas Huth { 1286fcf5ef2aSThomas Huth int i, j; 1287fcf5ef2aSThomas Huth ppc_avr_t result; 1288fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1289fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { a, b }; 1290fcf5ef2aSThomas Huth #else 1291fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { b, a }; 1292fcf5ef2aSThomas Huth #endif 1293fcf5ef2aSThomas Huth 1294fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1295fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(j, u32) { 1296fcf5ef2aSThomas Huth uint32_t e = x[i]->u32[j]; 1297fcf5ef2aSThomas Huth 1298fcf5ef2aSThomas Huth result.u16[4 * i + j] = (((e >> 9) & 0xfc00) | 1299fcf5ef2aSThomas Huth ((e >> 6) & 0x3e0) | 1300fcf5ef2aSThomas Huth ((e >> 3) & 0x1f)); 1301fcf5ef2aSThomas Huth } 1302fcf5ef2aSThomas Huth } 1303fcf5ef2aSThomas Huth *r = result; 1304fcf5ef2aSThomas Huth } 1305fcf5ef2aSThomas Huth 1306fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat) \ 1307fcf5ef2aSThomas Huth void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1308fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 1309fcf5ef2aSThomas Huth { \ 1310fcf5ef2aSThomas Huth int i; \ 1311fcf5ef2aSThomas Huth int sat = 0; \ 1312fcf5ef2aSThomas Huth ppc_avr_t result; \ 1313fcf5ef2aSThomas Huth ppc_avr_t *a0 = PKBIG ? a : b; \ 1314fcf5ef2aSThomas Huth ppc_avr_t *a1 = PKBIG ? b : a; \ 1315fcf5ef2aSThomas Huth \ 1316fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, from) { \ 1317fcf5ef2aSThomas Huth result.to[i] = cvt(a0->from[i], &sat); \ 1318fcf5ef2aSThomas Huth result.to[i + ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat);\ 1319fcf5ef2aSThomas Huth } \ 1320fcf5ef2aSThomas Huth *r = result; \ 1321fcf5ef2aSThomas Huth if (dosat && sat) { \ 13226175f5a0SRichard Henderson set_vscr_sat(env); \ 1323fcf5ef2aSThomas Huth } \ 1324fcf5ef2aSThomas Huth } 1325fcf5ef2aSThomas Huth #define I(x, y) (x) 1326fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1) 1327fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1) 1328fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1) 1329fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1) 1330fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1) 1331fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1) 1332fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1) 1333fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1) 1334fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1) 1335fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0) 1336fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0) 1337fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0) 1338fcf5ef2aSThomas Huth #undef I 1339fcf5ef2aSThomas Huth #undef VPK 1340fcf5ef2aSThomas Huth #undef PKBIG 1341fcf5ef2aSThomas Huth 1342fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1343fcf5ef2aSThomas Huth { 1344fcf5ef2aSThomas Huth int i; 1345fcf5ef2aSThomas Huth 134605ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 134705ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status); 1348fcf5ef2aSThomas Huth } 1349fcf5ef2aSThomas Huth } 1350fcf5ef2aSThomas Huth 1351fcf5ef2aSThomas Huth #define VRFI(suffix, rounding) \ 1352fcf5ef2aSThomas Huth void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1353fcf5ef2aSThomas Huth ppc_avr_t *b) \ 1354fcf5ef2aSThomas Huth { \ 1355fcf5ef2aSThomas Huth int i; \ 1356fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 1357fcf5ef2aSThomas Huth \ 1358fcf5ef2aSThomas Huth set_float_rounding_mode(rounding, &s); \ 135905ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 136005ee3e8aSMark Cave-Ayland r->f32[i] = float32_round_to_int (b->f32[i], &s); \ 1361fcf5ef2aSThomas Huth } \ 1362fcf5ef2aSThomas Huth } 1363fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even) 1364fcf5ef2aSThomas Huth VRFI(m, float_round_down) 1365fcf5ef2aSThomas Huth VRFI(p, float_round_up) 1366fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero) 1367fcf5ef2aSThomas Huth #undef VRFI 1368fcf5ef2aSThomas Huth 1369fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1370fcf5ef2aSThomas Huth { 1371fcf5ef2aSThomas Huth int i; 1372fcf5ef2aSThomas Huth 137305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 137405ee3e8aSMark Cave-Ayland float32 t = float32_sqrt(b->f32[i], &env->vec_status); 1375fcf5ef2aSThomas Huth 137605ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, t, &env->vec_status); 1377fcf5ef2aSThomas Huth } 1378fcf5ef2aSThomas Huth } 1379fcf5ef2aSThomas Huth 1380fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert) \ 1381fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1382fcf5ef2aSThomas Huth { \ 1383fcf5ef2aSThomas Huth int i; \ 1384fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1385fcf5ef2aSThomas Huth uint##size##_t src1 = a->element[i]; \ 1386fcf5ef2aSThomas Huth uint##size##_t src2 = b->element[i]; \ 1387fcf5ef2aSThomas Huth uint##size##_t src3 = r->element[i]; \ 1388fcf5ef2aSThomas Huth uint##size##_t begin, end, shift, mask, rot_val; \ 1389fcf5ef2aSThomas Huth \ 1390fcf5ef2aSThomas Huth shift = extract##size(src2, 0, 6); \ 1391fcf5ef2aSThomas Huth end = extract##size(src2, 8, 6); \ 1392fcf5ef2aSThomas Huth begin = extract##size(src2, 16, 6); \ 1393fcf5ef2aSThomas Huth rot_val = rol##size(src1, shift); \ 1394fcf5ef2aSThomas Huth mask = mask_u##size(begin, end); \ 1395fcf5ef2aSThomas Huth if (insert) { \ 1396fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask) | (src3 & ~mask); \ 1397fcf5ef2aSThomas Huth } else { \ 1398fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask); \ 1399fcf5ef2aSThomas Huth } \ 1400fcf5ef2aSThomas Huth } \ 1401fcf5ef2aSThomas Huth } 1402fcf5ef2aSThomas Huth 1403fcf5ef2aSThomas Huth VRLMI(vrldmi, 64, u64, 1); 1404fcf5ef2aSThomas Huth VRLMI(vrlwmi, 32, u32, 1); 1405fcf5ef2aSThomas Huth VRLMI(vrldnm, 64, u64, 0); 1406fcf5ef2aSThomas Huth VRLMI(vrlwnm, 32, u32, 0); 1407fcf5ef2aSThomas Huth 1408fcf5ef2aSThomas Huth void helper_vsel(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1409fcf5ef2aSThomas Huth ppc_avr_t *c) 1410fcf5ef2aSThomas Huth { 1411fcf5ef2aSThomas Huth r->u64[0] = (a->u64[0] & ~c->u64[0]) | (b->u64[0] & c->u64[0]); 1412fcf5ef2aSThomas Huth r->u64[1] = (a->u64[1] & ~c->u64[1]) | (b->u64[1] & c->u64[1]); 1413fcf5ef2aSThomas Huth } 1414fcf5ef2aSThomas Huth 1415fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1416fcf5ef2aSThomas Huth { 1417fcf5ef2aSThomas Huth int i; 1418fcf5ef2aSThomas Huth 141905ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 142005ee3e8aSMark Cave-Ayland r->f32[i] = float32_exp2(b->f32[i], &env->vec_status); 1421fcf5ef2aSThomas Huth } 1422fcf5ef2aSThomas Huth } 1423fcf5ef2aSThomas Huth 1424fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1425fcf5ef2aSThomas Huth { 1426fcf5ef2aSThomas Huth int i; 1427fcf5ef2aSThomas Huth 142805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 142905ee3e8aSMark Cave-Ayland r->f32[i] = float32_log2(b->f32[i], &env->vec_status); 1430fcf5ef2aSThomas Huth } 1431fcf5ef2aSThomas Huth } 1432fcf5ef2aSThomas Huth 143360caf221SAvinesh Kumar #if defined(HOST_WORDS_BIGENDIAN) 143460caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 143560caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 143660caf221SAvinesh Kumar { \ 143760caf221SAvinesh Kumar int index; \ 143860caf221SAvinesh Kumar if (left) { \ 143960caf221SAvinesh Kumar index = (a & 0xf) * 8; \ 144060caf221SAvinesh Kumar } else { \ 144160caf221SAvinesh Kumar index = ((15 - (a & 0xf) + 1) * 8) - size; \ 144260caf221SAvinesh Kumar } \ 144360caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 144460caf221SAvinesh Kumar MAKE_64BIT_MASK(0, size); \ 144560caf221SAvinesh Kumar } 144660caf221SAvinesh Kumar #else 144760caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 144860caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 144960caf221SAvinesh Kumar { \ 145060caf221SAvinesh Kumar int index; \ 145160caf221SAvinesh Kumar if (left) { \ 145260caf221SAvinesh Kumar index = ((15 - (a & 0xf) + 1) * 8) - size; \ 145360caf221SAvinesh Kumar } else { \ 145460caf221SAvinesh Kumar index = (a & 0xf) * 8; \ 145560caf221SAvinesh Kumar } \ 145660caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 145760caf221SAvinesh Kumar MAKE_64BIT_MASK(0, size); \ 145860caf221SAvinesh Kumar } 145960caf221SAvinesh Kumar #endif 146060caf221SAvinesh Kumar 146160caf221SAvinesh Kumar VEXTU_X_DO(vextublx, 8, 1) 146260caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1) 146360caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1) 146460caf221SAvinesh Kumar VEXTU_X_DO(vextubrx, 8, 0) 146560caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0) 146660caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0) 146760caf221SAvinesh Kumar #undef VEXTU_X_DO 146860caf221SAvinesh Kumar 1469fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1470fcf5ef2aSThomas Huth { 1471fcf5ef2aSThomas Huth int i; 1472fcf5ef2aSThomas Huth unsigned int shift, bytes, size; 1473fcf5ef2aSThomas Huth 1474fcf5ef2aSThomas Huth size = ARRAY_SIZE(r->u8); 1475fcf5ef2aSThomas Huth for (i = 0; i < size; i++) { 147663be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 147763be02fcSAnton Blanchard bytes = (a->VsrB(i) << 8) + /* extract adjacent bytes */ 147863be02fcSAnton Blanchard (((i + 1) < size) ? a->VsrB(i + 1) : 0); 147963be02fcSAnton Blanchard r->VsrB(i) = (bytes << shift) >> 8; /* shift and store result */ 1480fcf5ef2aSThomas Huth } 1481fcf5ef2aSThomas Huth } 1482fcf5ef2aSThomas Huth 1483fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1484fcf5ef2aSThomas Huth { 1485fcf5ef2aSThomas Huth int i; 1486fcf5ef2aSThomas Huth unsigned int shift, bytes; 1487fcf5ef2aSThomas Huth 1488b6cb41b2SDavid Gibson /* 1489b6cb41b2SDavid Gibson * Use reverse order, as destination and source register can be 1490b6cb41b2SDavid Gibson * same. Its being modified in place saving temporary, reverse 1491b6cb41b2SDavid Gibson * order will guarantee that computed result is not fed back. 1492fcf5ef2aSThomas Huth */ 1493fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 149463be02fcSAnton Blanchard shift = b->VsrB(i) & 0x7; /* extract shift value */ 149563be02fcSAnton Blanchard bytes = ((i ? a->VsrB(i - 1) : 0) << 8) + a->VsrB(i); 1496fcf5ef2aSThomas Huth /* extract adjacent bytes */ 149763be02fcSAnton Blanchard r->VsrB(i) = (bytes >> shift) & 0xFF; /* shift and store result */ 1498fcf5ef2aSThomas Huth } 1499fcf5ef2aSThomas Huth } 1500fcf5ef2aSThomas Huth 1501fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift) 1502fcf5ef2aSThomas Huth { 1503fcf5ef2aSThomas Huth int sh = shift & 0xf; 1504fcf5ef2aSThomas Huth int i; 1505fcf5ef2aSThomas Huth ppc_avr_t result; 1506fcf5ef2aSThomas Huth 1507fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1508fcf5ef2aSThomas Huth int index = sh + i; 1509fcf5ef2aSThomas Huth if (index > 0xf) { 151060594feaSMark Cave-Ayland result.VsrB(i) = b->VsrB(index - 0x10); 1511fcf5ef2aSThomas Huth } else { 151260594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(index); 1513fcf5ef2aSThomas Huth } 1514fcf5ef2aSThomas Huth } 1515fcf5ef2aSThomas Huth *r = result; 1516fcf5ef2aSThomas Huth } 1517fcf5ef2aSThomas Huth 1518fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1519fcf5ef2aSThomas Huth { 15203c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1521fcf5ef2aSThomas Huth 1522fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1523fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1524fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1525fcf5ef2aSThomas Huth #else 1526fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1527fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1528fcf5ef2aSThomas Huth #endif 1529fcf5ef2aSThomas Huth } 1530fcf5ef2aSThomas Huth 1531fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1532fcf5ef2aSThomas Huth #define VINSERT(suffix, element) \ 1533fcf5ef2aSThomas Huth void helper_vinsert##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1534fcf5ef2aSThomas Huth { \ 15354fff7218SLaurent Vivier memmove(&r->u8[index], &b->u8[8 - sizeof(r->element[0])], \ 1536fcf5ef2aSThomas Huth sizeof(r->element[0])); \ 1537fcf5ef2aSThomas Huth } 1538fcf5ef2aSThomas Huth #else 1539fcf5ef2aSThomas Huth #define VINSERT(suffix, element) \ 1540fcf5ef2aSThomas Huth void helper_vinsert##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1541fcf5ef2aSThomas Huth { \ 1542fcf5ef2aSThomas Huth uint32_t d = (16 - index) - sizeof(r->element[0]); \ 1543fcf5ef2aSThomas Huth memmove(&r->u8[d], &b->u8[8], sizeof(r->element[0])); \ 1544fcf5ef2aSThomas Huth } 1545fcf5ef2aSThomas Huth #endif 1546fcf5ef2aSThomas Huth VINSERT(b, u8) 1547fcf5ef2aSThomas Huth VINSERT(h, u16) 1548fcf5ef2aSThomas Huth VINSERT(w, u32) 1549fcf5ef2aSThomas Huth VINSERT(d, u64) 1550fcf5ef2aSThomas Huth #undef VINSERT 1551fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1552fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1553fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1554fcf5ef2aSThomas Huth { \ 1555fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1556fcf5ef2aSThomas Huth memmove(&r->u8[8 - es], &b->u8[index], es); \ 1557fcf5ef2aSThomas Huth memset(&r->u8[8], 0, 8); \ 1558fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8 - es); \ 1559fcf5ef2aSThomas Huth } 1560fcf5ef2aSThomas Huth #else 1561fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1562fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1563fcf5ef2aSThomas Huth { \ 1564fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1565fcf5ef2aSThomas Huth uint32_t s = (16 - index) - es; \ 1566fcf5ef2aSThomas Huth memmove(&r->u8[8], &b->u8[s], es); \ 1567fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8); \ 1568fcf5ef2aSThomas Huth memset(&r->u8[8 + es], 0, 8 - es); \ 1569fcf5ef2aSThomas Huth } 1570fcf5ef2aSThomas Huth #endif 1571fcf5ef2aSThomas Huth VEXTRACT(ub, u8) 1572fcf5ef2aSThomas Huth VEXTRACT(uh, u16) 1573fcf5ef2aSThomas Huth VEXTRACT(uw, u32) 1574fcf5ef2aSThomas Huth VEXTRACT(d, u64) 1575fcf5ef2aSThomas Huth #undef VEXTRACT 1576fcf5ef2aSThomas Huth 15775ba5335dSMark Cave-Ayland void helper_xxextractuw(CPUPPCState *env, ppc_vsr_t *xt, 15785ba5335dSMark Cave-Ayland ppc_vsr_t *xb, uint32_t index) 15798ad901e5SNikunj A Dadhania { 158003b32c09SMark Cave-Ayland ppc_vsr_t t = { }; 15818ad901e5SNikunj A Dadhania size_t es = sizeof(uint32_t); 15828ad901e5SNikunj A Dadhania uint32_t ext_index; 15838ad901e5SNikunj A Dadhania int i; 15848ad901e5SNikunj A Dadhania 15858ad901e5SNikunj A Dadhania ext_index = index; 15868ad901e5SNikunj A Dadhania for (i = 0; i < es; i++, ext_index++) { 158703b32c09SMark Cave-Ayland t.VsrB(8 - es + i) = xb->VsrB(ext_index % 16); 15888ad901e5SNikunj A Dadhania } 15898ad901e5SNikunj A Dadhania 159003b32c09SMark Cave-Ayland *xt = t; 15918ad901e5SNikunj A Dadhania } 15928ad901e5SNikunj A Dadhania 15935ba5335dSMark Cave-Ayland void helper_xxinsertw(CPUPPCState *env, ppc_vsr_t *xt, 15945ba5335dSMark Cave-Ayland ppc_vsr_t *xb, uint32_t index) 15953398b742SNikunj A Dadhania { 159603b32c09SMark Cave-Ayland ppc_vsr_t t = *xt; 15973398b742SNikunj A Dadhania size_t es = sizeof(uint32_t); 15983398b742SNikunj A Dadhania int ins_index, i = 0; 15993398b742SNikunj A Dadhania 16003398b742SNikunj A Dadhania ins_index = index; 16013398b742SNikunj A Dadhania for (i = 0; i < es && ins_index < 16; i++, ins_index++) { 160203b32c09SMark Cave-Ayland t.VsrB(ins_index) = xb->VsrB(8 - es + i); 16033398b742SNikunj A Dadhania } 16043398b742SNikunj A Dadhania 160503b32c09SMark Cave-Ayland *xt = t; 16063398b742SNikunj A Dadhania } 16073398b742SNikunj A Dadhania 1608634c5835SMark Cave-Ayland #define VEXT_SIGNED(name, element, cast) \ 1609fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 1610fcf5ef2aSThomas Huth { \ 1611fcf5ef2aSThomas Huth int i; \ 161260594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1613634c5835SMark Cave-Ayland r->element[i] = (cast)b->element[i]; \ 1614fcf5ef2aSThomas Huth } \ 1615fcf5ef2aSThomas Huth } 1616634c5835SMark Cave-Ayland VEXT_SIGNED(vextsb2w, s32, int8_t) 1617634c5835SMark Cave-Ayland VEXT_SIGNED(vextsb2d, s64, int8_t) 1618634c5835SMark Cave-Ayland VEXT_SIGNED(vextsh2w, s32, int16_t) 1619634c5835SMark Cave-Ayland VEXT_SIGNED(vextsh2d, s64, int16_t) 1620634c5835SMark Cave-Ayland VEXT_SIGNED(vextsw2d, s64, int32_t) 1621fcf5ef2aSThomas Huth #undef VEXT_SIGNED 1622fcf5ef2aSThomas Huth 1623fcf5ef2aSThomas Huth #define VNEG(name, element) \ 1624fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 1625fcf5ef2aSThomas Huth { \ 1626fcf5ef2aSThomas Huth int i; \ 162760594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1628fcf5ef2aSThomas Huth r->element[i] = -b->element[i]; \ 1629fcf5ef2aSThomas Huth } \ 1630fcf5ef2aSThomas Huth } 1631fcf5ef2aSThomas Huth VNEG(vnegw, s32) 1632fcf5ef2aSThomas Huth VNEG(vnegd, s64) 1633fcf5ef2aSThomas Huth #undef VNEG 1634fcf5ef2aSThomas Huth 1635fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1636fcf5ef2aSThomas Huth { 16373c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1638fcf5ef2aSThomas Huth 1639fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1640fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1641fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1642fcf5ef2aSThomas Huth #else 1643fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1644fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 1645fcf5ef2aSThomas Huth #endif 1646fcf5ef2aSThomas Huth } 1647fcf5ef2aSThomas Huth 1648fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1649fcf5ef2aSThomas Huth { 1650fcf5ef2aSThomas Huth int i; 1651fcf5ef2aSThomas Huth 1652fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 1653fcf5ef2aSThomas Huth r->u32[i] = a->u32[i] >= b->u32[i]; 1654fcf5ef2aSThomas Huth } 1655fcf5ef2aSThomas Huth } 1656fcf5ef2aSThomas Huth 1657fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1658fcf5ef2aSThomas Huth { 1659fcf5ef2aSThomas Huth int64_t t; 1660fcf5ef2aSThomas Huth int i, upper; 1661fcf5ef2aSThomas Huth ppc_avr_t result; 1662fcf5ef2aSThomas Huth int sat = 0; 1663fcf5ef2aSThomas Huth 1664fcf5ef2aSThomas Huth upper = ARRAY_SIZE(r->s32) - 1; 166560594feaSMark Cave-Ayland t = (int64_t)b->VsrSW(upper); 1666fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 166760594feaSMark Cave-Ayland t += a->VsrSW(i); 166860594feaSMark Cave-Ayland result.VsrSW(i) = 0; 1669fcf5ef2aSThomas Huth } 167060594feaSMark Cave-Ayland result.VsrSW(upper) = cvtsdsw(t, &sat); 1671fcf5ef2aSThomas Huth *r = result; 1672fcf5ef2aSThomas Huth 1673fcf5ef2aSThomas Huth if (sat) { 16746175f5a0SRichard Henderson set_vscr_sat(env); 1675fcf5ef2aSThomas Huth } 1676fcf5ef2aSThomas Huth } 1677fcf5ef2aSThomas Huth 1678fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1679fcf5ef2aSThomas Huth { 1680fcf5ef2aSThomas Huth int i, j, upper; 1681fcf5ef2aSThomas Huth ppc_avr_t result; 1682fcf5ef2aSThomas Huth int sat = 0; 1683fcf5ef2aSThomas Huth 1684fcf5ef2aSThomas Huth upper = 1; 1685fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 168660594feaSMark Cave-Ayland int64_t t = (int64_t)b->VsrSW(upper + i * 2); 1687fcf5ef2aSThomas Huth 16887fa0ddc1SAnton Blanchard result.VsrD(i) = 0; 1689fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u64); j++) { 169060594feaSMark Cave-Ayland t += a->VsrSW(2 * i + j); 1691fcf5ef2aSThomas Huth } 169260594feaSMark Cave-Ayland result.VsrSW(upper + i * 2) = cvtsdsw(t, &sat); 1693fcf5ef2aSThomas Huth } 1694fcf5ef2aSThomas Huth 1695fcf5ef2aSThomas Huth *r = result; 1696fcf5ef2aSThomas Huth if (sat) { 16976175f5a0SRichard Henderson set_vscr_sat(env); 1698fcf5ef2aSThomas Huth } 1699fcf5ef2aSThomas Huth } 1700fcf5ef2aSThomas Huth 1701fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1702fcf5ef2aSThomas Huth { 1703fcf5ef2aSThomas Huth int i, j; 1704fcf5ef2aSThomas Huth int sat = 0; 1705fcf5ef2aSThomas Huth 1706fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1707fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1708fcf5ef2aSThomas Huth 1709fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->s32); j++) { 1710fcf5ef2aSThomas Huth t += a->s8[4 * i + j]; 1711fcf5ef2aSThomas Huth } 1712fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1713fcf5ef2aSThomas Huth } 1714fcf5ef2aSThomas Huth 1715fcf5ef2aSThomas Huth if (sat) { 17166175f5a0SRichard Henderson set_vscr_sat(env); 1717fcf5ef2aSThomas Huth } 1718fcf5ef2aSThomas Huth } 1719fcf5ef2aSThomas Huth 1720fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1721fcf5ef2aSThomas Huth { 1722fcf5ef2aSThomas Huth int sat = 0; 1723fcf5ef2aSThomas Huth int i; 1724fcf5ef2aSThomas Huth 1725fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 1726fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 1727fcf5ef2aSThomas Huth 1728fcf5ef2aSThomas Huth t += a->s16[2 * i] + a->s16[2 * i + 1]; 1729fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 1730fcf5ef2aSThomas Huth } 1731fcf5ef2aSThomas Huth 1732fcf5ef2aSThomas Huth if (sat) { 17336175f5a0SRichard Henderson set_vscr_sat(env); 1734fcf5ef2aSThomas Huth } 1735fcf5ef2aSThomas Huth } 1736fcf5ef2aSThomas Huth 1737fcf5ef2aSThomas Huth void helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1738fcf5ef2aSThomas Huth { 1739fcf5ef2aSThomas Huth int i, j; 1740fcf5ef2aSThomas Huth int sat = 0; 1741fcf5ef2aSThomas Huth 1742fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 1743fcf5ef2aSThomas Huth uint64_t t = (uint64_t)b->u32[i]; 1744fcf5ef2aSThomas Huth 1745fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->u32); j++) { 1746fcf5ef2aSThomas Huth t += a->u8[4 * i + j]; 1747fcf5ef2aSThomas Huth } 1748fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1749fcf5ef2aSThomas Huth } 1750fcf5ef2aSThomas Huth 1751fcf5ef2aSThomas Huth if (sat) { 17526175f5a0SRichard Henderson set_vscr_sat(env); 1753fcf5ef2aSThomas Huth } 1754fcf5ef2aSThomas Huth } 1755fcf5ef2aSThomas Huth 1756fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1757fcf5ef2aSThomas Huth #define UPKHI 1 1758fcf5ef2aSThomas Huth #define UPKLO 0 1759fcf5ef2aSThomas Huth #else 1760fcf5ef2aSThomas Huth #define UPKHI 0 1761fcf5ef2aSThomas Huth #define UPKLO 1 1762fcf5ef2aSThomas Huth #endif 1763fcf5ef2aSThomas Huth #define VUPKPX(suffix, hi) \ 1764fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 1765fcf5ef2aSThomas Huth { \ 1766fcf5ef2aSThomas Huth int i; \ 1767fcf5ef2aSThomas Huth ppc_avr_t result; \ 1768fcf5ef2aSThomas Huth \ 1769fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { \ 1770fcf5ef2aSThomas Huth uint16_t e = b->u16[hi ? i : i + 4]; \ 1771fcf5ef2aSThomas Huth uint8_t a = (e >> 15) ? 0xff : 0; \ 1772fcf5ef2aSThomas Huth uint8_t r = (e >> 10) & 0x1f; \ 1773fcf5ef2aSThomas Huth uint8_t g = (e >> 5) & 0x1f; \ 1774fcf5ef2aSThomas Huth uint8_t b = e & 0x1f; \ 1775fcf5ef2aSThomas Huth \ 1776fcf5ef2aSThomas Huth result.u32[i] = (a << 24) | (r << 16) | (g << 8) | b; \ 1777fcf5ef2aSThomas Huth } \ 1778fcf5ef2aSThomas Huth *r = result; \ 1779fcf5ef2aSThomas Huth } 1780fcf5ef2aSThomas Huth VUPKPX(lpx, UPKLO) 1781fcf5ef2aSThomas Huth VUPKPX(hpx, UPKHI) 1782fcf5ef2aSThomas Huth #undef VUPKPX 1783fcf5ef2aSThomas Huth 1784fcf5ef2aSThomas Huth #define VUPK(suffix, unpacked, packee, hi) \ 1785fcf5ef2aSThomas Huth void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b) \ 1786fcf5ef2aSThomas Huth { \ 1787fcf5ef2aSThomas Huth int i; \ 1788fcf5ef2aSThomas Huth ppc_avr_t result; \ 1789fcf5ef2aSThomas Huth \ 1790fcf5ef2aSThomas Huth if (hi) { \ 1791fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) { \ 1792fcf5ef2aSThomas Huth result.unpacked[i] = b->packee[i]; \ 1793fcf5ef2aSThomas Huth } \ 1794fcf5ef2aSThomas Huth } else { \ 1795fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \ 1796fcf5ef2aSThomas Huth i++) { \ 1797fcf5ef2aSThomas Huth result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \ 1798fcf5ef2aSThomas Huth } \ 1799fcf5ef2aSThomas Huth } \ 1800fcf5ef2aSThomas Huth *r = result; \ 1801fcf5ef2aSThomas Huth } 1802fcf5ef2aSThomas Huth VUPK(hsb, s16, s8, UPKHI) 1803fcf5ef2aSThomas Huth VUPK(hsh, s32, s16, UPKHI) 1804fcf5ef2aSThomas Huth VUPK(hsw, s64, s32, UPKHI) 1805fcf5ef2aSThomas Huth VUPK(lsb, s16, s8, UPKLO) 1806fcf5ef2aSThomas Huth VUPK(lsh, s32, s16, UPKLO) 1807fcf5ef2aSThomas Huth VUPK(lsw, s64, s32, UPKLO) 1808fcf5ef2aSThomas Huth #undef VUPK 1809fcf5ef2aSThomas Huth #undef UPKHI 1810fcf5ef2aSThomas Huth #undef UPKLO 1811fcf5ef2aSThomas Huth 1812fcf5ef2aSThomas Huth #define VGENERIC_DO(name, element) \ 1813fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *b) \ 1814fcf5ef2aSThomas Huth { \ 1815fcf5ef2aSThomas Huth int i; \ 1816fcf5ef2aSThomas Huth \ 181760594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1818fcf5ef2aSThomas Huth r->element[i] = name(b->element[i]); \ 1819fcf5ef2aSThomas Huth } \ 1820fcf5ef2aSThomas Huth } 1821fcf5ef2aSThomas Huth 1822fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8) 1823fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16) 1824fcf5ef2aSThomas Huth 1825fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8) 1826fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16) 1827fcf5ef2aSThomas Huth 1828fcf5ef2aSThomas Huth #undef clzb 1829fcf5ef2aSThomas Huth #undef clzh 1830fcf5ef2aSThomas Huth 1831fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8) 1832fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? ctz32(v) : 16) 1833fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v)) 1834fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v)) 1835fcf5ef2aSThomas Huth 1836fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8) 1837fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16) 1838fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32) 1839fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64) 1840fcf5ef2aSThomas Huth 1841fcf5ef2aSThomas Huth #undef ctzb 1842fcf5ef2aSThomas Huth #undef ctzh 1843fcf5ef2aSThomas Huth #undef ctzw 1844fcf5ef2aSThomas Huth #undef ctzd 1845fcf5ef2aSThomas Huth 1846fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v) 1847fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v) 1848fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v) 1849fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v) 1850fcf5ef2aSThomas Huth 1851fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8) 1852fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16) 1853fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32) 1854fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64) 1855fcf5ef2aSThomas Huth 1856fcf5ef2aSThomas Huth #undef popcntb 1857fcf5ef2aSThomas Huth #undef popcnth 1858fcf5ef2aSThomas Huth #undef popcntw 1859fcf5ef2aSThomas Huth #undef popcntd 1860fcf5ef2aSThomas Huth 1861fcf5ef2aSThomas Huth #undef VGENERIC_DO 1862fcf5ef2aSThomas Huth 1863fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1864fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 0, 1 } } 1865fcf5ef2aSThomas Huth #else 1866fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 1, 0 } } 1867fcf5ef2aSThomas Huth #endif 1868fcf5ef2aSThomas Huth 1869fcf5ef2aSThomas Huth #ifndef CONFIG_INT128 1870fcf5ef2aSThomas Huth 1871fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a) 1872fcf5ef2aSThomas Huth { 1873fcf5ef2aSThomas Huth t->u64[0] = ~a.u64[0]; 1874fcf5ef2aSThomas Huth t->u64[1] = ~a.u64[1]; 1875fcf5ef2aSThomas Huth } 1876fcf5ef2aSThomas Huth 1877fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b) 1878fcf5ef2aSThomas Huth { 18793c385a93SMark Cave-Ayland if (a.VsrD(0) < b.VsrD(0)) { 1880fcf5ef2aSThomas Huth return -1; 18813c385a93SMark Cave-Ayland } else if (a.VsrD(0) > b.VsrD(0)) { 1882fcf5ef2aSThomas Huth return 1; 18833c385a93SMark Cave-Ayland } else if (a.VsrD(1) < b.VsrD(1)) { 1884fcf5ef2aSThomas Huth return -1; 18853c385a93SMark Cave-Ayland } else if (a.VsrD(1) > b.VsrD(1)) { 1886fcf5ef2aSThomas Huth return 1; 1887fcf5ef2aSThomas Huth } else { 1888fcf5ef2aSThomas Huth return 0; 1889fcf5ef2aSThomas Huth } 1890fcf5ef2aSThomas Huth } 1891fcf5ef2aSThomas Huth 1892fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 1893fcf5ef2aSThomas Huth { 18943c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 18953c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 18963c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 1897fcf5ef2aSThomas Huth } 1898fcf5ef2aSThomas Huth 1899fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 1900fcf5ef2aSThomas Huth { 1901fcf5ef2aSThomas Huth ppc_avr_t not_a; 19023c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 19033c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 19043c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 1905fcf5ef2aSThomas Huth avr_qw_not(¬_a, a); 1906fcf5ef2aSThomas Huth return avr_qw_cmpu(not_a, b) < 0; 1907fcf5ef2aSThomas Huth } 1908fcf5ef2aSThomas Huth 1909fcf5ef2aSThomas Huth #endif 1910fcf5ef2aSThomas Huth 1911fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1912fcf5ef2aSThomas Huth { 1913fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1914fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128; 1915fcf5ef2aSThomas Huth #else 1916fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 1917fcf5ef2aSThomas Huth #endif 1918fcf5ef2aSThomas Huth } 1919fcf5ef2aSThomas Huth 1920fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1921fcf5ef2aSThomas Huth { 1922fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1923fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128 + (c->u128 & 1); 1924fcf5ef2aSThomas Huth #else 1925fcf5ef2aSThomas Huth 19263c385a93SMark Cave-Ayland if (c->VsrD(1) & 1) { 1927fcf5ef2aSThomas Huth ppc_avr_t tmp; 1928fcf5ef2aSThomas Huth 19293c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 19303c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 1931fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 1932fcf5ef2aSThomas Huth avr_qw_add(r, tmp, *b); 1933fcf5ef2aSThomas Huth } else { 1934fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 1935fcf5ef2aSThomas Huth } 1936fcf5ef2aSThomas Huth #endif 1937fcf5ef2aSThomas Huth } 1938fcf5ef2aSThomas Huth 1939fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1940fcf5ef2aSThomas Huth { 1941fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1942fcf5ef2aSThomas Huth r->u128 = (~a->u128 < b->u128); 1943fcf5ef2aSThomas Huth #else 1944fcf5ef2aSThomas Huth ppc_avr_t not_a; 1945fcf5ef2aSThomas Huth 1946fcf5ef2aSThomas Huth avr_qw_not(¬_a, *a); 1947fcf5ef2aSThomas Huth 19483c385a93SMark Cave-Ayland r->VsrD(0) = 0; 19493c385a93SMark Cave-Ayland r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0); 1950fcf5ef2aSThomas Huth #endif 1951fcf5ef2aSThomas Huth } 1952fcf5ef2aSThomas Huth 1953fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1954fcf5ef2aSThomas Huth { 1955fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1956fcf5ef2aSThomas Huth int carry_out = (~a->u128 < b->u128); 1957fcf5ef2aSThomas Huth if (!carry_out && (c->u128 & 1)) { 1958fcf5ef2aSThomas Huth carry_out = ((a->u128 + b->u128 + 1) == 0) && 1959fcf5ef2aSThomas Huth ((a->u128 != 0) || (b->u128 != 0)); 1960fcf5ef2aSThomas Huth } 1961fcf5ef2aSThomas Huth r->u128 = carry_out; 1962fcf5ef2aSThomas Huth #else 1963fcf5ef2aSThomas Huth 19643c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 1965fcf5ef2aSThomas Huth int carry_out = 0; 1966fcf5ef2aSThomas Huth ppc_avr_t tmp; 1967fcf5ef2aSThomas Huth 1968fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, *a, *b); 1969fcf5ef2aSThomas Huth 1970fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 1971fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 1972fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, tmp, one); 1973fcf5ef2aSThomas Huth } 19743c385a93SMark Cave-Ayland r->VsrD(0) = 0; 19753c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 1976fcf5ef2aSThomas Huth #endif 1977fcf5ef2aSThomas Huth } 1978fcf5ef2aSThomas Huth 1979fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1980fcf5ef2aSThomas Huth { 1981fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1982fcf5ef2aSThomas Huth r->u128 = a->u128 - b->u128; 1983fcf5ef2aSThomas Huth #else 1984fcf5ef2aSThomas Huth ppc_avr_t tmp; 1985fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 1986fcf5ef2aSThomas Huth 1987fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 1988fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 1989fcf5ef2aSThomas Huth avr_qw_add(r, tmp, one); 1990fcf5ef2aSThomas Huth #endif 1991fcf5ef2aSThomas Huth } 1992fcf5ef2aSThomas Huth 1993fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 1994fcf5ef2aSThomas Huth { 1995fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1996fcf5ef2aSThomas Huth r->u128 = a->u128 + ~b->u128 + (c->u128 & 1); 1997fcf5ef2aSThomas Huth #else 1998fcf5ef2aSThomas Huth ppc_avr_t tmp, sum; 1999fcf5ef2aSThomas Huth 2000fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2001fcf5ef2aSThomas Huth avr_qw_add(&sum, *a, tmp); 2002fcf5ef2aSThomas Huth 20033c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 20043c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 2005fcf5ef2aSThomas Huth avr_qw_add(r, sum, tmp); 2006fcf5ef2aSThomas Huth #endif 2007fcf5ef2aSThomas Huth } 2008fcf5ef2aSThomas Huth 2009fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2010fcf5ef2aSThomas Huth { 2011fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2012fcf5ef2aSThomas Huth r->u128 = (~a->u128 < ~b->u128) || 2013fcf5ef2aSThomas Huth (a->u128 + ~b->u128 == (__uint128_t)-1); 2014fcf5ef2aSThomas Huth #else 2015fcf5ef2aSThomas Huth int carry = (avr_qw_cmpu(*a, *b) > 0); 2016fcf5ef2aSThomas Huth if (!carry) { 2017fcf5ef2aSThomas Huth ppc_avr_t tmp; 2018fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2019fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 20203c385a93SMark Cave-Ayland carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull)); 2021fcf5ef2aSThomas Huth } 20223c385a93SMark Cave-Ayland r->VsrD(0) = 0; 20233c385a93SMark Cave-Ayland r->VsrD(1) = carry; 2024fcf5ef2aSThomas Huth #endif 2025fcf5ef2aSThomas Huth } 2026fcf5ef2aSThomas Huth 2027fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2028fcf5ef2aSThomas Huth { 2029fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2030fcf5ef2aSThomas Huth r->u128 = 2031fcf5ef2aSThomas Huth (~a->u128 < ~b->u128) || 2032fcf5ef2aSThomas Huth ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1)); 2033fcf5ef2aSThomas Huth #else 20343c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 2035fcf5ef2aSThomas Huth int carry_out = (avr_qw_cmpu(*a, *b) > 0); 2036fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2037fcf5ef2aSThomas Huth ppc_avr_t tmp; 2038fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2039fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 20403c385a93SMark Cave-Ayland carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull)); 2041fcf5ef2aSThomas Huth } 2042fcf5ef2aSThomas Huth 20433c385a93SMark Cave-Ayland r->VsrD(0) = 0; 20443c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2045fcf5ef2aSThomas Huth #endif 2046fcf5ef2aSThomas Huth } 2047fcf5ef2aSThomas Huth 2048fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_1 0xC 2049fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_2 0xF 2050fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_1 0xA 2051fcf5ef2aSThomas Huth #define BCD_NEG_PREF 0xD 2052fcf5ef2aSThomas Huth #define BCD_NEG_ALT 0xB 2053fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_2 0xE 2054fcf5ef2aSThomas Huth #define NATIONAL_PLUS 0x2B 2055fcf5ef2aSThomas Huth #define NATIONAL_NEG 0x2D 2056fcf5ef2aSThomas Huth 2057365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) (15 - ((n) / 2)) 2058fcf5ef2aSThomas Huth 2059fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd) 2060fcf5ef2aSThomas Huth { 2061428115c3SMark Cave-Ayland switch (bcd->VsrB(BCD_DIG_BYTE(0)) & 0xF) { 2062fcf5ef2aSThomas Huth case BCD_PLUS_PREF_1: 2063fcf5ef2aSThomas Huth case BCD_PLUS_PREF_2: 2064fcf5ef2aSThomas Huth case BCD_PLUS_ALT_1: 2065fcf5ef2aSThomas Huth case BCD_PLUS_ALT_2: 2066fcf5ef2aSThomas Huth { 2067fcf5ef2aSThomas Huth return 1; 2068fcf5ef2aSThomas Huth } 2069fcf5ef2aSThomas Huth 2070fcf5ef2aSThomas Huth case BCD_NEG_PREF: 2071fcf5ef2aSThomas Huth case BCD_NEG_ALT: 2072fcf5ef2aSThomas Huth { 2073fcf5ef2aSThomas Huth return -1; 2074fcf5ef2aSThomas Huth } 2075fcf5ef2aSThomas Huth 2076fcf5ef2aSThomas Huth default: 2077fcf5ef2aSThomas Huth { 2078fcf5ef2aSThomas Huth return 0; 2079fcf5ef2aSThomas Huth } 2080fcf5ef2aSThomas Huth } 2081fcf5ef2aSThomas Huth } 2082fcf5ef2aSThomas Huth 2083fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps) 2084fcf5ef2aSThomas Huth { 2085fcf5ef2aSThomas Huth if (sgn >= 0) { 2086fcf5ef2aSThomas Huth return (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2; 2087fcf5ef2aSThomas Huth } else { 2088fcf5ef2aSThomas Huth return BCD_NEG_PREF; 2089fcf5ef2aSThomas Huth } 2090fcf5ef2aSThomas Huth } 2091fcf5ef2aSThomas Huth 2092fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid) 2093fcf5ef2aSThomas Huth { 2094fcf5ef2aSThomas Huth uint8_t result; 2095fcf5ef2aSThomas Huth if (n & 1) { 2096428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) >> 4; 2097fcf5ef2aSThomas Huth } else { 2098428115c3SMark Cave-Ayland result = bcd->VsrB(BCD_DIG_BYTE(n)) & 0xF; 2099fcf5ef2aSThomas Huth } 2100fcf5ef2aSThomas Huth 2101fcf5ef2aSThomas Huth if (unlikely(result > 9)) { 2102fcf5ef2aSThomas Huth *invalid = true; 2103fcf5ef2aSThomas Huth } 2104fcf5ef2aSThomas Huth return result; 2105fcf5ef2aSThomas Huth } 2106fcf5ef2aSThomas Huth 2107fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n) 2108fcf5ef2aSThomas Huth { 2109fcf5ef2aSThomas Huth if (n & 1) { 2110428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0x0F; 2111428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= (digit << 4); 2112fcf5ef2aSThomas Huth } else { 2113428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) &= 0xF0; 2114428115c3SMark Cave-Ayland bcd->VsrB(BCD_DIG_BYTE(n)) |= digit; 2115fcf5ef2aSThomas Huth } 2116fcf5ef2aSThomas Huth } 2117fcf5ef2aSThomas Huth 2118071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd) 2119071663dfSJose Ricardo Ziviani { 2120071663dfSJose Ricardo Ziviani int i; 2121071663dfSJose Ricardo Ziviani int invalid = 0; 2122071663dfSJose Ricardo Ziviani 2123071663dfSJose Ricardo Ziviani if (bcd_get_sgn(bcd) == 0) { 2124071663dfSJose Ricardo Ziviani return false; 2125071663dfSJose Ricardo Ziviani } 2126071663dfSJose Ricardo Ziviani 2127071663dfSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2128071663dfSJose Ricardo Ziviani bcd_get_digit(bcd, i, &invalid); 2129071663dfSJose Ricardo Ziviani if (unlikely(invalid)) { 2130071663dfSJose Ricardo Ziviani return false; 2131071663dfSJose Ricardo Ziviani } 2132071663dfSJose Ricardo Ziviani } 2133071663dfSJose Ricardo Ziviani return true; 2134071663dfSJose Ricardo Ziviani } 2135071663dfSJose Ricardo Ziviani 2136fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd) 2137fcf5ef2aSThomas Huth { 21383c385a93SMark Cave-Ayland if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) { 2139efa73196SNikunj A Dadhania return CRF_EQ; 2140fcf5ef2aSThomas Huth } else { 2141efa73196SNikunj A Dadhania return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT; 2142fcf5ef2aSThomas Huth } 2143fcf5ef2aSThomas Huth } 2144fcf5ef2aSThomas Huth 2145fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n) 2146fcf5ef2aSThomas Huth { 214760594feaSMark Cave-Ayland return reg->VsrH(7 - n); 2148fcf5ef2aSThomas Huth } 2149fcf5ef2aSThomas Huth 2150fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n) 2151fcf5ef2aSThomas Huth { 215260594feaSMark Cave-Ayland reg->VsrH(7 - n) = val; 2153fcf5ef2aSThomas Huth } 2154fcf5ef2aSThomas Huth 2155fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b) 2156fcf5ef2aSThomas Huth { 2157fcf5ef2aSThomas Huth int i; 2158fcf5ef2aSThomas Huth int invalid = 0; 2159fcf5ef2aSThomas Huth for (i = 31; i > 0; i--) { 2160fcf5ef2aSThomas Huth uint8_t dig_a = bcd_get_digit(a, i, &invalid); 2161fcf5ef2aSThomas Huth uint8_t dig_b = bcd_get_digit(b, i, &invalid); 2162fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2163fcf5ef2aSThomas Huth return 0; /* doesn't matter */ 2164fcf5ef2aSThomas Huth } else if (dig_a > dig_b) { 2165fcf5ef2aSThomas Huth return 1; 2166fcf5ef2aSThomas Huth } else if (dig_a < dig_b) { 2167fcf5ef2aSThomas Huth return -1; 2168fcf5ef2aSThomas Huth } 2169fcf5ef2aSThomas Huth } 2170fcf5ef2aSThomas Huth 2171fcf5ef2aSThomas Huth return 0; 2172fcf5ef2aSThomas Huth } 2173fcf5ef2aSThomas Huth 2174936fda4dSFabiano Rosas static int bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2175fcf5ef2aSThomas Huth int *overflow) 2176fcf5ef2aSThomas Huth { 2177fcf5ef2aSThomas Huth int carry = 0; 2178fcf5ef2aSThomas Huth int i; 2179936fda4dSFabiano Rosas int is_zero = 1; 2180936fda4dSFabiano Rosas 2181fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2182fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) + 2183fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2184936fda4dSFabiano Rosas is_zero &= (digit == 0); 2185fcf5ef2aSThomas Huth if (digit > 9) { 2186fcf5ef2aSThomas Huth carry = 1; 2187fcf5ef2aSThomas Huth digit -= 10; 2188fcf5ef2aSThomas Huth } else { 2189fcf5ef2aSThomas Huth carry = 0; 2190fcf5ef2aSThomas Huth } 2191fcf5ef2aSThomas Huth 2192fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2193fcf5ef2aSThomas Huth } 2194fcf5ef2aSThomas Huth 2195fcf5ef2aSThomas Huth *overflow = carry; 2196936fda4dSFabiano Rosas return is_zero; 2197fcf5ef2aSThomas Huth } 2198fcf5ef2aSThomas Huth 2199d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2200fcf5ef2aSThomas Huth int *overflow) 2201fcf5ef2aSThomas Huth { 2202fcf5ef2aSThomas Huth int carry = 0; 2203fcf5ef2aSThomas Huth int i; 2204d03b174aSYasmin Beatriz 2205fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2206fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) - 2207fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2208fcf5ef2aSThomas Huth if (digit & 0x80) { 2209fcf5ef2aSThomas Huth carry = -1; 2210fcf5ef2aSThomas Huth digit += 10; 2211fcf5ef2aSThomas Huth } else { 2212fcf5ef2aSThomas Huth carry = 0; 2213fcf5ef2aSThomas Huth } 2214fcf5ef2aSThomas Huth 2215fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2216fcf5ef2aSThomas Huth } 2217fcf5ef2aSThomas Huth 2218fcf5ef2aSThomas Huth *overflow = carry; 2219fcf5ef2aSThomas Huth } 2220fcf5ef2aSThomas Huth 2221fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2222fcf5ef2aSThomas Huth { 2223fcf5ef2aSThomas Huth 2224fcf5ef2aSThomas Huth int sgna = bcd_get_sgn(a); 2225fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2226fcf5ef2aSThomas Huth int invalid = (sgna == 0) || (sgnb == 0); 2227fcf5ef2aSThomas Huth int overflow = 0; 2228936fda4dSFabiano Rosas int zero = 0; 2229fcf5ef2aSThomas Huth uint32_t cr = 0; 2230fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 2231fcf5ef2aSThomas Huth 2232fcf5ef2aSThomas Huth if (!invalid) { 2233fcf5ef2aSThomas Huth if (sgna == sgnb) { 2234428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2235936fda4dSFabiano Rosas zero = bcd_add_mag(&result, a, b, &invalid, &overflow); 2236936fda4dSFabiano Rosas cr = (sgna > 0) ? CRF_GT : CRF_LT; 2237fcf5ef2aSThomas Huth } else { 2238d03b174aSYasmin Beatriz int magnitude = bcd_cmp_mag(a, b); 2239d03b174aSYasmin Beatriz if (magnitude > 0) { 2240428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgna, ps); 2241d03b174aSYasmin Beatriz bcd_sub_mag(&result, a, b, &invalid, &overflow); 2242d03b174aSYasmin Beatriz cr = (sgna > 0) ? CRF_GT : CRF_LT; 2243d03b174aSYasmin Beatriz } else if (magnitude < 0) { 2244428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(sgnb, ps); 2245d03b174aSYasmin Beatriz bcd_sub_mag(&result, b, a, &invalid, &overflow); 2246efa73196SNikunj A Dadhania cr = (sgnb > 0) ? CRF_GT : CRF_LT; 2247d03b174aSYasmin Beatriz } else { 2248428115c3SMark Cave-Ayland result.VsrB(BCD_DIG_BYTE(0)) = bcd_preferred_sgn(0, ps); 2249d03b174aSYasmin Beatriz cr = CRF_EQ; 2250d03b174aSYasmin Beatriz } 2251fcf5ef2aSThomas Huth } 2252fcf5ef2aSThomas Huth } 2253fcf5ef2aSThomas Huth 2254fcf5ef2aSThomas Huth if (unlikely(invalid)) { 22553c385a93SMark Cave-Ayland result.VsrD(0) = result.VsrD(1) = -1; 2256efa73196SNikunj A Dadhania cr = CRF_SO; 2257fcf5ef2aSThomas Huth } else if (overflow) { 2258efa73196SNikunj A Dadhania cr |= CRF_SO; 2259936fda4dSFabiano Rosas } else if (zero) { 2260936fda4dSFabiano Rosas cr |= CRF_EQ; 2261fcf5ef2aSThomas Huth } 2262fcf5ef2aSThomas Huth 2263fcf5ef2aSThomas Huth *r = result; 2264fcf5ef2aSThomas Huth 2265fcf5ef2aSThomas Huth return cr; 2266fcf5ef2aSThomas Huth } 2267fcf5ef2aSThomas Huth 2268fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2269fcf5ef2aSThomas Huth { 2270fcf5ef2aSThomas Huth ppc_avr_t bcopy = *b; 2271fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2272fcf5ef2aSThomas Huth if (sgnb < 0) { 2273fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0); 2274fcf5ef2aSThomas Huth } else if (sgnb > 0) { 2275fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_NEG_PREF, 0); 2276fcf5ef2aSThomas Huth } 2277fcf5ef2aSThomas Huth /* else invalid ... defer to bcdadd code for proper handling */ 2278fcf5ef2aSThomas Huth 2279fcf5ef2aSThomas Huth return helper_bcdadd(r, a, &bcopy, ps); 2280fcf5ef2aSThomas Huth } 2281fcf5ef2aSThomas Huth 2282fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2283fcf5ef2aSThomas Huth { 2284fcf5ef2aSThomas Huth int i; 2285fcf5ef2aSThomas Huth int cr = 0; 2286fcf5ef2aSThomas Huth uint16_t national = 0; 2287fcf5ef2aSThomas Huth uint16_t sgnb = get_national_digit(b, 0); 2288fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2289fcf5ef2aSThomas Huth int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG); 2290fcf5ef2aSThomas Huth 2291fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2292fcf5ef2aSThomas Huth national = get_national_digit(b, i); 2293fcf5ef2aSThomas Huth if (unlikely(national < 0x30 || national > 0x39)) { 2294fcf5ef2aSThomas Huth invalid = 1; 2295fcf5ef2aSThomas Huth break; 2296fcf5ef2aSThomas Huth } 2297fcf5ef2aSThomas Huth 2298fcf5ef2aSThomas Huth bcd_put_digit(&ret, national & 0xf, i); 2299fcf5ef2aSThomas Huth } 2300fcf5ef2aSThomas Huth 2301fcf5ef2aSThomas Huth if (sgnb == NATIONAL_PLUS) { 2302fcf5ef2aSThomas Huth bcd_put_digit(&ret, (ps == 0) ? BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0); 2303fcf5ef2aSThomas Huth } else { 2304fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2305fcf5ef2aSThomas Huth } 2306fcf5ef2aSThomas Huth 2307fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2308fcf5ef2aSThomas Huth 2309fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2310efa73196SNikunj A Dadhania cr = CRF_SO; 2311fcf5ef2aSThomas Huth } 2312fcf5ef2aSThomas Huth 2313fcf5ef2aSThomas Huth *r = ret; 2314fcf5ef2aSThomas Huth 2315fcf5ef2aSThomas Huth return cr; 2316fcf5ef2aSThomas Huth } 2317fcf5ef2aSThomas Huth 2318fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2319fcf5ef2aSThomas Huth { 2320fcf5ef2aSThomas Huth int i; 2321fcf5ef2aSThomas Huth int cr = 0; 2322fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2323fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2324fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2325fcf5ef2aSThomas Huth 23263c385a93SMark Cave-Ayland int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0); 2327fcf5ef2aSThomas Huth 2328fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2329fcf5ef2aSThomas Huth set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i); 2330fcf5ef2aSThomas Huth 2331fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2332fcf5ef2aSThomas Huth break; 2333fcf5ef2aSThomas Huth } 2334fcf5ef2aSThomas Huth } 2335fcf5ef2aSThomas Huth set_national_digit(&ret, (sgnb == -1) ? NATIONAL_NEG : NATIONAL_PLUS, 0); 2336fcf5ef2aSThomas Huth 2337fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2338fcf5ef2aSThomas Huth 2339fcf5ef2aSThomas Huth if (ox_flag) { 2340efa73196SNikunj A Dadhania cr |= CRF_SO; 2341fcf5ef2aSThomas Huth } 2342fcf5ef2aSThomas Huth 2343fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2344efa73196SNikunj A Dadhania cr = CRF_SO; 2345fcf5ef2aSThomas Huth } 2346fcf5ef2aSThomas Huth 2347fcf5ef2aSThomas Huth *r = ret; 2348fcf5ef2aSThomas Huth 2349fcf5ef2aSThomas Huth return cr; 2350fcf5ef2aSThomas Huth } 2351fcf5ef2aSThomas Huth 2352fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2353fcf5ef2aSThomas Huth { 2354fcf5ef2aSThomas Huth int i; 2355fcf5ef2aSThomas Huth int cr = 0; 2356fcf5ef2aSThomas Huth int invalid = 0; 2357fcf5ef2aSThomas Huth int zone_digit = 0; 2358fcf5ef2aSThomas Huth int zone_lead = ps ? 0xF : 0x3; 2359fcf5ef2aSThomas Huth int digit = 0; 2360fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2361428115c3SMark Cave-Ayland int sgnb = b->VsrB(BCD_DIG_BYTE(0)) >> 4; 2362fcf5ef2aSThomas Huth 2363fcf5ef2aSThomas Huth if (unlikely((sgnb < 0xA) && ps)) { 2364fcf5ef2aSThomas Huth invalid = 1; 2365fcf5ef2aSThomas Huth } 2366fcf5ef2aSThomas Huth 2367fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2368428115c3SMark Cave-Ayland zone_digit = i ? b->VsrB(BCD_DIG_BYTE(i * 2)) >> 4 : zone_lead; 2369428115c3SMark Cave-Ayland digit = b->VsrB(BCD_DIG_BYTE(i * 2)) & 0xF; 2370fcf5ef2aSThomas Huth if (unlikely(zone_digit != zone_lead || digit > 0x9)) { 2371fcf5ef2aSThomas Huth invalid = 1; 2372fcf5ef2aSThomas Huth break; 2373fcf5ef2aSThomas Huth } 2374fcf5ef2aSThomas Huth 2375fcf5ef2aSThomas Huth bcd_put_digit(&ret, digit, i + 1); 2376fcf5ef2aSThomas Huth } 2377fcf5ef2aSThomas Huth 2378fcf5ef2aSThomas Huth if ((ps && (sgnb == 0xB || sgnb == 0xD)) || 2379fcf5ef2aSThomas Huth (!ps && (sgnb & 0x4))) { 2380fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2381fcf5ef2aSThomas Huth } else { 2382fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0); 2383fcf5ef2aSThomas Huth } 2384fcf5ef2aSThomas Huth 2385fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2386fcf5ef2aSThomas Huth 2387fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2388efa73196SNikunj A Dadhania cr = CRF_SO; 2389fcf5ef2aSThomas Huth } 2390fcf5ef2aSThomas Huth 2391fcf5ef2aSThomas Huth *r = ret; 2392fcf5ef2aSThomas Huth 2393fcf5ef2aSThomas Huth return cr; 2394fcf5ef2aSThomas Huth } 2395fcf5ef2aSThomas Huth 2396fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2397fcf5ef2aSThomas Huth { 2398fcf5ef2aSThomas Huth int i; 2399fcf5ef2aSThomas Huth int cr = 0; 2400fcf5ef2aSThomas Huth uint8_t digit = 0; 2401fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2402fcf5ef2aSThomas Huth int zone_lead = (ps) ? 0xF0 : 0x30; 2403fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2404fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2405fcf5ef2aSThomas Huth 24063c385a93SMark Cave-Ayland int ox_flag = ((b->VsrD(0) >> 4) != 0); 2407fcf5ef2aSThomas Huth 2408fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2409fcf5ef2aSThomas Huth digit = bcd_get_digit(b, i + 1, &invalid); 2410fcf5ef2aSThomas Huth 2411fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2412fcf5ef2aSThomas Huth break; 2413fcf5ef2aSThomas Huth } 2414fcf5ef2aSThomas Huth 2415428115c3SMark Cave-Ayland ret.VsrB(BCD_DIG_BYTE(i * 2)) = zone_lead + digit; 2416fcf5ef2aSThomas Huth } 2417fcf5ef2aSThomas Huth 2418fcf5ef2aSThomas Huth if (ps) { 2419fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1); 2420fcf5ef2aSThomas Huth } else { 2421fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1); 2422fcf5ef2aSThomas Huth } 2423fcf5ef2aSThomas Huth 2424fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2425fcf5ef2aSThomas Huth 2426fcf5ef2aSThomas Huth if (ox_flag) { 2427efa73196SNikunj A Dadhania cr |= CRF_SO; 2428fcf5ef2aSThomas Huth } 2429fcf5ef2aSThomas Huth 2430fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2431efa73196SNikunj A Dadhania cr = CRF_SO; 2432fcf5ef2aSThomas Huth } 2433fcf5ef2aSThomas Huth 2434fcf5ef2aSThomas Huth *r = ret; 2435fcf5ef2aSThomas Huth 2436fcf5ef2aSThomas Huth return cr; 2437fcf5ef2aSThomas Huth } 2438fcf5ef2aSThomas Huth 2439a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2440a406c058SJose Ricardo Ziviani { 2441a406c058SJose Ricardo Ziviani int i; 2442a406c058SJose Ricardo Ziviani int cr = 0; 2443a406c058SJose Ricardo Ziviani uint64_t lo_value; 2444a406c058SJose Ricardo Ziviani uint64_t hi_value; 2445a406c058SJose Ricardo Ziviani ppc_avr_t ret = { .u64 = { 0, 0 } }; 2446a406c058SJose Ricardo Ziviani 24473c385a93SMark Cave-Ayland if (b->VsrSD(0) < 0) { 24483c385a93SMark Cave-Ayland lo_value = -b->VsrSD(1); 24493c385a93SMark Cave-Ayland hi_value = ~b->VsrD(0) + !lo_value; 2450a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, 0xD, 0); 2451a406c058SJose Ricardo Ziviani } else { 24523c385a93SMark Cave-Ayland lo_value = b->VsrD(1); 24533c385a93SMark Cave-Ayland hi_value = b->VsrD(0); 2454a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0); 2455a406c058SJose Ricardo Ziviani } 2456a406c058SJose Ricardo Ziviani 2457a406c058SJose Ricardo Ziviani if (divu128(&lo_value, &hi_value, 1000000000000000ULL) || 2458a406c058SJose Ricardo Ziviani lo_value > 9999999999999999ULL) { 2459a406c058SJose Ricardo Ziviani cr = CRF_SO; 2460a406c058SJose Ricardo Ziviani } 2461a406c058SJose Ricardo Ziviani 2462a406c058SJose Ricardo Ziviani for (i = 1; i < 16; hi_value /= 10, i++) { 2463a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, hi_value % 10, i); 2464a406c058SJose Ricardo Ziviani } 2465a406c058SJose Ricardo Ziviani 2466a406c058SJose Ricardo Ziviani for (; i < 32; lo_value /= 10, i++) { 2467a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, lo_value % 10, i); 2468a406c058SJose Ricardo Ziviani } 2469a406c058SJose Ricardo Ziviani 2470a406c058SJose Ricardo Ziviani cr |= bcd_cmp_zero(&ret); 2471a406c058SJose Ricardo Ziviani 2472a406c058SJose Ricardo Ziviani *r = ret; 2473a406c058SJose Ricardo Ziviani 2474a406c058SJose Ricardo Ziviani return cr; 2475a406c058SJose Ricardo Ziviani } 2476a406c058SJose Ricardo Ziviani 2477c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2478c85bc7ddSJose Ricardo Ziviani { 2479c85bc7ddSJose Ricardo Ziviani uint8_t i; 2480c85bc7ddSJose Ricardo Ziviani int cr; 2481c85bc7ddSJose Ricardo Ziviani uint64_t carry; 2482c85bc7ddSJose Ricardo Ziviani uint64_t unused; 2483c85bc7ddSJose Ricardo Ziviani uint64_t lo_value; 2484c85bc7ddSJose Ricardo Ziviani uint64_t hi_value = 0; 2485c85bc7ddSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2486c85bc7ddSJose Ricardo Ziviani int invalid = (sgnb == 0); 2487c85bc7ddSJose Ricardo Ziviani 2488c85bc7ddSJose Ricardo Ziviani lo_value = bcd_get_digit(b, 31, &invalid); 2489c85bc7ddSJose Ricardo Ziviani for (i = 30; i > 0; i--) { 2490c85bc7ddSJose Ricardo Ziviani mulu64(&lo_value, &carry, lo_value, 10ULL); 2491c85bc7ddSJose Ricardo Ziviani mulu64(&hi_value, &unused, hi_value, 10ULL); 2492c85bc7ddSJose Ricardo Ziviani lo_value += bcd_get_digit(b, i, &invalid); 2493c85bc7ddSJose Ricardo Ziviani hi_value += carry; 2494c85bc7ddSJose Ricardo Ziviani 2495c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2496c85bc7ddSJose Ricardo Ziviani break; 2497c85bc7ddSJose Ricardo Ziviani } 2498c85bc7ddSJose Ricardo Ziviani } 2499c85bc7ddSJose Ricardo Ziviani 2500c85bc7ddSJose Ricardo Ziviani if (sgnb == -1) { 25013c385a93SMark Cave-Ayland r->VsrSD(1) = -lo_value; 25023c385a93SMark Cave-Ayland r->VsrSD(0) = ~hi_value + !r->VsrSD(1); 2503c85bc7ddSJose Ricardo Ziviani } else { 25043c385a93SMark Cave-Ayland r->VsrSD(1) = lo_value; 25053c385a93SMark Cave-Ayland r->VsrSD(0) = hi_value; 2506c85bc7ddSJose Ricardo Ziviani } 2507c85bc7ddSJose Ricardo Ziviani 2508c85bc7ddSJose Ricardo Ziviani cr = bcd_cmp_zero(b); 2509c85bc7ddSJose Ricardo Ziviani 2510c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2511c85bc7ddSJose Ricardo Ziviani cr = CRF_SO; 2512c85bc7ddSJose Ricardo Ziviani } 2513c85bc7ddSJose Ricardo Ziviani 2514c85bc7ddSJose Ricardo Ziviani return cr; 2515c85bc7ddSJose Ricardo Ziviani } 2516c85bc7ddSJose Ricardo Ziviani 2517c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2518c3025c3bSJose Ricardo Ziviani { 2519c3025c3bSJose Ricardo Ziviani int i; 2520c3025c3bSJose Ricardo Ziviani int invalid = 0; 2521c3025c3bSJose Ricardo Ziviani 2522c3025c3bSJose Ricardo Ziviani if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) { 2523c3025c3bSJose Ricardo Ziviani return CRF_SO; 2524c3025c3bSJose Ricardo Ziviani } 2525c3025c3bSJose Ricardo Ziviani 2526c3025c3bSJose Ricardo Ziviani *r = *a; 2527428115c3SMark Cave-Ayland bcd_put_digit(r, b->VsrB(BCD_DIG_BYTE(0)) & 0xF, 0); 2528c3025c3bSJose Ricardo Ziviani 2529c3025c3bSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2530c3025c3bSJose Ricardo Ziviani bcd_get_digit(a, i, &invalid); 2531c3025c3bSJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2532c3025c3bSJose Ricardo Ziviani if (unlikely(invalid)) { 2533c3025c3bSJose Ricardo Ziviani return CRF_SO; 2534c3025c3bSJose Ricardo Ziviani } 2535c3025c3bSJose Ricardo Ziviani } 2536c3025c3bSJose Ricardo Ziviani 2537c3025c3bSJose Ricardo Ziviani return bcd_cmp_zero(r); 2538c3025c3bSJose Ricardo Ziviani } 2539c3025c3bSJose Ricardo Ziviani 2540466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2541466a3f9cSJose Ricardo Ziviani { 2542466a3f9cSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2543466a3f9cSJose Ricardo Ziviani 2544466a3f9cSJose Ricardo Ziviani *r = *b; 2545466a3f9cSJose Ricardo Ziviani bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0); 2546466a3f9cSJose Ricardo Ziviani 2547071663dfSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2548466a3f9cSJose Ricardo Ziviani return CRF_SO; 2549466a3f9cSJose Ricardo Ziviani } 2550466a3f9cSJose Ricardo Ziviani 2551466a3f9cSJose Ricardo Ziviani return bcd_cmp_zero(r); 2552466a3f9cSJose Ricardo Ziviani } 2553466a3f9cSJose Ricardo Ziviani 2554e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2555e04797f7SJose Ricardo Ziviani { 2556e04797f7SJose Ricardo Ziviani int cr; 2557428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2558e04797f7SJose Ricardo Ziviani bool ox_flag = false; 2559e04797f7SJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2560e04797f7SJose Ricardo Ziviani ppc_avr_t ret = *b; 25613c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2562e04797f7SJose Ricardo Ziviani 2563e04797f7SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2564e04797f7SJose Ricardo Ziviani return CRF_SO; 2565e04797f7SJose Ricardo Ziviani } 2566e04797f7SJose Ricardo Ziviani 2567e04797f7SJose Ricardo Ziviani if (unlikely(i > 31)) { 2568e04797f7SJose Ricardo Ziviani i = 31; 2569e04797f7SJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2570e04797f7SJose Ricardo Ziviani i = -31; 2571e04797f7SJose Ricardo Ziviani } 2572e04797f7SJose Ricardo Ziviani 2573e04797f7SJose Ricardo Ziviani if (i > 0) { 25743c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2575e04797f7SJose Ricardo Ziviani } else { 25763c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2577e04797f7SJose Ricardo Ziviani } 2578e04797f7SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2579e04797f7SJose Ricardo Ziviani 2580e04797f7SJose Ricardo Ziviani *r = ret; 2581e04797f7SJose Ricardo Ziviani 2582e04797f7SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2583e04797f7SJose Ricardo Ziviani if (ox_flag) { 2584e04797f7SJose Ricardo Ziviani cr |= CRF_SO; 2585e04797f7SJose Ricardo Ziviani } 2586e04797f7SJose Ricardo Ziviani 2587e04797f7SJose Ricardo Ziviani return cr; 2588e04797f7SJose Ricardo Ziviani } 2589e04797f7SJose Ricardo Ziviani 2590a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2591a49a95e9SJose Ricardo Ziviani { 2592a49a95e9SJose Ricardo Ziviani int cr; 2593a49a95e9SJose Ricardo Ziviani int i; 2594a49a95e9SJose Ricardo Ziviani int invalid = 0; 2595a49a95e9SJose Ricardo Ziviani bool ox_flag = false; 2596a49a95e9SJose Ricardo Ziviani ppc_avr_t ret = *b; 2597a49a95e9SJose Ricardo Ziviani 2598a49a95e9SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 2599a49a95e9SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 2600a49a95e9SJose Ricardo Ziviani 2601a49a95e9SJose Ricardo Ziviani if (unlikely(invalid)) { 2602a49a95e9SJose Ricardo Ziviani return CRF_SO; 2603a49a95e9SJose Ricardo Ziviani } 2604a49a95e9SJose Ricardo Ziviani } 2605a49a95e9SJose Ricardo Ziviani 2606428115c3SMark Cave-Ayland i = a->VsrSB(7); 2607a49a95e9SJose Ricardo Ziviani if (i >= 32) { 2608a49a95e9SJose Ricardo Ziviani ox_flag = true; 26093c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2610a49a95e9SJose Ricardo Ziviani } else if (i <= -32) { 26113c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 2612a49a95e9SJose Ricardo Ziviani } else if (i > 0) { 26133c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2614a49a95e9SJose Ricardo Ziviani } else { 26153c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2616a49a95e9SJose Ricardo Ziviani } 2617a49a95e9SJose Ricardo Ziviani *r = ret; 2618a49a95e9SJose Ricardo Ziviani 2619a49a95e9SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 2620a49a95e9SJose Ricardo Ziviani if (ox_flag) { 2621a49a95e9SJose Ricardo Ziviani cr |= CRF_SO; 2622a49a95e9SJose Ricardo Ziviani } 2623a49a95e9SJose Ricardo Ziviani 2624a49a95e9SJose Ricardo Ziviani return cr; 2625a49a95e9SJose Ricardo Ziviani } 2626a49a95e9SJose Ricardo Ziviani 2627a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2628a54238adSJose Ricardo Ziviani { 2629a54238adSJose Ricardo Ziviani int cr; 2630a54238adSJose Ricardo Ziviani int unused = 0; 2631a54238adSJose Ricardo Ziviani int invalid = 0; 2632a54238adSJose Ricardo Ziviani bool ox_flag = false; 2633a54238adSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2634a54238adSJose Ricardo Ziviani ppc_avr_t ret = *b; 26353c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 2636a54238adSJose Ricardo Ziviani 2637428115c3SMark Cave-Ayland int i = a->VsrSB(7); 2638428115c3SMark Cave-Ayland ppc_avr_t bcd_one; 2639428115c3SMark Cave-Ayland 2640428115c3SMark Cave-Ayland bcd_one.VsrD(0) = 0; 2641428115c3SMark Cave-Ayland bcd_one.VsrD(1) = 0x10; 2642a54238adSJose Ricardo Ziviani 2643a54238adSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 2644a54238adSJose Ricardo Ziviani return CRF_SO; 2645a54238adSJose Ricardo Ziviani } 2646a54238adSJose Ricardo Ziviani 2647a54238adSJose Ricardo Ziviani if (unlikely(i > 31)) { 2648a54238adSJose Ricardo Ziviani i = 31; 2649a54238adSJose Ricardo Ziviani } else if (unlikely(i < -31)) { 2650a54238adSJose Ricardo Ziviani i = -31; 2651a54238adSJose Ricardo Ziviani } 2652a54238adSJose Ricardo Ziviani 2653a54238adSJose Ricardo Ziviani if (i > 0) { 26543c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 2655a54238adSJose Ricardo Ziviani } else { 26563c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 2657a54238adSJose Ricardo Ziviani 2658a54238adSJose Ricardo Ziviani if (bcd_get_digit(&ret, 0, &invalid) >= 5) { 2659a54238adSJose Ricardo Ziviani bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused); 2660a54238adSJose Ricardo Ziviani } 2661a54238adSJose Ricardo Ziviani } 2662a54238adSJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 2663a54238adSJose Ricardo Ziviani 2664a54238adSJose Ricardo Ziviani cr = bcd_cmp_zero(&ret); 2665a54238adSJose Ricardo Ziviani if (ox_flag) { 2666a54238adSJose Ricardo Ziviani cr |= CRF_SO; 2667a54238adSJose Ricardo Ziviani } 2668a54238adSJose Ricardo Ziviani *r = ret; 2669a54238adSJose Ricardo Ziviani 2670a54238adSJose Ricardo Ziviani return cr; 2671a54238adSJose Ricardo Ziviani } 2672a54238adSJose Ricardo Ziviani 267331bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 267431bc4d11SJose Ricardo Ziviani { 267531bc4d11SJose Ricardo Ziviani uint64_t mask; 267631bc4d11SJose Ricardo Ziviani uint32_t ox_flag = 0; 2677428115c3SMark Cave-Ayland int i = a->VsrSH(3) + 1; 267831bc4d11SJose Ricardo Ziviani ppc_avr_t ret = *b; 267931bc4d11SJose Ricardo Ziviani 268031bc4d11SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 268131bc4d11SJose Ricardo Ziviani return CRF_SO; 268231bc4d11SJose Ricardo Ziviani } 268331bc4d11SJose Ricardo Ziviani 268431bc4d11SJose Ricardo Ziviani if (i > 16 && i < 32) { 268531bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 26863c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 268731bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 268831bc4d11SJose Ricardo Ziviani } 268931bc4d11SJose Ricardo Ziviani 26903c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 269131bc4d11SJose Ricardo Ziviani } else if (i >= 0 && i <= 16) { 269231bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 26933c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 269431bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 269531bc4d11SJose Ricardo Ziviani } 269631bc4d11SJose Ricardo Ziviani 26973c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 26983c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 269931bc4d11SJose Ricardo Ziviani } 270031bc4d11SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0); 270131bc4d11SJose Ricardo Ziviani *r = ret; 270231bc4d11SJose Ricardo Ziviani 270331bc4d11SJose Ricardo Ziviani return bcd_cmp_zero(&ret) | ox_flag; 270431bc4d11SJose Ricardo Ziviani } 270531bc4d11SJose Ricardo Ziviani 27065c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 27075c32e2e4SJose Ricardo Ziviani { 27085c32e2e4SJose Ricardo Ziviani int i; 27095c32e2e4SJose Ricardo Ziviani uint64_t mask; 27105c32e2e4SJose Ricardo Ziviani uint32_t ox_flag = 0; 27115c32e2e4SJose Ricardo Ziviani int invalid = 0; 27125c32e2e4SJose Ricardo Ziviani ppc_avr_t ret = *b; 27135c32e2e4SJose Ricardo Ziviani 27145c32e2e4SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 27155c32e2e4SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 27165c32e2e4SJose Ricardo Ziviani 27175c32e2e4SJose Ricardo Ziviani if (unlikely(invalid)) { 27185c32e2e4SJose Ricardo Ziviani return CRF_SO; 27195c32e2e4SJose Ricardo Ziviani } 27205c32e2e4SJose Ricardo Ziviani } 27215c32e2e4SJose Ricardo Ziviani 2722428115c3SMark Cave-Ayland i = a->VsrSH(3); 27235c32e2e4SJose Ricardo Ziviani if (i > 16 && i < 33) { 27245c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 27253c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 27265c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 27275c32e2e4SJose Ricardo Ziviani } 27285c32e2e4SJose Ricardo Ziviani 27293c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 27305c32e2e4SJose Ricardo Ziviani } else if (i > 0 && i <= 16) { 27315c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 27323c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 27335c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 27345c32e2e4SJose Ricardo Ziviani } 27355c32e2e4SJose Ricardo Ziviani 27363c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 27373c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 27385c32e2e4SJose Ricardo Ziviani } else if (i == 0) { 27393c385a93SMark Cave-Ayland if (ret.VsrD(0) || ret.VsrD(1)) { 27405c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 27415c32e2e4SJose Ricardo Ziviani } 27423c385a93SMark Cave-Ayland ret.VsrD(0) = ret.VsrD(1) = 0; 27435c32e2e4SJose Ricardo Ziviani } 27445c32e2e4SJose Ricardo Ziviani 27455c32e2e4SJose Ricardo Ziviani *r = ret; 27463c385a93SMark Cave-Ayland if (r->VsrD(0) == 0 && r->VsrD(1) == 0) { 27475c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_EQ; 27485c32e2e4SJose Ricardo Ziviani } 27495c32e2e4SJose Ricardo Ziviani 27505c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_GT; 27515c32e2e4SJose Ricardo Ziviani } 27525c32e2e4SJose Ricardo Ziviani 2753fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a) 2754fcf5ef2aSThomas Huth { 2755fcf5ef2aSThomas Huth int i; 2756fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 2757fcf5ef2aSThomas Huth r->u8[i] = AES_sbox[a->u8[i]]; 2758fcf5ef2aSThomas Huth } 2759fcf5ef2aSThomas Huth } 2760fcf5ef2aSThomas Huth 2761fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2762fcf5ef2aSThomas Huth { 2763fcf5ef2aSThomas Huth ppc_avr_t result; 2764fcf5ef2aSThomas Huth int i; 2765fcf5ef2aSThomas Huth 2766fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 27672dea57dbSMark Cave-Ayland result.VsrW(i) = b->VsrW(i) ^ 27682dea57dbSMark Cave-Ayland (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^ 27692dea57dbSMark Cave-Ayland AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^ 27702dea57dbSMark Cave-Ayland AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^ 27712dea57dbSMark Cave-Ayland AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]); 2772fcf5ef2aSThomas Huth } 2773fcf5ef2aSThomas Huth *r = result; 2774fcf5ef2aSThomas Huth } 2775fcf5ef2aSThomas Huth 2776fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2777fcf5ef2aSThomas Huth { 2778fcf5ef2aSThomas Huth ppc_avr_t result; 2779fcf5ef2aSThomas Huth int i; 2780fcf5ef2aSThomas Huth 2781fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 27822dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]); 2783fcf5ef2aSThomas Huth } 2784fcf5ef2aSThomas Huth *r = result; 2785fcf5ef2aSThomas Huth } 2786fcf5ef2aSThomas Huth 2787fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2788fcf5ef2aSThomas Huth { 2789fcf5ef2aSThomas Huth /* This differs from what is written in ISA V2.07. The RTL is */ 2790fcf5ef2aSThomas Huth /* incorrect and will be fixed in V2.07B. */ 2791fcf5ef2aSThomas Huth int i; 2792fcf5ef2aSThomas Huth ppc_avr_t tmp; 2793fcf5ef2aSThomas Huth 2794fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 27952dea57dbSMark Cave-Ayland tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])]; 2796fcf5ef2aSThomas Huth } 2797fcf5ef2aSThomas Huth 2798fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 27992dea57dbSMark Cave-Ayland r->VsrW(i) = 28002dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 0)][0] ^ 28012dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 1)][1] ^ 28022dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 2)][2] ^ 28032dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 3)][3]; 2804fcf5ef2aSThomas Huth } 2805fcf5ef2aSThomas Huth } 2806fcf5ef2aSThomas Huth 2807fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2808fcf5ef2aSThomas Huth { 2809fcf5ef2aSThomas Huth ppc_avr_t result; 2810fcf5ef2aSThomas Huth int i; 2811fcf5ef2aSThomas Huth 2812fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 28132dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]); 2814fcf5ef2aSThomas Huth } 2815fcf5ef2aSThomas Huth *r = result; 2816fcf5ef2aSThomas Huth } 2817fcf5ef2aSThomas Huth 2818fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 2819fcf5ef2aSThomas Huth { 2820fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 2821fcf5ef2aSThomas Huth int six = st_six & 0xF; 2822fcf5ef2aSThomas Huth int i; 2823fcf5ef2aSThomas Huth 2824730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 2825fcf5ef2aSThomas Huth if (st == 0) { 2826fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 28270ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 7) ^ 28280ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 18) ^ 2829730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 3); 2830fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 28310ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 17) ^ 28320ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 19) ^ 2833730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 10); 2834fcf5ef2aSThomas Huth } 2835fcf5ef2aSThomas Huth } else { /* st == 1 */ 2836fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 28370ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 2) ^ 28380ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 13) ^ 28390ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 22); 2840fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 28410ef83bf2SMark Cave-Ayland r->VsrW(i) = ror32(a->VsrW(i), 6) ^ 28420ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 11) ^ 28430ef83bf2SMark Cave-Ayland ror32(a->VsrW(i), 25); 2844fcf5ef2aSThomas Huth } 2845fcf5ef2aSThomas Huth } 2846fcf5ef2aSThomas Huth } 2847fcf5ef2aSThomas Huth } 2848fcf5ef2aSThomas Huth 2849fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 2850fcf5ef2aSThomas Huth { 2851fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 2852fcf5ef2aSThomas Huth int six = st_six & 0xF; 2853fcf5ef2aSThomas Huth int i; 2854fcf5ef2aSThomas Huth 2855730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 2856fcf5ef2aSThomas Huth if (st == 0) { 2857fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 28580ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 1) ^ 28590ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 8) ^ 2860730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 7); 2861fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 28620ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 19) ^ 28630ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 61) ^ 2864730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 6); 2865fcf5ef2aSThomas Huth } 2866fcf5ef2aSThomas Huth } else { /* st == 1 */ 2867fcf5ef2aSThomas Huth if ((six & (0x8 >> (2 * i))) == 0) { 28680ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 28) ^ 28690ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 34) ^ 28700ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 39); 2871fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 28720ef83bf2SMark Cave-Ayland r->VsrD(i) = ror64(a->VsrD(i), 14) ^ 28730ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 18) ^ 28740ef83bf2SMark Cave-Ayland ror64(a->VsrD(i), 41); 2875fcf5ef2aSThomas Huth } 2876fcf5ef2aSThomas Huth } 2877fcf5ef2aSThomas Huth } 2878fcf5ef2aSThomas Huth } 2879fcf5ef2aSThomas Huth 2880fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2881fcf5ef2aSThomas Huth { 2882fcf5ef2aSThomas Huth ppc_avr_t result; 2883fcf5ef2aSThomas Huth int i; 2884fcf5ef2aSThomas Huth 288560594feaSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 288660594feaSMark Cave-Ayland int indexA = c->VsrB(i) >> 4; 288760594feaSMark Cave-Ayland int indexB = c->VsrB(i) & 0xF; 288860594feaSMark Cave-Ayland 288960594feaSMark Cave-Ayland result.VsrB(i) = a->VsrB(indexA) ^ b->VsrB(indexB); 2890fcf5ef2aSThomas Huth } 2891fcf5ef2aSThomas Huth *r = result; 2892fcf5ef2aSThomas Huth } 2893fcf5ef2aSThomas Huth 2894fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I 2895fcf5ef2aSThomas Huth 2896fcf5ef2aSThomas Huth /*****************************************************************************/ 2897fcf5ef2aSThomas Huth /* SPE extension helpers */ 2898fcf5ef2aSThomas Huth /* Use a table to make this quicker */ 2899fcf5ef2aSThomas Huth static const uint8_t hbrev[16] = { 2900fcf5ef2aSThomas Huth 0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE, 2901fcf5ef2aSThomas Huth 0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF, 2902fcf5ef2aSThomas Huth }; 2903fcf5ef2aSThomas Huth 2904fcf5ef2aSThomas Huth static inline uint8_t byte_reverse(uint8_t val) 2905fcf5ef2aSThomas Huth { 2906fcf5ef2aSThomas Huth return hbrev[val >> 4] | (hbrev[val & 0xF] << 4); 2907fcf5ef2aSThomas Huth } 2908fcf5ef2aSThomas Huth 2909fcf5ef2aSThomas Huth static inline uint32_t word_reverse(uint32_t val) 2910fcf5ef2aSThomas Huth { 2911fcf5ef2aSThomas Huth return byte_reverse(val >> 24) | (byte_reverse(val >> 16) << 8) | 2912fcf5ef2aSThomas Huth (byte_reverse(val >> 8) << 16) | (byte_reverse(val) << 24); 2913fcf5ef2aSThomas Huth } 2914fcf5ef2aSThomas Huth 2915fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */ 2916fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2) 2917fcf5ef2aSThomas Huth { 2918fcf5ef2aSThomas Huth uint32_t a, b, d, mask; 2919fcf5ef2aSThomas Huth 2920fcf5ef2aSThomas Huth mask = UINT32_MAX >> (32 - MASKBITS); 2921fcf5ef2aSThomas Huth a = arg1 & mask; 2922fcf5ef2aSThomas Huth b = arg2 & mask; 2923fcf5ef2aSThomas Huth d = word_reverse(1 + word_reverse(a | ~b)); 2924fcf5ef2aSThomas Huth return (arg1 & ~mask) | (d & b); 2925fcf5ef2aSThomas Huth } 2926fcf5ef2aSThomas Huth 2927fcf5ef2aSThomas Huth uint32_t helper_cntlsw32(uint32_t val) 2928fcf5ef2aSThomas Huth { 2929fcf5ef2aSThomas Huth if (val & 0x80000000) { 2930fcf5ef2aSThomas Huth return clz32(~val); 2931fcf5ef2aSThomas Huth } else { 2932fcf5ef2aSThomas Huth return clz32(val); 2933fcf5ef2aSThomas Huth } 2934fcf5ef2aSThomas Huth } 2935fcf5ef2aSThomas Huth 2936fcf5ef2aSThomas Huth uint32_t helper_cntlzw32(uint32_t val) 2937fcf5ef2aSThomas Huth { 2938fcf5ef2aSThomas Huth return clz32(val); 2939fcf5ef2aSThomas Huth } 2940fcf5ef2aSThomas Huth 2941fcf5ef2aSThomas Huth /* 440 specific */ 2942fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high, 2943fcf5ef2aSThomas Huth target_ulong low, uint32_t update_Rc) 2944fcf5ef2aSThomas Huth { 2945fcf5ef2aSThomas Huth target_ulong mask; 2946fcf5ef2aSThomas Huth int i; 2947fcf5ef2aSThomas Huth 2948fcf5ef2aSThomas Huth i = 1; 2949fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 2950fcf5ef2aSThomas Huth if ((high & mask) == 0) { 2951fcf5ef2aSThomas Huth if (update_Rc) { 2952fcf5ef2aSThomas Huth env->crf[0] = 0x4; 2953fcf5ef2aSThomas Huth } 2954fcf5ef2aSThomas Huth goto done; 2955fcf5ef2aSThomas Huth } 2956fcf5ef2aSThomas Huth i++; 2957fcf5ef2aSThomas Huth } 2958fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 2959fcf5ef2aSThomas Huth if ((low & mask) == 0) { 2960fcf5ef2aSThomas Huth if (update_Rc) { 2961fcf5ef2aSThomas Huth env->crf[0] = 0x8; 2962fcf5ef2aSThomas Huth } 2963fcf5ef2aSThomas Huth goto done; 2964fcf5ef2aSThomas Huth } 2965fcf5ef2aSThomas Huth i++; 2966fcf5ef2aSThomas Huth } 2967fcf5ef2aSThomas Huth i = 8; 2968fcf5ef2aSThomas Huth if (update_Rc) { 2969fcf5ef2aSThomas Huth env->crf[0] = 0x2; 2970fcf5ef2aSThomas Huth } 2971fcf5ef2aSThomas Huth done: 2972fcf5ef2aSThomas Huth env->xer = (env->xer & ~0x7F) | i; 2973fcf5ef2aSThomas Huth if (update_Rc) { 2974fcf5ef2aSThomas Huth env->crf[0] |= xer_so; 2975fcf5ef2aSThomas Huth } 2976fcf5ef2aSThomas Huth return i; 2977fcf5ef2aSThomas Huth } 2978