1fcf5ef2aSThomas Huth /* 2fcf5ef2aSThomas Huth * PowerPC integer and vector emulation helpers for QEMU. 3fcf5ef2aSThomas Huth * 4fcf5ef2aSThomas Huth * Copyright (c) 2003-2007 Jocelyn Mayer 5fcf5ef2aSThomas Huth * 6fcf5ef2aSThomas Huth * This library is free software; you can redistribute it and/or 7fcf5ef2aSThomas Huth * modify it under the terms of the GNU Lesser General Public 8fcf5ef2aSThomas Huth * License as published by the Free Software Foundation; either 9fcf5ef2aSThomas Huth * version 2 of the License, or (at your option) any later version. 10fcf5ef2aSThomas Huth * 11fcf5ef2aSThomas Huth * This library is distributed in the hope that it will be useful, 12fcf5ef2aSThomas Huth * but WITHOUT ANY WARRANTY; without even the implied warranty of 13fcf5ef2aSThomas Huth * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14fcf5ef2aSThomas Huth * Lesser General Public License for more details. 15fcf5ef2aSThomas Huth * 16fcf5ef2aSThomas Huth * You should have received a copy of the GNU Lesser General Public 17fcf5ef2aSThomas Huth * License along with this library; if not, see <http://www.gnu.org/licenses/>. 
18fcf5ef2aSThomas Huth */ 19fcf5ef2aSThomas Huth #include "qemu/osdep.h" 20fcf5ef2aSThomas Huth #include "cpu.h" 21fcf5ef2aSThomas Huth #include "internal.h" 22fcf5ef2aSThomas Huth #include "qemu/host-utils.h" 23fcf5ef2aSThomas Huth #include "exec/helper-proto.h" 24fcf5ef2aSThomas Huth #include "crypto/aes.h" 2524f91e81SAlex Bennée #include "fpu/softfloat.h" 26fcf5ef2aSThomas Huth 27fcf5ef2aSThomas Huth #include "helper_regs.h" 28fcf5ef2aSThomas Huth /*****************************************************************************/ 29fcf5ef2aSThomas Huth /* Fixed point operations helpers */ 30fcf5ef2aSThomas Huth 31f32899deSNikunj A Dadhania static inline void helper_update_ov_legacy(CPUPPCState *env, int ov) 32f32899deSNikunj A Dadhania { 33f32899deSNikunj A Dadhania if (unlikely(ov)) { 34f32899deSNikunj A Dadhania env->so = env->ov = 1; 35f32899deSNikunj A Dadhania } else { 36f32899deSNikunj A Dadhania env->ov = 0; 37f32899deSNikunj A Dadhania } 38f32899deSNikunj A Dadhania } 39f32899deSNikunj A Dadhania 40fcf5ef2aSThomas Huth target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb, 41fcf5ef2aSThomas Huth uint32_t oe) 42fcf5ef2aSThomas Huth { 43fcf5ef2aSThomas Huth uint64_t rt = 0; 44fcf5ef2aSThomas Huth int overflow = 0; 45fcf5ef2aSThomas Huth 46fcf5ef2aSThomas Huth uint64_t dividend = (uint64_t)ra << 32; 47fcf5ef2aSThomas Huth uint64_t divisor = (uint32_t)rb; 48fcf5ef2aSThomas Huth 49fcf5ef2aSThomas Huth if (unlikely(divisor == 0)) { 50fcf5ef2aSThomas Huth overflow = 1; 51fcf5ef2aSThomas Huth } else { 52fcf5ef2aSThomas Huth rt = dividend / divisor; 53fcf5ef2aSThomas Huth overflow = rt > UINT32_MAX; 54fcf5ef2aSThomas Huth } 55fcf5ef2aSThomas Huth 56fcf5ef2aSThomas Huth if (unlikely(overflow)) { 57fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 58fcf5ef2aSThomas Huth } 59fcf5ef2aSThomas Huth 60fcf5ef2aSThomas Huth if (oe) { 61f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 62fcf5ef2aSThomas Huth } 63fcf5ef2aSThomas Huth 
64fcf5ef2aSThomas Huth return (target_ulong)rt; 65fcf5ef2aSThomas Huth } 66fcf5ef2aSThomas Huth 67fcf5ef2aSThomas Huth target_ulong helper_divwe(CPUPPCState *env, target_ulong ra, target_ulong rb, 68fcf5ef2aSThomas Huth uint32_t oe) 69fcf5ef2aSThomas Huth { 70fcf5ef2aSThomas Huth int64_t rt = 0; 71fcf5ef2aSThomas Huth int overflow = 0; 72fcf5ef2aSThomas Huth 73fcf5ef2aSThomas Huth int64_t dividend = (int64_t)ra << 32; 74fcf5ef2aSThomas Huth int64_t divisor = (int64_t)((int32_t)rb); 75fcf5ef2aSThomas Huth 76fcf5ef2aSThomas Huth if (unlikely((divisor == 0) || 77fcf5ef2aSThomas Huth ((divisor == -1ull) && (dividend == INT64_MIN)))) { 78fcf5ef2aSThomas Huth overflow = 1; 79fcf5ef2aSThomas Huth } else { 80fcf5ef2aSThomas Huth rt = dividend / divisor; 81fcf5ef2aSThomas Huth overflow = rt != (int32_t)rt; 82fcf5ef2aSThomas Huth } 83fcf5ef2aSThomas Huth 84fcf5ef2aSThomas Huth if (unlikely(overflow)) { 85fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 86fcf5ef2aSThomas Huth } 87fcf5ef2aSThomas Huth 88fcf5ef2aSThomas Huth if (oe) { 89f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 90fcf5ef2aSThomas Huth } 91fcf5ef2aSThomas Huth 92fcf5ef2aSThomas Huth return (target_ulong)rt; 93fcf5ef2aSThomas Huth } 94fcf5ef2aSThomas Huth 95fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 96fcf5ef2aSThomas Huth 97fcf5ef2aSThomas Huth uint64_t helper_divdeu(CPUPPCState *env, uint64_t ra, uint64_t rb, uint32_t oe) 98fcf5ef2aSThomas Huth { 99fcf5ef2aSThomas Huth uint64_t rt = 0; 100fcf5ef2aSThomas Huth int overflow = 0; 101fcf5ef2aSThomas Huth 102fcf5ef2aSThomas Huth overflow = divu128(&rt, &ra, rb); 103fcf5ef2aSThomas Huth 104fcf5ef2aSThomas Huth if (unlikely(overflow)) { 105fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 106fcf5ef2aSThomas Huth } 107fcf5ef2aSThomas Huth 108fcf5ef2aSThomas Huth if (oe) { 109f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 110fcf5ef2aSThomas Huth } 111fcf5ef2aSThomas Huth 112fcf5ef2aSThomas Huth return rt; 113fcf5ef2aSThomas Huth } 
114fcf5ef2aSThomas Huth 115fcf5ef2aSThomas Huth uint64_t helper_divde(CPUPPCState *env, uint64_t rau, uint64_t rbu, uint32_t oe) 116fcf5ef2aSThomas Huth { 117fcf5ef2aSThomas Huth int64_t rt = 0; 118fcf5ef2aSThomas Huth int64_t ra = (int64_t)rau; 119fcf5ef2aSThomas Huth int64_t rb = (int64_t)rbu; 120fcf5ef2aSThomas Huth int overflow = divs128(&rt, &ra, rb); 121fcf5ef2aSThomas Huth 122fcf5ef2aSThomas Huth if (unlikely(overflow)) { 123fcf5ef2aSThomas Huth rt = 0; /* Undefined */ 124fcf5ef2aSThomas Huth } 125fcf5ef2aSThomas Huth 126fcf5ef2aSThomas Huth if (oe) { 127f32899deSNikunj A Dadhania helper_update_ov_legacy(env, overflow); 128fcf5ef2aSThomas Huth } 129fcf5ef2aSThomas Huth 130fcf5ef2aSThomas Huth return rt; 131fcf5ef2aSThomas Huth } 132fcf5ef2aSThomas Huth 133fcf5ef2aSThomas Huth #endif 134fcf5ef2aSThomas Huth 135fcf5ef2aSThomas Huth 136fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 137fcf5ef2aSThomas Huth /* if x = 0xab, returns 0xababababababababa */ 138fcf5ef2aSThomas Huth #define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff)) 139fcf5ef2aSThomas Huth 140fcf5ef2aSThomas Huth /* substract 1 from each byte, and with inverse, check if MSB is set at each 141fcf5ef2aSThomas Huth * byte. 142fcf5ef2aSThomas Huth * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80 143fcf5ef2aSThomas Huth * (0xFF & 0xFF) & 0x80 = 0x80 (zero found) 144fcf5ef2aSThomas Huth */ 145fcf5ef2aSThomas Huth #define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80)) 146fcf5ef2aSThomas Huth 147fcf5ef2aSThomas Huth /* When you XOR the pattern and there is a match, that byte will be zero */ 148fcf5ef2aSThomas Huth #define hasvalue(x, n) (haszero((x) ^ pattern(n))) 149fcf5ef2aSThomas Huth 150fcf5ef2aSThomas Huth uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb) 151fcf5ef2aSThomas Huth { 152efa73196SNikunj A Dadhania return hasvalue(rb, ra) ? 
CRF_GT : 0; 153fcf5ef2aSThomas Huth } 154fcf5ef2aSThomas Huth 155fcf5ef2aSThomas Huth #undef pattern 156fcf5ef2aSThomas Huth #undef haszero 157fcf5ef2aSThomas Huth #undef hasvalue 158fcf5ef2aSThomas Huth 159fcf5ef2aSThomas Huth /* Return invalid random number. 160fcf5ef2aSThomas Huth * 161fcf5ef2aSThomas Huth * FIXME: Add rng backend or other mechanism to get cryptographically suitable 162fcf5ef2aSThomas Huth * random number 163fcf5ef2aSThomas Huth */ 164fcf5ef2aSThomas Huth target_ulong helper_darn32(void) 165fcf5ef2aSThomas Huth { 166fcf5ef2aSThomas Huth return -1; 167fcf5ef2aSThomas Huth } 168fcf5ef2aSThomas Huth 169fcf5ef2aSThomas Huth target_ulong helper_darn64(void) 170fcf5ef2aSThomas Huth { 171fcf5ef2aSThomas Huth return -1; 172fcf5ef2aSThomas Huth } 173fcf5ef2aSThomas Huth 174fcf5ef2aSThomas Huth #endif 175fcf5ef2aSThomas Huth 176fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 177fcf5ef2aSThomas Huth 178fcf5ef2aSThomas Huth uint64_t helper_bpermd(uint64_t rs, uint64_t rb) 179fcf5ef2aSThomas Huth { 180fcf5ef2aSThomas Huth int i; 181fcf5ef2aSThomas Huth uint64_t ra = 0; 182fcf5ef2aSThomas Huth 183fcf5ef2aSThomas Huth for (i = 0; i < 8; i++) { 184fcf5ef2aSThomas Huth int index = (rs >> (i*8)) & 0xFF; 185fcf5ef2aSThomas Huth if (index < 64) { 186a6a444a8SCédric Le Goater if (rb & PPC_BIT(index)) { 187fcf5ef2aSThomas Huth ra |= 1 << i; 188fcf5ef2aSThomas Huth } 189fcf5ef2aSThomas Huth } 190fcf5ef2aSThomas Huth } 191fcf5ef2aSThomas Huth return ra; 192fcf5ef2aSThomas Huth } 193fcf5ef2aSThomas Huth 194fcf5ef2aSThomas Huth #endif 195fcf5ef2aSThomas Huth 196fcf5ef2aSThomas Huth target_ulong helper_cmpb(target_ulong rs, target_ulong rb) 197fcf5ef2aSThomas Huth { 198fcf5ef2aSThomas Huth target_ulong mask = 0xff; 199fcf5ef2aSThomas Huth target_ulong ra = 0; 200fcf5ef2aSThomas Huth int i; 201fcf5ef2aSThomas Huth 202fcf5ef2aSThomas Huth for (i = 0; i < sizeof(target_ulong); i++) { 203fcf5ef2aSThomas Huth if ((rs & mask) == (rb & mask)) { 204fcf5ef2aSThomas Huth ra |= mask; 
205fcf5ef2aSThomas Huth } 206fcf5ef2aSThomas Huth mask <<= 8; 207fcf5ef2aSThomas Huth } 208fcf5ef2aSThomas Huth return ra; 209fcf5ef2aSThomas Huth } 210fcf5ef2aSThomas Huth 211fcf5ef2aSThomas Huth /* shift right arithmetic helper */ 212fcf5ef2aSThomas Huth target_ulong helper_sraw(CPUPPCState *env, target_ulong value, 213fcf5ef2aSThomas Huth target_ulong shift) 214fcf5ef2aSThomas Huth { 215fcf5ef2aSThomas Huth int32_t ret; 216fcf5ef2aSThomas Huth 217fcf5ef2aSThomas Huth if (likely(!(shift & 0x20))) { 218fcf5ef2aSThomas Huth if (likely((uint32_t)shift != 0)) { 219fcf5ef2aSThomas Huth shift &= 0x1f; 220fcf5ef2aSThomas Huth ret = (int32_t)value >> shift; 221fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) { 222af1c259fSSandipan Das env->ca32 = env->ca = 0; 223fcf5ef2aSThomas Huth } else { 224af1c259fSSandipan Das env->ca32 = env->ca = 1; 225fcf5ef2aSThomas Huth } 226fcf5ef2aSThomas Huth } else { 227fcf5ef2aSThomas Huth ret = (int32_t)value; 228af1c259fSSandipan Das env->ca32 = env->ca = 0; 229fcf5ef2aSThomas Huth } 230fcf5ef2aSThomas Huth } else { 231fcf5ef2aSThomas Huth ret = (int32_t)value >> 31; 232af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 233fcf5ef2aSThomas Huth } 234fcf5ef2aSThomas Huth return (target_long)ret; 235fcf5ef2aSThomas Huth } 236fcf5ef2aSThomas Huth 237fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 238fcf5ef2aSThomas Huth target_ulong helper_srad(CPUPPCState *env, target_ulong value, 239fcf5ef2aSThomas Huth target_ulong shift) 240fcf5ef2aSThomas Huth { 241fcf5ef2aSThomas Huth int64_t ret; 242fcf5ef2aSThomas Huth 243fcf5ef2aSThomas Huth if (likely(!(shift & 0x40))) { 244fcf5ef2aSThomas Huth if (likely((uint64_t)shift != 0)) { 245fcf5ef2aSThomas Huth shift &= 0x3f; 246fcf5ef2aSThomas Huth ret = (int64_t)value >> shift; 247fcf5ef2aSThomas Huth if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) { 248af1c259fSSandipan Das env->ca32 = env->ca = 0; 249fcf5ef2aSThomas Huth } else { 250af1c259fSSandipan 
Das env->ca32 = env->ca = 1; 251fcf5ef2aSThomas Huth } 252fcf5ef2aSThomas Huth } else { 253fcf5ef2aSThomas Huth ret = (int64_t)value; 254af1c259fSSandipan Das env->ca32 = env->ca = 0; 255fcf5ef2aSThomas Huth } 256fcf5ef2aSThomas Huth } else { 257fcf5ef2aSThomas Huth ret = (int64_t)value >> 63; 258af1c259fSSandipan Das env->ca32 = env->ca = (ret != 0); 259fcf5ef2aSThomas Huth } 260fcf5ef2aSThomas Huth return ret; 261fcf5ef2aSThomas Huth } 262fcf5ef2aSThomas Huth #endif 263fcf5ef2aSThomas Huth 264fcf5ef2aSThomas Huth #if defined(TARGET_PPC64) 265fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 266fcf5ef2aSThomas Huth { 26779770002SRichard Henderson /* Note that we don't fold past bytes */ 268fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 269fcf5ef2aSThomas Huth 0x5555555555555555ULL); 270fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 271fcf5ef2aSThomas Huth 0x3333333333333333ULL); 272fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 273fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 274fcf5ef2aSThomas Huth return val; 275fcf5ef2aSThomas Huth } 276fcf5ef2aSThomas Huth 277fcf5ef2aSThomas Huth target_ulong helper_popcntw(target_ulong val) 278fcf5ef2aSThomas Huth { 27979770002SRichard Henderson /* Note that we don't fold past words. 
*/ 280fcf5ef2aSThomas Huth val = (val & 0x5555555555555555ULL) + ((val >> 1) & 281fcf5ef2aSThomas Huth 0x5555555555555555ULL); 282fcf5ef2aSThomas Huth val = (val & 0x3333333333333333ULL) + ((val >> 2) & 283fcf5ef2aSThomas Huth 0x3333333333333333ULL); 284fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f0f0f0f0fULL) + ((val >> 4) & 285fcf5ef2aSThomas Huth 0x0f0f0f0f0f0f0f0fULL); 286fcf5ef2aSThomas Huth val = (val & 0x00ff00ff00ff00ffULL) + ((val >> 8) & 287fcf5ef2aSThomas Huth 0x00ff00ff00ff00ffULL); 288fcf5ef2aSThomas Huth val = (val & 0x0000ffff0000ffffULL) + ((val >> 16) & 289fcf5ef2aSThomas Huth 0x0000ffff0000ffffULL); 290fcf5ef2aSThomas Huth return val; 291fcf5ef2aSThomas Huth } 292fcf5ef2aSThomas Huth #else 293fcf5ef2aSThomas Huth target_ulong helper_popcntb(target_ulong val) 294fcf5ef2aSThomas Huth { 29579770002SRichard Henderson /* Note that we don't fold past bytes */ 296fcf5ef2aSThomas Huth val = (val & 0x55555555) + ((val >> 1) & 0x55555555); 297fcf5ef2aSThomas Huth val = (val & 0x33333333) + ((val >> 2) & 0x33333333); 298fcf5ef2aSThomas Huth val = (val & 0x0f0f0f0f) + ((val >> 4) & 0x0f0f0f0f); 299fcf5ef2aSThomas Huth return val; 300fcf5ef2aSThomas Huth } 301fcf5ef2aSThomas Huth #endif 302fcf5ef2aSThomas Huth 303fcf5ef2aSThomas Huth /*****************************************************************************/ 304fcf5ef2aSThomas Huth /* PowerPC 601 specific instructions (POWER bridge) */ 305fcf5ef2aSThomas Huth target_ulong helper_div(CPUPPCState *env, target_ulong arg1, target_ulong arg2) 306fcf5ef2aSThomas Huth { 307fcf5ef2aSThomas Huth uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ]; 308fcf5ef2aSThomas Huth 309fcf5ef2aSThomas Huth if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 310fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 311fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 312fcf5ef2aSThomas Huth return INT32_MIN; 313fcf5ef2aSThomas Huth } else { 314fcf5ef2aSThomas Huth env->spr[SPR_MQ] = tmp % arg2; 315fcf5ef2aSThomas Huth return tmp 
/ (int32_t)arg2; 316fcf5ef2aSThomas Huth } 317fcf5ef2aSThomas Huth } 318fcf5ef2aSThomas Huth 319fcf5ef2aSThomas Huth target_ulong helper_divo(CPUPPCState *env, target_ulong arg1, 320fcf5ef2aSThomas Huth target_ulong arg2) 321fcf5ef2aSThomas Huth { 322fcf5ef2aSThomas Huth uint64_t tmp = (uint64_t)arg1 << 32 | env->spr[SPR_MQ]; 323fcf5ef2aSThomas Huth 324fcf5ef2aSThomas Huth if (((int32_t)tmp == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 325fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 326fcf5ef2aSThomas Huth env->so = env->ov = 1; 327fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 328fcf5ef2aSThomas Huth return INT32_MIN; 329fcf5ef2aSThomas Huth } else { 330fcf5ef2aSThomas Huth env->spr[SPR_MQ] = tmp % arg2; 331fcf5ef2aSThomas Huth tmp /= (int32_t)arg2; 332fcf5ef2aSThomas Huth if ((int32_t)tmp != tmp) { 333fcf5ef2aSThomas Huth env->so = env->ov = 1; 334fcf5ef2aSThomas Huth } else { 335fcf5ef2aSThomas Huth env->ov = 0; 336fcf5ef2aSThomas Huth } 337fcf5ef2aSThomas Huth return tmp; 338fcf5ef2aSThomas Huth } 339fcf5ef2aSThomas Huth } 340fcf5ef2aSThomas Huth 341fcf5ef2aSThomas Huth target_ulong helper_divs(CPUPPCState *env, target_ulong arg1, 342fcf5ef2aSThomas Huth target_ulong arg2) 343fcf5ef2aSThomas Huth { 344fcf5ef2aSThomas Huth if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 345fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 346fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 347fcf5ef2aSThomas Huth return INT32_MIN; 348fcf5ef2aSThomas Huth } else { 349fcf5ef2aSThomas Huth env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2; 350fcf5ef2aSThomas Huth return (int32_t)arg1 / (int32_t)arg2; 351fcf5ef2aSThomas Huth } 352fcf5ef2aSThomas Huth } 353fcf5ef2aSThomas Huth 354fcf5ef2aSThomas Huth target_ulong helper_divso(CPUPPCState *env, target_ulong arg1, 355fcf5ef2aSThomas Huth target_ulong arg2) 356fcf5ef2aSThomas Huth { 357fcf5ef2aSThomas Huth if (((int32_t)arg1 == INT32_MIN && (int32_t)arg2 == (int32_t)-1) || 358fcf5ef2aSThomas Huth (int32_t)arg2 == 0) { 
359fcf5ef2aSThomas Huth env->so = env->ov = 1; 360fcf5ef2aSThomas Huth env->spr[SPR_MQ] = 0; 361fcf5ef2aSThomas Huth return INT32_MIN; 362fcf5ef2aSThomas Huth } else { 363fcf5ef2aSThomas Huth env->ov = 0; 364fcf5ef2aSThomas Huth env->spr[SPR_MQ] = (int32_t)arg1 % (int32_t)arg2; 365fcf5ef2aSThomas Huth return (int32_t)arg1 / (int32_t)arg2; 366fcf5ef2aSThomas Huth } 367fcf5ef2aSThomas Huth } 368fcf5ef2aSThomas Huth 369fcf5ef2aSThomas Huth /*****************************************************************************/ 370fcf5ef2aSThomas Huth /* 602 specific instructions */ 371fcf5ef2aSThomas Huth /* mfrom is the most crazy instruction ever seen, imho ! */ 372fcf5ef2aSThomas Huth /* Real implementation uses a ROM table. Do the same */ 373fcf5ef2aSThomas Huth /* Extremely decomposed: 374fcf5ef2aSThomas Huth * -arg / 256 375fcf5ef2aSThomas Huth * return 256 * log10(10 + 1.0) + 0.5 376fcf5ef2aSThomas Huth */ 377fcf5ef2aSThomas Huth #if !defined(CONFIG_USER_ONLY) 378fcf5ef2aSThomas Huth target_ulong helper_602_mfrom(target_ulong arg) 379fcf5ef2aSThomas Huth { 380fcf5ef2aSThomas Huth if (likely(arg < 602)) { 3815b27a92dSPaolo Bonzini #include "mfrom_table.inc.c" 382fcf5ef2aSThomas Huth return mfrom_ROM_table[arg]; 383fcf5ef2aSThomas Huth } else { 384fcf5ef2aSThomas Huth return 0; 385fcf5ef2aSThomas Huth } 386fcf5ef2aSThomas Huth } 387fcf5ef2aSThomas Huth #endif 388fcf5ef2aSThomas Huth 389fcf5ef2aSThomas Huth /*****************************************************************************/ 390fcf5ef2aSThomas Huth /* Altivec extension helpers */ 391fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 392fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 393fcf5ef2aSThomas Huth for (index = 0; index < ARRAY_SIZE(r->element); index++) 394fcf5ef2aSThomas Huth #else 395fcf5ef2aSThomas Huth #define VECTOR_FOR_INORDER_I(index, element) \ 396fcf5ef2aSThomas Huth for (index = ARRAY_SIZE(r->element)-1; index >= 0; index--) 397fcf5ef2aSThomas Huth #endif 
398fcf5ef2aSThomas Huth 399fcf5ef2aSThomas Huth /* Saturating arithmetic helpers. */ 400fcf5ef2aSThomas Huth #define SATCVT(from, to, from_type, to_type, min, max) \ 401fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 402fcf5ef2aSThomas Huth { \ 403fcf5ef2aSThomas Huth to_type r; \ 404fcf5ef2aSThomas Huth \ 405fcf5ef2aSThomas Huth if (x < (from_type)min) { \ 406fcf5ef2aSThomas Huth r = min; \ 407fcf5ef2aSThomas Huth *sat = 1; \ 408fcf5ef2aSThomas Huth } else if (x > (from_type)max) { \ 409fcf5ef2aSThomas Huth r = max; \ 410fcf5ef2aSThomas Huth *sat = 1; \ 411fcf5ef2aSThomas Huth } else { \ 412fcf5ef2aSThomas Huth r = x; \ 413fcf5ef2aSThomas Huth } \ 414fcf5ef2aSThomas Huth return r; \ 415fcf5ef2aSThomas Huth } 416fcf5ef2aSThomas Huth #define SATCVTU(from, to, from_type, to_type, min, max) \ 417fcf5ef2aSThomas Huth static inline to_type cvt##from##to(from_type x, int *sat) \ 418fcf5ef2aSThomas Huth { \ 419fcf5ef2aSThomas Huth to_type r; \ 420fcf5ef2aSThomas Huth \ 421fcf5ef2aSThomas Huth if (x > (from_type)max) { \ 422fcf5ef2aSThomas Huth r = max; \ 423fcf5ef2aSThomas Huth *sat = 1; \ 424fcf5ef2aSThomas Huth } else { \ 425fcf5ef2aSThomas Huth r = x; \ 426fcf5ef2aSThomas Huth } \ 427fcf5ef2aSThomas Huth return r; \ 428fcf5ef2aSThomas Huth } 429fcf5ef2aSThomas Huth SATCVT(sh, sb, int16_t, int8_t, INT8_MIN, INT8_MAX) 430fcf5ef2aSThomas Huth SATCVT(sw, sh, int32_t, int16_t, INT16_MIN, INT16_MAX) 431fcf5ef2aSThomas Huth SATCVT(sd, sw, int64_t, int32_t, INT32_MIN, INT32_MAX) 432fcf5ef2aSThomas Huth 433fcf5ef2aSThomas Huth SATCVTU(uh, ub, uint16_t, uint8_t, 0, UINT8_MAX) 434fcf5ef2aSThomas Huth SATCVTU(uw, uh, uint32_t, uint16_t, 0, UINT16_MAX) 435fcf5ef2aSThomas Huth SATCVTU(ud, uw, uint64_t, uint32_t, 0, UINT32_MAX) 436fcf5ef2aSThomas Huth SATCVT(sh, ub, int16_t, uint8_t, 0, UINT8_MAX) 437fcf5ef2aSThomas Huth SATCVT(sw, uh, int32_t, uint16_t, 0, UINT16_MAX) 438fcf5ef2aSThomas Huth SATCVT(sd, uw, int64_t, uint32_t, 0, UINT32_MAX) 
439fcf5ef2aSThomas Huth #undef SATCVT 440fcf5ef2aSThomas Huth #undef SATCVTU 441fcf5ef2aSThomas Huth 442fcf5ef2aSThomas Huth void helper_lvsl(ppc_avr_t *r, target_ulong sh) 443fcf5ef2aSThomas Huth { 444fcf5ef2aSThomas Huth int i, j = (sh & 0xf); 445fcf5ef2aSThomas Huth 446fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 447fcf5ef2aSThomas Huth r->u8[i] = j++; 448fcf5ef2aSThomas Huth } 449fcf5ef2aSThomas Huth } 450fcf5ef2aSThomas Huth 451fcf5ef2aSThomas Huth void helper_lvsr(ppc_avr_t *r, target_ulong sh) 452fcf5ef2aSThomas Huth { 453fcf5ef2aSThomas Huth int i, j = 0x10 - (sh & 0xf); 454fcf5ef2aSThomas Huth 455fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 456fcf5ef2aSThomas Huth r->u8[i] = j++; 457fcf5ef2aSThomas Huth } 458fcf5ef2aSThomas Huth } 459fcf5ef2aSThomas Huth 460fcf5ef2aSThomas Huth void helper_mtvscr(CPUPPCState *env, ppc_avr_t *r) 461fcf5ef2aSThomas Huth { 462fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 463fcf5ef2aSThomas Huth env->vscr = r->u32[3]; 464fcf5ef2aSThomas Huth #else 465fcf5ef2aSThomas Huth env->vscr = r->u32[0]; 466fcf5ef2aSThomas Huth #endif 467fcf5ef2aSThomas Huth set_flush_to_zero(vscr_nj, &env->vec_status); 468fcf5ef2aSThomas Huth } 469fcf5ef2aSThomas Huth 470fcf5ef2aSThomas Huth void helper_vaddcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 471fcf5ef2aSThomas Huth { 472fcf5ef2aSThomas Huth int i; 473fcf5ef2aSThomas Huth 474fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 475fcf5ef2aSThomas Huth r->u32[i] = ~a->u32[i] < b->u32[i]; 476fcf5ef2aSThomas Huth } 477fcf5ef2aSThomas Huth } 478fcf5ef2aSThomas Huth 479fcf5ef2aSThomas Huth /* vprtybw */ 480fcf5ef2aSThomas Huth void helper_vprtybw(ppc_avr_t *r, ppc_avr_t *b) 481fcf5ef2aSThomas Huth { 482fcf5ef2aSThomas Huth int i; 483fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 484fcf5ef2aSThomas Huth uint64_t res = b->u32[i] ^ (b->u32[i] >> 16); 485fcf5ef2aSThomas Huth res ^= res >> 8; 486fcf5ef2aSThomas Huth r->u32[i] = res & 1; 487fcf5ef2aSThomas 
Huth } 488fcf5ef2aSThomas Huth } 489fcf5ef2aSThomas Huth 490fcf5ef2aSThomas Huth /* vprtybd */ 491fcf5ef2aSThomas Huth void helper_vprtybd(ppc_avr_t *r, ppc_avr_t *b) 492fcf5ef2aSThomas Huth { 493fcf5ef2aSThomas Huth int i; 494fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 495fcf5ef2aSThomas Huth uint64_t res = b->u64[i] ^ (b->u64[i] >> 32); 496fcf5ef2aSThomas Huth res ^= res >> 16; 497fcf5ef2aSThomas Huth res ^= res >> 8; 498fcf5ef2aSThomas Huth r->u64[i] = res & 1; 499fcf5ef2aSThomas Huth } 500fcf5ef2aSThomas Huth } 501fcf5ef2aSThomas Huth 502fcf5ef2aSThomas Huth /* vprtybq */ 503fcf5ef2aSThomas Huth void helper_vprtybq(ppc_avr_t *r, ppc_avr_t *b) 504fcf5ef2aSThomas Huth { 505fcf5ef2aSThomas Huth uint64_t res = b->u64[0] ^ b->u64[1]; 506fcf5ef2aSThomas Huth res ^= res >> 32; 507fcf5ef2aSThomas Huth res ^= res >> 16; 508fcf5ef2aSThomas Huth res ^= res >> 8; 5093c385a93SMark Cave-Ayland r->VsrD(1) = res & 1; 5103c385a93SMark Cave-Ayland r->VsrD(0) = 0; 511fcf5ef2aSThomas Huth } 512fcf5ef2aSThomas Huth 513fcf5ef2aSThomas Huth #define VARITH_DO(name, op, element) \ 514fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 515fcf5ef2aSThomas Huth { \ 516fcf5ef2aSThomas Huth int i; \ 517fcf5ef2aSThomas Huth \ 518fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 519fcf5ef2aSThomas Huth r->element[i] = a->element[i] op b->element[i]; \ 520fcf5ef2aSThomas Huth } \ 521fcf5ef2aSThomas Huth } 522fcf5ef2aSThomas Huth #define VARITH(suffix, element) \ 523fcf5ef2aSThomas Huth VARITH_DO(add##suffix, +, element) \ 524fcf5ef2aSThomas Huth VARITH_DO(sub##suffix, -, element) 525fcf5ef2aSThomas Huth VARITH(ubm, u8) 526fcf5ef2aSThomas Huth VARITH(uhm, u16) 527fcf5ef2aSThomas Huth VARITH(uwm, u32) 528fcf5ef2aSThomas Huth VARITH(udm, u64) 529fcf5ef2aSThomas Huth VARITH_DO(muluwm, *, u32) 530fcf5ef2aSThomas Huth #undef VARITH_DO 531fcf5ef2aSThomas Huth #undef VARITH 532fcf5ef2aSThomas Huth 533fcf5ef2aSThomas Huth #define 
VARITHFP(suffix, func) \ 534fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 535fcf5ef2aSThomas Huth ppc_avr_t *b) \ 536fcf5ef2aSThomas Huth { \ 537fcf5ef2aSThomas Huth int i; \ 538fcf5ef2aSThomas Huth \ 53905ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 54005ee3e8aSMark Cave-Ayland r->f32[i] = func(a->f32[i], b->f32[i], &env->vec_status); \ 541fcf5ef2aSThomas Huth } \ 542fcf5ef2aSThomas Huth } 543fcf5ef2aSThomas Huth VARITHFP(addfp, float32_add) 544fcf5ef2aSThomas Huth VARITHFP(subfp, float32_sub) 545fcf5ef2aSThomas Huth VARITHFP(minfp, float32_min) 546fcf5ef2aSThomas Huth VARITHFP(maxfp, float32_max) 547fcf5ef2aSThomas Huth #undef VARITHFP 548fcf5ef2aSThomas Huth 549fcf5ef2aSThomas Huth #define VARITHFPFMA(suffix, type) \ 550fcf5ef2aSThomas Huth void helper_v##suffix(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 551fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) \ 552fcf5ef2aSThomas Huth { \ 553fcf5ef2aSThomas Huth int i; \ 55405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 55505ee3e8aSMark Cave-Ayland r->f32[i] = float32_muladd(a->f32[i], c->f32[i], b->f32[i], \ 556fcf5ef2aSThomas Huth type, &env->vec_status); \ 557fcf5ef2aSThomas Huth } \ 558fcf5ef2aSThomas Huth } 559fcf5ef2aSThomas Huth VARITHFPFMA(maddfp, 0); 560fcf5ef2aSThomas Huth VARITHFPFMA(nmsubfp, float_muladd_negate_result | float_muladd_negate_c); 561fcf5ef2aSThomas Huth #undef VARITHFPFMA 562fcf5ef2aSThomas Huth 563fcf5ef2aSThomas Huth #define VARITHSAT_CASE(type, op, cvt, element) \ 564fcf5ef2aSThomas Huth { \ 565fcf5ef2aSThomas Huth type result = (type)a->element[i] op (type)b->element[i]; \ 566fcf5ef2aSThomas Huth r->element[i] = cvt(result, &sat); \ 567fcf5ef2aSThomas Huth } 568fcf5ef2aSThomas Huth 569fcf5ef2aSThomas Huth #define VARITHSAT_DO(name, op, optype, cvt, element) \ 570fcf5ef2aSThomas Huth void helper_v##name(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, \ 571fcf5ef2aSThomas Huth ppc_avr_t *b) \ 
572fcf5ef2aSThomas Huth { \ 573fcf5ef2aSThomas Huth int sat = 0; \ 574fcf5ef2aSThomas Huth int i; \ 575fcf5ef2aSThomas Huth \ 576fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 577fcf5ef2aSThomas Huth switch (sizeof(r->element[0])) { \ 578fcf5ef2aSThomas Huth case 1: \ 579fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 580fcf5ef2aSThomas Huth break; \ 581fcf5ef2aSThomas Huth case 2: \ 582fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 583fcf5ef2aSThomas Huth break; \ 584fcf5ef2aSThomas Huth case 4: \ 585fcf5ef2aSThomas Huth VARITHSAT_CASE(optype, op, cvt, element); \ 586fcf5ef2aSThomas Huth break; \ 587fcf5ef2aSThomas Huth } \ 588fcf5ef2aSThomas Huth } \ 589fcf5ef2aSThomas Huth if (sat) { \ 590fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); \ 591fcf5ef2aSThomas Huth } \ 592fcf5ef2aSThomas Huth } 593fcf5ef2aSThomas Huth #define VARITHSAT_SIGNED(suffix, element, optype, cvt) \ 594fcf5ef2aSThomas Huth VARITHSAT_DO(adds##suffix##s, +, optype, cvt, element) \ 595fcf5ef2aSThomas Huth VARITHSAT_DO(subs##suffix##s, -, optype, cvt, element) 596fcf5ef2aSThomas Huth #define VARITHSAT_UNSIGNED(suffix, element, optype, cvt) \ 597fcf5ef2aSThomas Huth VARITHSAT_DO(addu##suffix##s, +, optype, cvt, element) \ 598fcf5ef2aSThomas Huth VARITHSAT_DO(subu##suffix##s, -, optype, cvt, element) 599fcf5ef2aSThomas Huth VARITHSAT_SIGNED(b, s8, int16_t, cvtshsb) 600fcf5ef2aSThomas Huth VARITHSAT_SIGNED(h, s16, int32_t, cvtswsh) 601fcf5ef2aSThomas Huth VARITHSAT_SIGNED(w, s32, int64_t, cvtsdsw) 602fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(b, u8, uint16_t, cvtshub) 603fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(h, u16, uint32_t, cvtswuh) 604fcf5ef2aSThomas Huth VARITHSAT_UNSIGNED(w, u32, uint64_t, cvtsduw) 605fcf5ef2aSThomas Huth #undef VARITHSAT_CASE 606fcf5ef2aSThomas Huth #undef VARITHSAT_DO 607fcf5ef2aSThomas Huth #undef VARITHSAT_SIGNED 608fcf5ef2aSThomas Huth #undef VARITHSAT_UNSIGNED 609fcf5ef2aSThomas Huth 610fcf5ef2aSThomas Huth 
#define VAVG_DO(name, element, etype) \ 611fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 612fcf5ef2aSThomas Huth { \ 613fcf5ef2aSThomas Huth int i; \ 614fcf5ef2aSThomas Huth \ 615fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 616fcf5ef2aSThomas Huth etype x = (etype)a->element[i] + (etype)b->element[i] + 1; \ 617fcf5ef2aSThomas Huth r->element[i] = x >> 1; \ 618fcf5ef2aSThomas Huth } \ 619fcf5ef2aSThomas Huth } 620fcf5ef2aSThomas Huth 621fcf5ef2aSThomas Huth #define VAVG(type, signed_element, signed_type, unsigned_element, \ 622fcf5ef2aSThomas Huth unsigned_type) \ 623fcf5ef2aSThomas Huth VAVG_DO(avgs##type, signed_element, signed_type) \ 624fcf5ef2aSThomas Huth VAVG_DO(avgu##type, unsigned_element, unsigned_type) 625fcf5ef2aSThomas Huth VAVG(b, s8, int16_t, u8, uint16_t) 626fcf5ef2aSThomas Huth VAVG(h, s16, int32_t, u16, uint32_t) 627fcf5ef2aSThomas Huth VAVG(w, s32, int64_t, u32, uint64_t) 628fcf5ef2aSThomas Huth #undef VAVG_DO 629fcf5ef2aSThomas Huth #undef VAVG 630fcf5ef2aSThomas Huth 631fcf5ef2aSThomas Huth #define VABSDU_DO(name, element) \ 632fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 633fcf5ef2aSThomas Huth { \ 634fcf5ef2aSThomas Huth int i; \ 635fcf5ef2aSThomas Huth \ 636fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 637fcf5ef2aSThomas Huth r->element[i] = (a->element[i] > b->element[i]) ? 
\ 638fcf5ef2aSThomas Huth (a->element[i] - b->element[i]) : \ 639fcf5ef2aSThomas Huth (b->element[i] - a->element[i]); \ 640fcf5ef2aSThomas Huth } \ 641fcf5ef2aSThomas Huth } 642fcf5ef2aSThomas Huth 643fcf5ef2aSThomas Huth /* VABSDU - Vector absolute difference unsigned 644fcf5ef2aSThomas Huth * name - instruction mnemonic suffix (b: byte, h: halfword, w: word) 645fcf5ef2aSThomas Huth * element - element type to access from vector 646fcf5ef2aSThomas Huth */ 647fcf5ef2aSThomas Huth #define VABSDU(type, element) \ 648fcf5ef2aSThomas Huth VABSDU_DO(absdu##type, element) 649fcf5ef2aSThomas Huth VABSDU(b, u8) 650fcf5ef2aSThomas Huth VABSDU(h, u16) 651fcf5ef2aSThomas Huth VABSDU(w, u32) 652fcf5ef2aSThomas Huth #undef VABSDU_DO 653fcf5ef2aSThomas Huth #undef VABSDU 654fcf5ef2aSThomas Huth 655fcf5ef2aSThomas Huth #define VCF(suffix, cvt, element) \ 656fcf5ef2aSThomas Huth void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r, \ 657fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 658fcf5ef2aSThomas Huth { \ 659fcf5ef2aSThomas Huth int i; \ 660fcf5ef2aSThomas Huth \ 66105ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 662fcf5ef2aSThomas Huth float32 t = cvt(b->element[i], &env->vec_status); \ 66305ee3e8aSMark Cave-Ayland r->f32[i] = float32_scalbn(t, -uim, &env->vec_status); \ 664fcf5ef2aSThomas Huth } \ 665fcf5ef2aSThomas Huth } 666fcf5ef2aSThomas Huth VCF(ux, uint32_to_float32, u32) 667fcf5ef2aSThomas Huth VCF(sx, int32_to_float32, s32) 668fcf5ef2aSThomas Huth #undef VCF 669fcf5ef2aSThomas Huth 670fcf5ef2aSThomas Huth #define VCMP_DO(suffix, compare, element, record) \ 671fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 672fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 673fcf5ef2aSThomas Huth { \ 674fcf5ef2aSThomas Huth uint64_t ones = (uint64_t)-1; \ 675fcf5ef2aSThomas Huth uint64_t all = ones; \ 676fcf5ef2aSThomas Huth uint64_t none = 0; \ 677fcf5ef2aSThomas Huth int i; \ 678fcf5ef2aSThomas Huth \ 
679fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 680fcf5ef2aSThomas Huth uint64_t result = (a->element[i] compare b->element[i] ? \ 681fcf5ef2aSThomas Huth ones : 0x0); \ 682fcf5ef2aSThomas Huth switch (sizeof(a->element[0])) { \ 683fcf5ef2aSThomas Huth case 8: \ 684fcf5ef2aSThomas Huth r->u64[i] = result; \ 685fcf5ef2aSThomas Huth break; \ 686fcf5ef2aSThomas Huth case 4: \ 687fcf5ef2aSThomas Huth r->u32[i] = result; \ 688fcf5ef2aSThomas Huth break; \ 689fcf5ef2aSThomas Huth case 2: \ 690fcf5ef2aSThomas Huth r->u16[i] = result; \ 691fcf5ef2aSThomas Huth break; \ 692fcf5ef2aSThomas Huth case 1: \ 693fcf5ef2aSThomas Huth r->u8[i] = result; \ 694fcf5ef2aSThomas Huth break; \ 695fcf5ef2aSThomas Huth } \ 696fcf5ef2aSThomas Huth all &= result; \ 697fcf5ef2aSThomas Huth none |= result; \ 698fcf5ef2aSThomas Huth } \ 699fcf5ef2aSThomas Huth if (record) { \ 700fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 701fcf5ef2aSThomas Huth } \ 702fcf5ef2aSThomas Huth } 703fcf5ef2aSThomas Huth #define VCMP(suffix, compare, element) \ 704fcf5ef2aSThomas Huth VCMP_DO(suffix, compare, element, 0) \ 705fcf5ef2aSThomas Huth VCMP_DO(suffix##_dot, compare, element, 1) 706fcf5ef2aSThomas Huth VCMP(equb, ==, u8) 707fcf5ef2aSThomas Huth VCMP(equh, ==, u16) 708fcf5ef2aSThomas Huth VCMP(equw, ==, u32) 709fcf5ef2aSThomas Huth VCMP(equd, ==, u64) 710fcf5ef2aSThomas Huth VCMP(gtub, >, u8) 711fcf5ef2aSThomas Huth VCMP(gtuh, >, u16) 712fcf5ef2aSThomas Huth VCMP(gtuw, >, u32) 713fcf5ef2aSThomas Huth VCMP(gtud, >, u64) 714fcf5ef2aSThomas Huth VCMP(gtsb, >, s8) 715fcf5ef2aSThomas Huth VCMP(gtsh, >, s16) 716fcf5ef2aSThomas Huth VCMP(gtsw, >, s32) 717fcf5ef2aSThomas Huth VCMP(gtsd, >, s64) 718fcf5ef2aSThomas Huth #undef VCMP_DO 719fcf5ef2aSThomas Huth #undef VCMP 720fcf5ef2aSThomas Huth 721fcf5ef2aSThomas Huth #define VCMPNE_DO(suffix, element, etype, cmpzero, record) \ 722fcf5ef2aSThomas Huth void helper_vcmpne##suffix(CPUPPCState *env, ppc_avr_t *r, \ 
723fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 724fcf5ef2aSThomas Huth { \ 725fcf5ef2aSThomas Huth etype ones = (etype)-1; \ 726fcf5ef2aSThomas Huth etype all = ones; \ 727fcf5ef2aSThomas Huth etype result, none = 0; \ 728fcf5ef2aSThomas Huth int i; \ 729fcf5ef2aSThomas Huth \ 730fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 731fcf5ef2aSThomas Huth if (cmpzero) { \ 732fcf5ef2aSThomas Huth result = ((a->element[i] == 0) \ 733fcf5ef2aSThomas Huth || (b->element[i] == 0) \ 734fcf5ef2aSThomas Huth || (a->element[i] != b->element[i]) ? \ 735fcf5ef2aSThomas Huth ones : 0x0); \ 736fcf5ef2aSThomas Huth } else { \ 737fcf5ef2aSThomas Huth result = (a->element[i] != b->element[i]) ? ones : 0x0; \ 738fcf5ef2aSThomas Huth } \ 739fcf5ef2aSThomas Huth r->element[i] = result; \ 740fcf5ef2aSThomas Huth all &= result; \ 741fcf5ef2aSThomas Huth none |= result; \ 742fcf5ef2aSThomas Huth } \ 743fcf5ef2aSThomas Huth if (record) { \ 744fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 745fcf5ef2aSThomas Huth } \ 746fcf5ef2aSThomas Huth } 747fcf5ef2aSThomas Huth 748fcf5ef2aSThomas Huth /* VCMPNEZ - Vector compare not equal to zero 749fcf5ef2aSThomas Huth * suffix - instruction mnemonic suffix (b: byte, h: halfword, w: word) 750fcf5ef2aSThomas Huth * element - element type to access from vector 751fcf5ef2aSThomas Huth */ 752fcf5ef2aSThomas Huth #define VCMPNE(suffix, element, etype, cmpzero) \ 753fcf5ef2aSThomas Huth VCMPNE_DO(suffix, element, etype, cmpzero, 0) \ 754fcf5ef2aSThomas Huth VCMPNE_DO(suffix##_dot, element, etype, cmpzero, 1) 755fcf5ef2aSThomas Huth VCMPNE(zb, u8, uint8_t, 1) 756fcf5ef2aSThomas Huth VCMPNE(zh, u16, uint16_t, 1) 757fcf5ef2aSThomas Huth VCMPNE(zw, u32, uint32_t, 1) 758fcf5ef2aSThomas Huth VCMPNE(b, u8, uint8_t, 0) 759fcf5ef2aSThomas Huth VCMPNE(h, u16, uint16_t, 0) 760fcf5ef2aSThomas Huth VCMPNE(w, u32, uint32_t, 0) 761fcf5ef2aSThomas Huth #undef VCMPNE_DO 762fcf5ef2aSThomas Huth #undef VCMPNE 
763fcf5ef2aSThomas Huth 764fcf5ef2aSThomas Huth #define VCMPFP_DO(suffix, compare, order, record) \ 765fcf5ef2aSThomas Huth void helper_vcmp##suffix(CPUPPCState *env, ppc_avr_t *r, \ 766fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 767fcf5ef2aSThomas Huth { \ 768fcf5ef2aSThomas Huth uint32_t ones = (uint32_t)-1; \ 769fcf5ef2aSThomas Huth uint32_t all = ones; \ 770fcf5ef2aSThomas Huth uint32_t none = 0; \ 771fcf5ef2aSThomas Huth int i; \ 772fcf5ef2aSThomas Huth \ 77305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 774fcf5ef2aSThomas Huth uint32_t result; \ 77505ee3e8aSMark Cave-Ayland int rel = float32_compare_quiet(a->f32[i], b->f32[i], \ 776fcf5ef2aSThomas Huth &env->vec_status); \ 777fcf5ef2aSThomas Huth if (rel == float_relation_unordered) { \ 778fcf5ef2aSThomas Huth result = 0; \ 779fcf5ef2aSThomas Huth } else if (rel compare order) { \ 780fcf5ef2aSThomas Huth result = ones; \ 781fcf5ef2aSThomas Huth } else { \ 782fcf5ef2aSThomas Huth result = 0; \ 783fcf5ef2aSThomas Huth } \ 784fcf5ef2aSThomas Huth r->u32[i] = result; \ 785fcf5ef2aSThomas Huth all &= result; \ 786fcf5ef2aSThomas Huth none |= result; \ 787fcf5ef2aSThomas Huth } \ 788fcf5ef2aSThomas Huth if (record) { \ 789fcf5ef2aSThomas Huth env->crf[6] = ((all != 0) << 3) | ((none == 0) << 1); \ 790fcf5ef2aSThomas Huth } \ 791fcf5ef2aSThomas Huth } 792fcf5ef2aSThomas Huth #define VCMPFP(suffix, compare, order) \ 793fcf5ef2aSThomas Huth VCMPFP_DO(suffix, compare, order, 0) \ 794fcf5ef2aSThomas Huth VCMPFP_DO(suffix##_dot, compare, order, 1) 795fcf5ef2aSThomas Huth VCMPFP(eqfp, ==, float_relation_equal) 796fcf5ef2aSThomas Huth VCMPFP(gefp, !=, float_relation_less) 797fcf5ef2aSThomas Huth VCMPFP(gtfp, ==, float_relation_greater) 798fcf5ef2aSThomas Huth #undef VCMPFP_DO 799fcf5ef2aSThomas Huth #undef VCMPFP 800fcf5ef2aSThomas Huth 801fcf5ef2aSThomas Huth static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r, 802fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b, int record) 
803fcf5ef2aSThomas Huth { 804fcf5ef2aSThomas Huth int i; 805fcf5ef2aSThomas Huth int all_in = 0; 806fcf5ef2aSThomas Huth 80705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 80805ee3e8aSMark Cave-Ayland int le_rel = float32_compare_quiet(a->f32[i], b->f32[i], 80905ee3e8aSMark Cave-Ayland &env->vec_status); 810fcf5ef2aSThomas Huth if (le_rel == float_relation_unordered) { 811fcf5ef2aSThomas Huth r->u32[i] = 0xc0000000; 812fcf5ef2aSThomas Huth all_in = 1; 813fcf5ef2aSThomas Huth } else { 81405ee3e8aSMark Cave-Ayland float32 bneg = float32_chs(b->f32[i]); 81505ee3e8aSMark Cave-Ayland int ge_rel = float32_compare_quiet(a->f32[i], bneg, 81605ee3e8aSMark Cave-Ayland &env->vec_status); 817fcf5ef2aSThomas Huth int le = le_rel != float_relation_greater; 818fcf5ef2aSThomas Huth int ge = ge_rel != float_relation_less; 819fcf5ef2aSThomas Huth 820fcf5ef2aSThomas Huth r->u32[i] = ((!le) << 31) | ((!ge) << 30); 821fcf5ef2aSThomas Huth all_in |= (!le | !ge); 822fcf5ef2aSThomas Huth } 823fcf5ef2aSThomas Huth } 824fcf5ef2aSThomas Huth if (record) { 825fcf5ef2aSThomas Huth env->crf[6] = (all_in == 0) << 1; 826fcf5ef2aSThomas Huth } 827fcf5ef2aSThomas Huth } 828fcf5ef2aSThomas Huth 829fcf5ef2aSThomas Huth void helper_vcmpbfp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 830fcf5ef2aSThomas Huth { 831fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 0); 832fcf5ef2aSThomas Huth } 833fcf5ef2aSThomas Huth 834fcf5ef2aSThomas Huth void helper_vcmpbfp_dot(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 835fcf5ef2aSThomas Huth ppc_avr_t *b) 836fcf5ef2aSThomas Huth { 837fcf5ef2aSThomas Huth vcmpbfp_internal(env, r, a, b, 1); 838fcf5ef2aSThomas Huth } 839fcf5ef2aSThomas Huth 840fcf5ef2aSThomas Huth #define VCT(suffix, satcvt, element) \ 841fcf5ef2aSThomas Huth void helper_vct##suffix(CPUPPCState *env, ppc_avr_t *r, \ 842fcf5ef2aSThomas Huth ppc_avr_t *b, uint32_t uim) \ 843fcf5ef2aSThomas Huth { \ 844fcf5ef2aSThomas Huth int i; \ 845fcf5ef2aSThomas Huth int sat = 
0; \ 846fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 847fcf5ef2aSThomas Huth \ 848fcf5ef2aSThomas Huth set_float_rounding_mode(float_round_to_zero, &s); \ 84905ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 85005ee3e8aSMark Cave-Ayland if (float32_is_any_nan(b->f32[i])) { \ 851fcf5ef2aSThomas Huth r->element[i] = 0; \ 852fcf5ef2aSThomas Huth } else { \ 85305ee3e8aSMark Cave-Ayland float64 t = float32_to_float64(b->f32[i], &s); \ 854fcf5ef2aSThomas Huth int64_t j; \ 855fcf5ef2aSThomas Huth \ 856fcf5ef2aSThomas Huth t = float64_scalbn(t, uim, &s); \ 857fcf5ef2aSThomas Huth j = float64_to_int64(t, &s); \ 858fcf5ef2aSThomas Huth r->element[i] = satcvt(j, &sat); \ 859fcf5ef2aSThomas Huth } \ 860fcf5ef2aSThomas Huth } \ 861fcf5ef2aSThomas Huth if (sat) { \ 862fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); \ 863fcf5ef2aSThomas Huth } \ 864fcf5ef2aSThomas Huth } 865fcf5ef2aSThomas Huth VCT(uxs, cvtsduw, u32) 866fcf5ef2aSThomas Huth VCT(sxs, cvtsdsw, s32) 867fcf5ef2aSThomas Huth #undef VCT 868fcf5ef2aSThomas Huth 869fcf5ef2aSThomas Huth target_ulong helper_vclzlsbb(ppc_avr_t *r) 870fcf5ef2aSThomas Huth { 871fcf5ef2aSThomas Huth target_ulong count = 0; 872fcf5ef2aSThomas Huth int i; 873fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 874fcf5ef2aSThomas Huth if (r->u8[i] & 0x01) { 875fcf5ef2aSThomas Huth break; 876fcf5ef2aSThomas Huth } 877fcf5ef2aSThomas Huth count++; 878fcf5ef2aSThomas Huth } 879fcf5ef2aSThomas Huth return count; 880fcf5ef2aSThomas Huth } 881fcf5ef2aSThomas Huth 882fcf5ef2aSThomas Huth target_ulong helper_vctzlsbb(ppc_avr_t *r) 883fcf5ef2aSThomas Huth { 884fcf5ef2aSThomas Huth target_ulong count = 0; 885fcf5ef2aSThomas Huth int i; 886fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 887fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 888fcf5ef2aSThomas Huth #else 889fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 890fcf5ef2aSThomas Huth #endif 891fcf5ef2aSThomas Huth if (r->u8[i] 
& 0x01) { 892fcf5ef2aSThomas Huth break; 893fcf5ef2aSThomas Huth } 894fcf5ef2aSThomas Huth count++; 895fcf5ef2aSThomas Huth } 896fcf5ef2aSThomas Huth return count; 897fcf5ef2aSThomas Huth } 898fcf5ef2aSThomas Huth 899fcf5ef2aSThomas Huth void helper_vmhaddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 900fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 901fcf5ef2aSThomas Huth { 902fcf5ef2aSThomas Huth int sat = 0; 903fcf5ef2aSThomas Huth int i; 904fcf5ef2aSThomas Huth 905fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 906fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 907fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 908fcf5ef2aSThomas Huth 909fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 910fcf5ef2aSThomas Huth } 911fcf5ef2aSThomas Huth 912fcf5ef2aSThomas Huth if (sat) { 913fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 914fcf5ef2aSThomas Huth } 915fcf5ef2aSThomas Huth } 916fcf5ef2aSThomas Huth 917fcf5ef2aSThomas Huth void helper_vmhraddshs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 918fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 919fcf5ef2aSThomas Huth { 920fcf5ef2aSThomas Huth int sat = 0; 921fcf5ef2aSThomas Huth int i; 922fcf5ef2aSThomas Huth 923fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 924fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i] + 0x00004000; 925fcf5ef2aSThomas Huth int32_t t = (int32_t)c->s16[i] + (prod >> 15); 926fcf5ef2aSThomas Huth r->s16[i] = cvtswsh(t, &sat); 927fcf5ef2aSThomas Huth } 928fcf5ef2aSThomas Huth 929fcf5ef2aSThomas Huth if (sat) { 930fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 931fcf5ef2aSThomas Huth } 932fcf5ef2aSThomas Huth } 933fcf5ef2aSThomas Huth 934fcf5ef2aSThomas Huth #define VMINMAX_DO(name, compare, element) \ 935fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 936fcf5ef2aSThomas Huth { \ 937fcf5ef2aSThomas Huth int i; \ 938fcf5ef2aSThomas Huth \ 939fcf5ef2aSThomas Huth for (i = 0; i < 
ARRAY_SIZE(r->element); i++) { \ 940fcf5ef2aSThomas Huth if (a->element[i] compare b->element[i]) { \ 941fcf5ef2aSThomas Huth r->element[i] = b->element[i]; \ 942fcf5ef2aSThomas Huth } else { \ 943fcf5ef2aSThomas Huth r->element[i] = a->element[i]; \ 944fcf5ef2aSThomas Huth } \ 945fcf5ef2aSThomas Huth } \ 946fcf5ef2aSThomas Huth } 947fcf5ef2aSThomas Huth #define VMINMAX(suffix, element) \ 948fcf5ef2aSThomas Huth VMINMAX_DO(min##suffix, >, element) \ 949fcf5ef2aSThomas Huth VMINMAX_DO(max##suffix, <, element) 950fcf5ef2aSThomas Huth VMINMAX(sb, s8) 951fcf5ef2aSThomas Huth VMINMAX(sh, s16) 952fcf5ef2aSThomas Huth VMINMAX(sw, s32) 953fcf5ef2aSThomas Huth VMINMAX(sd, s64) 954fcf5ef2aSThomas Huth VMINMAX(ub, u8) 955fcf5ef2aSThomas Huth VMINMAX(uh, u16) 956fcf5ef2aSThomas Huth VMINMAX(uw, u32) 957fcf5ef2aSThomas Huth VMINMAX(ud, u64) 958fcf5ef2aSThomas Huth #undef VMINMAX_DO 959fcf5ef2aSThomas Huth #undef VMINMAX 960fcf5ef2aSThomas Huth 961fcf5ef2aSThomas Huth void helper_vmladduhm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 962fcf5ef2aSThomas Huth { 963fcf5ef2aSThomas Huth int i; 964fcf5ef2aSThomas Huth 965fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 966fcf5ef2aSThomas Huth int32_t prod = a->s16[i] * b->s16[i]; 967fcf5ef2aSThomas Huth r->s16[i] = (int16_t) (prod + c->s16[i]); 968fcf5ef2aSThomas Huth } 969fcf5ef2aSThomas Huth } 970fcf5ef2aSThomas Huth 971d81c2040SMark Cave-Ayland #define VMRG_DO(name, element, access, ofs) \ 972fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 973fcf5ef2aSThomas Huth { \ 974fcf5ef2aSThomas Huth ppc_avr_t result; \ 975d81c2040SMark Cave-Ayland int i, half = ARRAY_SIZE(r->element) / 2; \ 976fcf5ef2aSThomas Huth \ 977d81c2040SMark Cave-Ayland for (i = 0; i < half; i++) { \ 978d81c2040SMark Cave-Ayland result.access(i * 2 + 0) = a->access(i + ofs); \ 979d81c2040SMark Cave-Ayland result.access(i * 2 + 1) = b->access(i + ofs); \ 980fcf5ef2aSThomas Huth } \ 981fcf5ef2aSThomas 
Huth *r = result; \ 982fcf5ef2aSThomas Huth } 983d81c2040SMark Cave-Ayland 984d81c2040SMark Cave-Ayland #define VMRG(suffix, element, access) \ 985d81c2040SMark Cave-Ayland VMRG_DO(mrgl##suffix, element, access, half) \ 986d81c2040SMark Cave-Ayland VMRG_DO(mrgh##suffix, element, access, 0) 987d81c2040SMark Cave-Ayland VMRG(b, u8, VsrB) 988d81c2040SMark Cave-Ayland VMRG(h, u16, VsrH) 989d81c2040SMark Cave-Ayland VMRG(w, u32, VsrW) 990fcf5ef2aSThomas Huth #undef VMRG_DO 991fcf5ef2aSThomas Huth #undef VMRG 992fcf5ef2aSThomas Huth 993fcf5ef2aSThomas Huth void helper_vmsummbm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 994fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 995fcf5ef2aSThomas Huth { 996fcf5ef2aSThomas Huth int32_t prod[16]; 997fcf5ef2aSThomas Huth int i; 998fcf5ef2aSThomas Huth 999fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s8); i++) { 1000fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s8[i] * b->u8[i]; 1001fcf5ef2aSThomas Huth } 1002fcf5ef2aSThomas Huth 1003fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1004fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[4 * i] + prod[4 * i + 1] + 1005fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1006fcf5ef2aSThomas Huth } 1007fcf5ef2aSThomas Huth } 1008fcf5ef2aSThomas Huth 1009fcf5ef2aSThomas Huth void helper_vmsumshm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1010fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1011fcf5ef2aSThomas Huth { 1012fcf5ef2aSThomas Huth int32_t prod[8]; 1013fcf5ef2aSThomas Huth int i; 1014fcf5ef2aSThomas Huth 1015fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1016fcf5ef2aSThomas Huth prod[i] = a->s16[i] * b->s16[i]; 1017fcf5ef2aSThomas Huth } 1018fcf5ef2aSThomas Huth 1019fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1020fcf5ef2aSThomas Huth r->s32[i] = c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1021fcf5ef2aSThomas Huth } 1022fcf5ef2aSThomas Huth } 1023fcf5ef2aSThomas Huth 1024fcf5ef2aSThomas Huth void helper_vmsumshs(CPUPPCState *env, ppc_avr_t *r, 
ppc_avr_t *a, 1025fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1026fcf5ef2aSThomas Huth { 1027fcf5ef2aSThomas Huth int32_t prod[8]; 1028fcf5ef2aSThomas Huth int i; 1029fcf5ef2aSThomas Huth int sat = 0; 1030fcf5ef2aSThomas Huth 1031fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s16); i++) { 1032fcf5ef2aSThomas Huth prod[i] = (int32_t)a->s16[i] * b->s16[i]; 1033fcf5ef2aSThomas Huth } 1034fcf5ef2aSThomas Huth 1035fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1036fcf5ef2aSThomas Huth int64_t t = (int64_t)c->s32[i] + prod[2 * i] + prod[2 * i + 1]; 1037fcf5ef2aSThomas Huth 1038fcf5ef2aSThomas Huth r->u32[i] = cvtsdsw(t, &sat); 1039fcf5ef2aSThomas Huth } 1040fcf5ef2aSThomas Huth 1041fcf5ef2aSThomas Huth if (sat) { 1042fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 1043fcf5ef2aSThomas Huth } 1044fcf5ef2aSThomas Huth } 1045fcf5ef2aSThomas Huth 1046fcf5ef2aSThomas Huth void helper_vmsumubm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1047fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1048fcf5ef2aSThomas Huth { 1049fcf5ef2aSThomas Huth uint16_t prod[16]; 1050fcf5ef2aSThomas Huth int i; 1051fcf5ef2aSThomas Huth 1052fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1053fcf5ef2aSThomas Huth prod[i] = a->u8[i] * b->u8[i]; 1054fcf5ef2aSThomas Huth } 1055fcf5ef2aSThomas Huth 1056fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1057fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[4 * i] + prod[4 * i + 1] + 1058fcf5ef2aSThomas Huth prod[4 * i + 2] + prod[4 * i + 3]; 1059fcf5ef2aSThomas Huth } 1060fcf5ef2aSThomas Huth } 1061fcf5ef2aSThomas Huth 1062fcf5ef2aSThomas Huth void helper_vmsumuhm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1063fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1064fcf5ef2aSThomas Huth { 1065fcf5ef2aSThomas Huth uint32_t prod[8]; 1066fcf5ef2aSThomas Huth int i; 1067fcf5ef2aSThomas Huth 1068fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1069fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 
1070fcf5ef2aSThomas Huth } 1071fcf5ef2aSThomas Huth 1072fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 1073fcf5ef2aSThomas Huth r->u32[i] = c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1074fcf5ef2aSThomas Huth } 1075fcf5ef2aSThomas Huth } 1076fcf5ef2aSThomas Huth 1077fcf5ef2aSThomas Huth void helper_vmsumuhs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, 1078fcf5ef2aSThomas Huth ppc_avr_t *b, ppc_avr_t *c) 1079fcf5ef2aSThomas Huth { 1080fcf5ef2aSThomas Huth uint32_t prod[8]; 1081fcf5ef2aSThomas Huth int i; 1082fcf5ef2aSThomas Huth int sat = 0; 1083fcf5ef2aSThomas Huth 1084fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u16); i++) { 1085fcf5ef2aSThomas Huth prod[i] = a->u16[i] * b->u16[i]; 1086fcf5ef2aSThomas Huth } 1087fcf5ef2aSThomas Huth 1088fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, s32) { 1089fcf5ef2aSThomas Huth uint64_t t = (uint64_t)c->u32[i] + prod[2 * i] + prod[2 * i + 1]; 1090fcf5ef2aSThomas Huth 1091fcf5ef2aSThomas Huth r->u32[i] = cvtuduw(t, &sat); 1092fcf5ef2aSThomas Huth } 1093fcf5ef2aSThomas Huth 1094fcf5ef2aSThomas Huth if (sat) { 1095fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 1096fcf5ef2aSThomas Huth } 1097fcf5ef2aSThomas Huth } 1098fcf5ef2aSThomas Huth 10994fbc89edSMark Cave-Ayland #define VMUL_DO_EVN(name, mul_element, mul_access, prod_access, cast) \ 1100fcf5ef2aSThomas Huth void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1101fcf5ef2aSThomas Huth { \ 1102fcf5ef2aSThomas Huth int i; \ 1103fcf5ef2aSThomas Huth \ 11044fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 11054fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i) * \ 11064fbc89edSMark Cave-Ayland (cast)b->mul_access(i); \ 1107fcf5ef2aSThomas Huth } \ 1108fcf5ef2aSThomas Huth } 11094fbc89edSMark Cave-Ayland 11104fbc89edSMark Cave-Ayland #define VMUL_DO_ODD(name, mul_element, mul_access, prod_access, cast) \ 11114fbc89edSMark Cave-Ayland void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 
11124fbc89edSMark Cave-Ayland { \ 11134fbc89edSMark Cave-Ayland int i; \ 11144fbc89edSMark Cave-Ayland \ 11154fbc89edSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->mul_element); i += 2) { \ 11164fbc89edSMark Cave-Ayland r->prod_access(i >> 1) = (cast)a->mul_access(i + 1) * \ 11174fbc89edSMark Cave-Ayland (cast)b->mul_access(i + 1); \ 11184fbc89edSMark Cave-Ayland } \ 11194fbc89edSMark Cave-Ayland } 11204fbc89edSMark Cave-Ayland 11214fbc89edSMark Cave-Ayland #define VMUL(suffix, mul_element, mul_access, prod_access, cast) \ 11224fbc89edSMark Cave-Ayland VMUL_DO_EVN(mule##suffix, mul_element, mul_access, prod_access, cast) \ 11234fbc89edSMark Cave-Ayland VMUL_DO_ODD(mulo##suffix, mul_element, mul_access, prod_access, cast) 11244fbc89edSMark Cave-Ayland VMUL(sb, s8, VsrSB, VsrSH, int16_t) 11254fbc89edSMark Cave-Ayland VMUL(sh, s16, VsrSH, VsrSW, int32_t) 11264fbc89edSMark Cave-Ayland VMUL(sw, s32, VsrSW, VsrSD, int64_t) 11274fbc89edSMark Cave-Ayland VMUL(ub, u8, VsrB, VsrH, uint16_t) 11284fbc89edSMark Cave-Ayland VMUL(uh, u16, VsrH, VsrW, uint32_t) 11294fbc89edSMark Cave-Ayland VMUL(uw, u32, VsrW, VsrD, uint64_t) 11304fbc89edSMark Cave-Ayland #undef VMUL_DO_EVN 11314fbc89edSMark Cave-Ayland #undef VMUL_DO_ODD 1132fcf5ef2aSThomas Huth #undef VMUL 1133fcf5ef2aSThomas Huth 1134fcf5ef2aSThomas Huth void helper_vperm(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1135fcf5ef2aSThomas Huth ppc_avr_t *c) 1136fcf5ef2aSThomas Huth { 1137fcf5ef2aSThomas Huth ppc_avr_t result; 1138fcf5ef2aSThomas Huth int i; 1139fcf5ef2aSThomas Huth 1140fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1141fcf5ef2aSThomas Huth int s = c->u8[i] & 0x1f; 1142fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1143fcf5ef2aSThomas Huth int index = s & 0xf; 1144fcf5ef2aSThomas Huth #else 1145fcf5ef2aSThomas Huth int index = 15 - (s & 0xf); 1146fcf5ef2aSThomas Huth #endif 1147fcf5ef2aSThomas Huth 1148fcf5ef2aSThomas Huth if (s & 0x10) { 1149fcf5ef2aSThomas Huth result.u8[i] = 
b->u8[index]; 1150fcf5ef2aSThomas Huth } else { 1151fcf5ef2aSThomas Huth result.u8[i] = a->u8[index]; 1152fcf5ef2aSThomas Huth } 1153fcf5ef2aSThomas Huth } 1154fcf5ef2aSThomas Huth *r = result; 1155fcf5ef2aSThomas Huth } 1156fcf5ef2aSThomas Huth 1157fcf5ef2aSThomas Huth void helper_vpermr(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1158fcf5ef2aSThomas Huth ppc_avr_t *c) 1159fcf5ef2aSThomas Huth { 1160fcf5ef2aSThomas Huth ppc_avr_t result; 1161fcf5ef2aSThomas Huth int i; 1162fcf5ef2aSThomas Huth 1163fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1164fcf5ef2aSThomas Huth int s = c->u8[i] & 0x1f; 1165fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1166fcf5ef2aSThomas Huth int index = 15 - (s & 0xf); 1167fcf5ef2aSThomas Huth #else 1168fcf5ef2aSThomas Huth int index = s & 0xf; 1169fcf5ef2aSThomas Huth #endif 1170fcf5ef2aSThomas Huth 1171fcf5ef2aSThomas Huth if (s & 0x10) { 1172fcf5ef2aSThomas Huth result.u8[i] = a->u8[index]; 1173fcf5ef2aSThomas Huth } else { 1174fcf5ef2aSThomas Huth result.u8[i] = b->u8[index]; 1175fcf5ef2aSThomas Huth } 1176fcf5ef2aSThomas Huth } 1177fcf5ef2aSThomas Huth *r = result; 1178fcf5ef2aSThomas Huth } 1179fcf5ef2aSThomas Huth 1180fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1181fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[(i)]) 1182fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (i) 1183fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) != 0) 1184fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) (extract64((avr)->u64[i], index, 1)) 1185fcf5ef2aSThomas Huth #else 1186fcf5ef2aSThomas Huth #define VBPERMQ_INDEX(avr, i) ((avr)->u8[15-(i)]) 1187fcf5ef2aSThomas Huth #define VBPERMD_INDEX(i) (1 - i) 1188fcf5ef2aSThomas Huth #define VBPERMQ_DW(index) (((index) & 0x40) == 0) 1189fcf5ef2aSThomas Huth #define EXTRACT_BIT(avr, i, index) \ 1190fcf5ef2aSThomas Huth (extract64((avr)->u64[1 - i], 63 - index, 1)) 1191fcf5ef2aSThomas Huth #endif 1192fcf5ef2aSThomas Huth 1193fcf5ef2aSThomas 
Huth void helper_vbpermd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1194fcf5ef2aSThomas Huth { 1195fcf5ef2aSThomas Huth int i, j; 1196fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 1197fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1198fcf5ef2aSThomas Huth for (j = 0; j < 8; j++) { 1199fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, (i * 8) + j); 1200fcf5ef2aSThomas Huth if (index < 64 && EXTRACT_BIT(a, i, index)) { 1201fcf5ef2aSThomas Huth result.u64[VBPERMD_INDEX(i)] |= (0x80 >> j); 1202fcf5ef2aSThomas Huth } 1203fcf5ef2aSThomas Huth } 1204fcf5ef2aSThomas Huth } 1205fcf5ef2aSThomas Huth *r = result; 1206fcf5ef2aSThomas Huth } 1207fcf5ef2aSThomas Huth 1208fcf5ef2aSThomas Huth void helper_vbpermq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1209fcf5ef2aSThomas Huth { 1210fcf5ef2aSThomas Huth int i; 1211fcf5ef2aSThomas Huth uint64_t perm = 0; 1212fcf5ef2aSThomas Huth 1213fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1214fcf5ef2aSThomas Huth int index = VBPERMQ_INDEX(b, i); 1215fcf5ef2aSThomas Huth 1216fcf5ef2aSThomas Huth if (index < 128) { 1217fcf5ef2aSThomas Huth uint64_t mask = (1ull << (63-(index & 0x3F))); 1218fcf5ef2aSThomas Huth if (a->u64[VBPERMQ_DW(index)] & mask) { 1219fcf5ef2aSThomas Huth perm |= (0x8000 >> i); 1220fcf5ef2aSThomas Huth } 1221fcf5ef2aSThomas Huth } 1222fcf5ef2aSThomas Huth } 1223fcf5ef2aSThomas Huth 12243c385a93SMark Cave-Ayland r->VsrD(0) = perm; 12253c385a93SMark Cave-Ayland r->VsrD(1) = 0; 1226fcf5ef2aSThomas Huth } 1227fcf5ef2aSThomas Huth 1228fcf5ef2aSThomas Huth #undef VBPERMQ_INDEX 1229fcf5ef2aSThomas Huth #undef VBPERMQ_DW 1230fcf5ef2aSThomas Huth 1231fcf5ef2aSThomas Huth static const uint64_t VGBBD_MASKS[256] = { 1232fcf5ef2aSThomas Huth 0x0000000000000000ull, /* 00 */ 1233fcf5ef2aSThomas Huth 0x0000000000000080ull, /* 01 */ 1234fcf5ef2aSThomas Huth 0x0000000000008000ull, /* 02 */ 1235fcf5ef2aSThomas Huth 0x0000000000008080ull, /* 03 */ 1236fcf5ef2aSThomas Huth 0x0000000000800000ull, /* 04 */ 
1237fcf5ef2aSThomas Huth 0x0000000000800080ull, /* 05 */ 1238fcf5ef2aSThomas Huth 0x0000000000808000ull, /* 06 */ 1239fcf5ef2aSThomas Huth 0x0000000000808080ull, /* 07 */ 1240fcf5ef2aSThomas Huth 0x0000000080000000ull, /* 08 */ 1241fcf5ef2aSThomas Huth 0x0000000080000080ull, /* 09 */ 1242fcf5ef2aSThomas Huth 0x0000000080008000ull, /* 0A */ 1243fcf5ef2aSThomas Huth 0x0000000080008080ull, /* 0B */ 1244fcf5ef2aSThomas Huth 0x0000000080800000ull, /* 0C */ 1245fcf5ef2aSThomas Huth 0x0000000080800080ull, /* 0D */ 1246fcf5ef2aSThomas Huth 0x0000000080808000ull, /* 0E */ 1247fcf5ef2aSThomas Huth 0x0000000080808080ull, /* 0F */ 1248fcf5ef2aSThomas Huth 0x0000008000000000ull, /* 10 */ 1249fcf5ef2aSThomas Huth 0x0000008000000080ull, /* 11 */ 1250fcf5ef2aSThomas Huth 0x0000008000008000ull, /* 12 */ 1251fcf5ef2aSThomas Huth 0x0000008000008080ull, /* 13 */ 1252fcf5ef2aSThomas Huth 0x0000008000800000ull, /* 14 */ 1253fcf5ef2aSThomas Huth 0x0000008000800080ull, /* 15 */ 1254fcf5ef2aSThomas Huth 0x0000008000808000ull, /* 16 */ 1255fcf5ef2aSThomas Huth 0x0000008000808080ull, /* 17 */ 1256fcf5ef2aSThomas Huth 0x0000008080000000ull, /* 18 */ 1257fcf5ef2aSThomas Huth 0x0000008080000080ull, /* 19 */ 1258fcf5ef2aSThomas Huth 0x0000008080008000ull, /* 1A */ 1259fcf5ef2aSThomas Huth 0x0000008080008080ull, /* 1B */ 1260fcf5ef2aSThomas Huth 0x0000008080800000ull, /* 1C */ 1261fcf5ef2aSThomas Huth 0x0000008080800080ull, /* 1D */ 1262fcf5ef2aSThomas Huth 0x0000008080808000ull, /* 1E */ 1263fcf5ef2aSThomas Huth 0x0000008080808080ull, /* 1F */ 1264fcf5ef2aSThomas Huth 0x0000800000000000ull, /* 20 */ 1265fcf5ef2aSThomas Huth 0x0000800000000080ull, /* 21 */ 1266fcf5ef2aSThomas Huth 0x0000800000008000ull, /* 22 */ 1267fcf5ef2aSThomas Huth 0x0000800000008080ull, /* 23 */ 1268fcf5ef2aSThomas Huth 0x0000800000800000ull, /* 24 */ 1269fcf5ef2aSThomas Huth 0x0000800000800080ull, /* 25 */ 1270fcf5ef2aSThomas Huth 0x0000800000808000ull, /* 26 */ 1271fcf5ef2aSThomas Huth 0x0000800000808080ull, /* 27 */ 
1272fcf5ef2aSThomas Huth 0x0000800080000000ull, /* 28 */ 1273fcf5ef2aSThomas Huth 0x0000800080000080ull, /* 29 */ 1274fcf5ef2aSThomas Huth 0x0000800080008000ull, /* 2A */ 1275fcf5ef2aSThomas Huth 0x0000800080008080ull, /* 2B */ 1276fcf5ef2aSThomas Huth 0x0000800080800000ull, /* 2C */ 1277fcf5ef2aSThomas Huth 0x0000800080800080ull, /* 2D */ 1278fcf5ef2aSThomas Huth 0x0000800080808000ull, /* 2E */ 1279fcf5ef2aSThomas Huth 0x0000800080808080ull, /* 2F */ 1280fcf5ef2aSThomas Huth 0x0000808000000000ull, /* 30 */ 1281fcf5ef2aSThomas Huth 0x0000808000000080ull, /* 31 */ 1282fcf5ef2aSThomas Huth 0x0000808000008000ull, /* 32 */ 1283fcf5ef2aSThomas Huth 0x0000808000008080ull, /* 33 */ 1284fcf5ef2aSThomas Huth 0x0000808000800000ull, /* 34 */ 1285fcf5ef2aSThomas Huth 0x0000808000800080ull, /* 35 */ 1286fcf5ef2aSThomas Huth 0x0000808000808000ull, /* 36 */ 1287fcf5ef2aSThomas Huth 0x0000808000808080ull, /* 37 */ 1288fcf5ef2aSThomas Huth 0x0000808080000000ull, /* 38 */ 1289fcf5ef2aSThomas Huth 0x0000808080000080ull, /* 39 */ 1290fcf5ef2aSThomas Huth 0x0000808080008000ull, /* 3A */ 1291fcf5ef2aSThomas Huth 0x0000808080008080ull, /* 3B */ 1292fcf5ef2aSThomas Huth 0x0000808080800000ull, /* 3C */ 1293fcf5ef2aSThomas Huth 0x0000808080800080ull, /* 3D */ 1294fcf5ef2aSThomas Huth 0x0000808080808000ull, /* 3E */ 1295fcf5ef2aSThomas Huth 0x0000808080808080ull, /* 3F */ 1296fcf5ef2aSThomas Huth 0x0080000000000000ull, /* 40 */ 1297fcf5ef2aSThomas Huth 0x0080000000000080ull, /* 41 */ 1298fcf5ef2aSThomas Huth 0x0080000000008000ull, /* 42 */ 1299fcf5ef2aSThomas Huth 0x0080000000008080ull, /* 43 */ 1300fcf5ef2aSThomas Huth 0x0080000000800000ull, /* 44 */ 1301fcf5ef2aSThomas Huth 0x0080000000800080ull, /* 45 */ 1302fcf5ef2aSThomas Huth 0x0080000000808000ull, /* 46 */ 1303fcf5ef2aSThomas Huth 0x0080000000808080ull, /* 47 */ 1304fcf5ef2aSThomas Huth 0x0080000080000000ull, /* 48 */ 1305fcf5ef2aSThomas Huth 0x0080000080000080ull, /* 49 */ 1306fcf5ef2aSThomas Huth 0x0080000080008000ull, /* 4A */ 
1307fcf5ef2aSThomas Huth 0x0080000080008080ull, /* 4B */ 1308fcf5ef2aSThomas Huth 0x0080000080800000ull, /* 4C */ 1309fcf5ef2aSThomas Huth 0x0080000080800080ull, /* 4D */ 1310fcf5ef2aSThomas Huth 0x0080000080808000ull, /* 4E */ 1311fcf5ef2aSThomas Huth 0x0080000080808080ull, /* 4F */ 1312fcf5ef2aSThomas Huth 0x0080008000000000ull, /* 50 */ 1313fcf5ef2aSThomas Huth 0x0080008000000080ull, /* 51 */ 1314fcf5ef2aSThomas Huth 0x0080008000008000ull, /* 52 */ 1315fcf5ef2aSThomas Huth 0x0080008000008080ull, /* 53 */ 1316fcf5ef2aSThomas Huth 0x0080008000800000ull, /* 54 */ 1317fcf5ef2aSThomas Huth 0x0080008000800080ull, /* 55 */ 1318fcf5ef2aSThomas Huth 0x0080008000808000ull, /* 56 */ 1319fcf5ef2aSThomas Huth 0x0080008000808080ull, /* 57 */ 1320fcf5ef2aSThomas Huth 0x0080008080000000ull, /* 58 */ 1321fcf5ef2aSThomas Huth 0x0080008080000080ull, /* 59 */ 1322fcf5ef2aSThomas Huth 0x0080008080008000ull, /* 5A */ 1323fcf5ef2aSThomas Huth 0x0080008080008080ull, /* 5B */ 1324fcf5ef2aSThomas Huth 0x0080008080800000ull, /* 5C */ 1325fcf5ef2aSThomas Huth 0x0080008080800080ull, /* 5D */ 1326fcf5ef2aSThomas Huth 0x0080008080808000ull, /* 5E */ 1327fcf5ef2aSThomas Huth 0x0080008080808080ull, /* 5F */ 1328fcf5ef2aSThomas Huth 0x0080800000000000ull, /* 60 */ 1329fcf5ef2aSThomas Huth 0x0080800000000080ull, /* 61 */ 1330fcf5ef2aSThomas Huth 0x0080800000008000ull, /* 62 */ 1331fcf5ef2aSThomas Huth 0x0080800000008080ull, /* 63 */ 1332fcf5ef2aSThomas Huth 0x0080800000800000ull, /* 64 */ 1333fcf5ef2aSThomas Huth 0x0080800000800080ull, /* 65 */ 1334fcf5ef2aSThomas Huth 0x0080800000808000ull, /* 66 */ 1335fcf5ef2aSThomas Huth 0x0080800000808080ull, /* 67 */ 1336fcf5ef2aSThomas Huth 0x0080800080000000ull, /* 68 */ 1337fcf5ef2aSThomas Huth 0x0080800080000080ull, /* 69 */ 1338fcf5ef2aSThomas Huth 0x0080800080008000ull, /* 6A */ 1339fcf5ef2aSThomas Huth 0x0080800080008080ull, /* 6B */ 1340fcf5ef2aSThomas Huth 0x0080800080800000ull, /* 6C */ 1341fcf5ef2aSThomas Huth 0x0080800080800080ull, /* 6D */ 
1342fcf5ef2aSThomas Huth 0x0080800080808000ull, /* 6E */ 1343fcf5ef2aSThomas Huth 0x0080800080808080ull, /* 6F */ 1344fcf5ef2aSThomas Huth 0x0080808000000000ull, /* 70 */ 1345fcf5ef2aSThomas Huth 0x0080808000000080ull, /* 71 */ 1346fcf5ef2aSThomas Huth 0x0080808000008000ull, /* 72 */ 1347fcf5ef2aSThomas Huth 0x0080808000008080ull, /* 73 */ 1348fcf5ef2aSThomas Huth 0x0080808000800000ull, /* 74 */ 1349fcf5ef2aSThomas Huth 0x0080808000800080ull, /* 75 */ 1350fcf5ef2aSThomas Huth 0x0080808000808000ull, /* 76 */ 1351fcf5ef2aSThomas Huth 0x0080808000808080ull, /* 77 */ 1352fcf5ef2aSThomas Huth 0x0080808080000000ull, /* 78 */ 1353fcf5ef2aSThomas Huth 0x0080808080000080ull, /* 79 */ 1354fcf5ef2aSThomas Huth 0x0080808080008000ull, /* 7A */ 1355fcf5ef2aSThomas Huth 0x0080808080008080ull, /* 7B */ 1356fcf5ef2aSThomas Huth 0x0080808080800000ull, /* 7C */ 1357fcf5ef2aSThomas Huth 0x0080808080800080ull, /* 7D */ 1358fcf5ef2aSThomas Huth 0x0080808080808000ull, /* 7E */ 1359fcf5ef2aSThomas Huth 0x0080808080808080ull, /* 7F */ 1360fcf5ef2aSThomas Huth 0x8000000000000000ull, /* 80 */ 1361fcf5ef2aSThomas Huth 0x8000000000000080ull, /* 81 */ 1362fcf5ef2aSThomas Huth 0x8000000000008000ull, /* 82 */ 1363fcf5ef2aSThomas Huth 0x8000000000008080ull, /* 83 */ 1364fcf5ef2aSThomas Huth 0x8000000000800000ull, /* 84 */ 1365fcf5ef2aSThomas Huth 0x8000000000800080ull, /* 85 */ 1366fcf5ef2aSThomas Huth 0x8000000000808000ull, /* 86 */ 1367fcf5ef2aSThomas Huth 0x8000000000808080ull, /* 87 */ 1368fcf5ef2aSThomas Huth 0x8000000080000000ull, /* 88 */ 1369fcf5ef2aSThomas Huth 0x8000000080000080ull, /* 89 */ 1370fcf5ef2aSThomas Huth 0x8000000080008000ull, /* 8A */ 1371fcf5ef2aSThomas Huth 0x8000000080008080ull, /* 8B */ 1372fcf5ef2aSThomas Huth 0x8000000080800000ull, /* 8C */ 1373fcf5ef2aSThomas Huth 0x8000000080800080ull, /* 8D */ 1374fcf5ef2aSThomas Huth 0x8000000080808000ull, /* 8E */ 1375fcf5ef2aSThomas Huth 0x8000000080808080ull, /* 8F */ 1376fcf5ef2aSThomas Huth 0x8000008000000000ull, /* 90 */ 
1377fcf5ef2aSThomas Huth 0x8000008000000080ull, /* 91 */ 1378fcf5ef2aSThomas Huth 0x8000008000008000ull, /* 92 */ 1379fcf5ef2aSThomas Huth 0x8000008000008080ull, /* 93 */ 1380fcf5ef2aSThomas Huth 0x8000008000800000ull, /* 94 */ 1381fcf5ef2aSThomas Huth 0x8000008000800080ull, /* 95 */ 1382fcf5ef2aSThomas Huth 0x8000008000808000ull, /* 96 */ 1383fcf5ef2aSThomas Huth 0x8000008000808080ull, /* 97 */ 1384fcf5ef2aSThomas Huth 0x8000008080000000ull, /* 98 */ 1385fcf5ef2aSThomas Huth 0x8000008080000080ull, /* 99 */ 1386fcf5ef2aSThomas Huth 0x8000008080008000ull, /* 9A */ 1387fcf5ef2aSThomas Huth 0x8000008080008080ull, /* 9B */ 1388fcf5ef2aSThomas Huth 0x8000008080800000ull, /* 9C */ 1389fcf5ef2aSThomas Huth 0x8000008080800080ull, /* 9D */ 1390fcf5ef2aSThomas Huth 0x8000008080808000ull, /* 9E */ 1391fcf5ef2aSThomas Huth 0x8000008080808080ull, /* 9F */ 1392fcf5ef2aSThomas Huth 0x8000800000000000ull, /* A0 */ 1393fcf5ef2aSThomas Huth 0x8000800000000080ull, /* A1 */ 1394fcf5ef2aSThomas Huth 0x8000800000008000ull, /* A2 */ 1395fcf5ef2aSThomas Huth 0x8000800000008080ull, /* A3 */ 1396fcf5ef2aSThomas Huth 0x8000800000800000ull, /* A4 */ 1397fcf5ef2aSThomas Huth 0x8000800000800080ull, /* A5 */ 1398fcf5ef2aSThomas Huth 0x8000800000808000ull, /* A6 */ 1399fcf5ef2aSThomas Huth 0x8000800000808080ull, /* A7 */ 1400fcf5ef2aSThomas Huth 0x8000800080000000ull, /* A8 */ 1401fcf5ef2aSThomas Huth 0x8000800080000080ull, /* A9 */ 1402fcf5ef2aSThomas Huth 0x8000800080008000ull, /* AA */ 1403fcf5ef2aSThomas Huth 0x8000800080008080ull, /* AB */ 1404fcf5ef2aSThomas Huth 0x8000800080800000ull, /* AC */ 1405fcf5ef2aSThomas Huth 0x8000800080800080ull, /* AD */ 1406fcf5ef2aSThomas Huth 0x8000800080808000ull, /* AE */ 1407fcf5ef2aSThomas Huth 0x8000800080808080ull, /* AF */ 1408fcf5ef2aSThomas Huth 0x8000808000000000ull, /* B0 */ 1409fcf5ef2aSThomas Huth 0x8000808000000080ull, /* B1 */ 1410fcf5ef2aSThomas Huth 0x8000808000008000ull, /* B2 */ 1411fcf5ef2aSThomas Huth 0x8000808000008080ull, /* B3 */ 
1412fcf5ef2aSThomas Huth 0x8000808000800000ull, /* B4 */ 1413fcf5ef2aSThomas Huth 0x8000808000800080ull, /* B5 */ 1414fcf5ef2aSThomas Huth 0x8000808000808000ull, /* B6 */ 1415fcf5ef2aSThomas Huth 0x8000808000808080ull, /* B7 */ 1416fcf5ef2aSThomas Huth 0x8000808080000000ull, /* B8 */ 1417fcf5ef2aSThomas Huth 0x8000808080000080ull, /* B9 */ 1418fcf5ef2aSThomas Huth 0x8000808080008000ull, /* BA */ 1419fcf5ef2aSThomas Huth 0x8000808080008080ull, /* BB */ 1420fcf5ef2aSThomas Huth 0x8000808080800000ull, /* BC */ 1421fcf5ef2aSThomas Huth 0x8000808080800080ull, /* BD */ 1422fcf5ef2aSThomas Huth 0x8000808080808000ull, /* BE */ 1423fcf5ef2aSThomas Huth 0x8000808080808080ull, /* BF */ 1424fcf5ef2aSThomas Huth 0x8080000000000000ull, /* C0 */ 1425fcf5ef2aSThomas Huth 0x8080000000000080ull, /* C1 */ 1426fcf5ef2aSThomas Huth 0x8080000000008000ull, /* C2 */ 1427fcf5ef2aSThomas Huth 0x8080000000008080ull, /* C3 */ 1428fcf5ef2aSThomas Huth 0x8080000000800000ull, /* C4 */ 1429fcf5ef2aSThomas Huth 0x8080000000800080ull, /* C5 */ 1430fcf5ef2aSThomas Huth 0x8080000000808000ull, /* C6 */ 1431fcf5ef2aSThomas Huth 0x8080000000808080ull, /* C7 */ 1432fcf5ef2aSThomas Huth 0x8080000080000000ull, /* C8 */ 1433fcf5ef2aSThomas Huth 0x8080000080000080ull, /* C9 */ 1434fcf5ef2aSThomas Huth 0x8080000080008000ull, /* CA */ 1435fcf5ef2aSThomas Huth 0x8080000080008080ull, /* CB */ 1436fcf5ef2aSThomas Huth 0x8080000080800000ull, /* CC */ 1437fcf5ef2aSThomas Huth 0x8080000080800080ull, /* CD */ 1438fcf5ef2aSThomas Huth 0x8080000080808000ull, /* CE */ 1439fcf5ef2aSThomas Huth 0x8080000080808080ull, /* CF */ 1440fcf5ef2aSThomas Huth 0x8080008000000000ull, /* D0 */ 1441fcf5ef2aSThomas Huth 0x8080008000000080ull, /* D1 */ 1442fcf5ef2aSThomas Huth 0x8080008000008000ull, /* D2 */ 1443fcf5ef2aSThomas Huth 0x8080008000008080ull, /* D3 */ 1444fcf5ef2aSThomas Huth 0x8080008000800000ull, /* D4 */ 1445fcf5ef2aSThomas Huth 0x8080008000800080ull, /* D5 */ 1446fcf5ef2aSThomas Huth 0x8080008000808000ull, /* D6 */ 
1447fcf5ef2aSThomas Huth 0x8080008000808080ull, /* D7 */ 1448fcf5ef2aSThomas Huth 0x8080008080000000ull, /* D8 */ 1449fcf5ef2aSThomas Huth 0x8080008080000080ull, /* D9 */ 1450fcf5ef2aSThomas Huth 0x8080008080008000ull, /* DA */ 1451fcf5ef2aSThomas Huth 0x8080008080008080ull, /* DB */ 1452fcf5ef2aSThomas Huth 0x8080008080800000ull, /* DC */ 1453fcf5ef2aSThomas Huth 0x8080008080800080ull, /* DD */ 1454fcf5ef2aSThomas Huth 0x8080008080808000ull, /* DE */ 1455fcf5ef2aSThomas Huth 0x8080008080808080ull, /* DF */ 1456fcf5ef2aSThomas Huth 0x8080800000000000ull, /* E0 */ 1457fcf5ef2aSThomas Huth 0x8080800000000080ull, /* E1 */ 1458fcf5ef2aSThomas Huth 0x8080800000008000ull, /* E2 */ 1459fcf5ef2aSThomas Huth 0x8080800000008080ull, /* E3 */ 1460fcf5ef2aSThomas Huth 0x8080800000800000ull, /* E4 */ 1461fcf5ef2aSThomas Huth 0x8080800000800080ull, /* E5 */ 1462fcf5ef2aSThomas Huth 0x8080800000808000ull, /* E6 */ 1463fcf5ef2aSThomas Huth 0x8080800000808080ull, /* E7 */ 1464fcf5ef2aSThomas Huth 0x8080800080000000ull, /* E8 */ 1465fcf5ef2aSThomas Huth 0x8080800080000080ull, /* E9 */ 1466fcf5ef2aSThomas Huth 0x8080800080008000ull, /* EA */ 1467fcf5ef2aSThomas Huth 0x8080800080008080ull, /* EB */ 1468fcf5ef2aSThomas Huth 0x8080800080800000ull, /* EC */ 1469fcf5ef2aSThomas Huth 0x8080800080800080ull, /* ED */ 1470fcf5ef2aSThomas Huth 0x8080800080808000ull, /* EE */ 1471fcf5ef2aSThomas Huth 0x8080800080808080ull, /* EF */ 1472fcf5ef2aSThomas Huth 0x8080808000000000ull, /* F0 */ 1473fcf5ef2aSThomas Huth 0x8080808000000080ull, /* F1 */ 1474fcf5ef2aSThomas Huth 0x8080808000008000ull, /* F2 */ 1475fcf5ef2aSThomas Huth 0x8080808000008080ull, /* F3 */ 1476fcf5ef2aSThomas Huth 0x8080808000800000ull, /* F4 */ 1477fcf5ef2aSThomas Huth 0x8080808000800080ull, /* F5 */ 1478fcf5ef2aSThomas Huth 0x8080808000808000ull, /* F6 */ 1479fcf5ef2aSThomas Huth 0x8080808000808080ull, /* F7 */ 1480fcf5ef2aSThomas Huth 0x8080808080000000ull, /* F8 */ 1481fcf5ef2aSThomas Huth 0x8080808080000080ull, /* F9 */ 
1482fcf5ef2aSThomas Huth 0x8080808080008000ull, /* FA */ 1483fcf5ef2aSThomas Huth 0x8080808080008080ull, /* FB */ 1484fcf5ef2aSThomas Huth 0x8080808080800000ull, /* FC */ 1485fcf5ef2aSThomas Huth 0x8080808080800080ull, /* FD */ 1486fcf5ef2aSThomas Huth 0x8080808080808000ull, /* FE */ 1487fcf5ef2aSThomas Huth 0x8080808080808080ull, /* FF */ 1488fcf5ef2aSThomas Huth }; 1489fcf5ef2aSThomas Huth 1490fcf5ef2aSThomas Huth void helper_vgbbd(ppc_avr_t *r, ppc_avr_t *b) 1491fcf5ef2aSThomas Huth { 1492fcf5ef2aSThomas Huth int i; 1493fcf5ef2aSThomas Huth uint64_t t[2] = { 0, 0 }; 1494fcf5ef2aSThomas Huth 1495fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 1496fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1497fcf5ef2aSThomas Huth t[i>>3] |= VGBBD_MASKS[b->u8[i]] >> (i & 7); 1498fcf5ef2aSThomas Huth #else 1499fcf5ef2aSThomas Huth t[i>>3] |= VGBBD_MASKS[b->u8[i]] >> (7-(i & 7)); 1500fcf5ef2aSThomas Huth #endif 1501fcf5ef2aSThomas Huth } 1502fcf5ef2aSThomas Huth 1503fcf5ef2aSThomas Huth r->u64[0] = t[0]; 1504fcf5ef2aSThomas Huth r->u64[1] = t[1]; 1505fcf5ef2aSThomas Huth } 1506fcf5ef2aSThomas Huth 1507fcf5ef2aSThomas Huth #define PMSUM(name, srcfld, trgfld, trgtyp) \ 1508fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1509fcf5ef2aSThomas Huth { \ 1510fcf5ef2aSThomas Huth int i, j; \ 1511fcf5ef2aSThomas Huth trgtyp prod[sizeof(ppc_avr_t)/sizeof(a->srcfld[0])]; \ 1512fcf5ef2aSThomas Huth \ 1513fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, srcfld) { \ 1514fcf5ef2aSThomas Huth prod[i] = 0; \ 1515fcf5ef2aSThomas Huth for (j = 0; j < sizeof(a->srcfld[0]) * 8; j++) { \ 1516fcf5ef2aSThomas Huth if (a->srcfld[i] & (1ull<<j)) { \ 1517fcf5ef2aSThomas Huth prod[i] ^= ((trgtyp)b->srcfld[i] << j); \ 1518fcf5ef2aSThomas Huth } \ 1519fcf5ef2aSThomas Huth } \ 1520fcf5ef2aSThomas Huth } \ 1521fcf5ef2aSThomas Huth \ 1522fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, trgfld) { \ 1523fcf5ef2aSThomas Huth r->trgfld[i] = prod[2*i] ^ prod[2*i+1]; \ 
1524fcf5ef2aSThomas Huth } \ 1525fcf5ef2aSThomas Huth } 1526fcf5ef2aSThomas Huth 1527fcf5ef2aSThomas Huth PMSUM(vpmsumb, u8, u16, uint16_t) 1528fcf5ef2aSThomas Huth PMSUM(vpmsumh, u16, u32, uint32_t) 1529fcf5ef2aSThomas Huth PMSUM(vpmsumw, u32, u64, uint64_t) 1530fcf5ef2aSThomas Huth 1531fcf5ef2aSThomas Huth void helper_vpmsumd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1532fcf5ef2aSThomas Huth { 1533fcf5ef2aSThomas Huth 1534fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 1535fcf5ef2aSThomas Huth int i, j; 1536fcf5ef2aSThomas Huth __uint128_t prod[2]; 1537fcf5ef2aSThomas Huth 1538fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1539fcf5ef2aSThomas Huth prod[i] = 0; 1540fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1541fcf5ef2aSThomas Huth if (a->u64[i] & (1ull<<j)) { 1542fcf5ef2aSThomas Huth prod[i] ^= (((__uint128_t)b->u64[i]) << j); 1543fcf5ef2aSThomas Huth } 1544fcf5ef2aSThomas Huth } 1545fcf5ef2aSThomas Huth } 1546fcf5ef2aSThomas Huth 1547fcf5ef2aSThomas Huth r->u128 = prod[0] ^ prod[1]; 1548fcf5ef2aSThomas Huth 1549fcf5ef2aSThomas Huth #else 1550fcf5ef2aSThomas Huth int i, j; 1551fcf5ef2aSThomas Huth ppc_avr_t prod[2]; 1552fcf5ef2aSThomas Huth 1553fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 15543c385a93SMark Cave-Ayland prod[i].VsrD(1) = prod[i].VsrD(0) = 0; 1555fcf5ef2aSThomas Huth for (j = 0; j < 64; j++) { 1556fcf5ef2aSThomas Huth if (a->u64[i] & (1ull<<j)) { 1557fcf5ef2aSThomas Huth ppc_avr_t bshift; 1558fcf5ef2aSThomas Huth if (j == 0) { 15593c385a93SMark Cave-Ayland bshift.VsrD(0) = 0; 15603c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i]; 1561fcf5ef2aSThomas Huth } else { 15623c385a93SMark Cave-Ayland bshift.VsrD(0) = b->u64[i] >> (64 - j); 15633c385a93SMark Cave-Ayland bshift.VsrD(1) = b->u64[i] << j; 1564fcf5ef2aSThomas Huth } 15653c385a93SMark Cave-Ayland prod[i].VsrD(1) ^= bshift.VsrD(1); 15663c385a93SMark Cave-Ayland prod[i].VsrD(0) ^= bshift.VsrD(0); 1567fcf5ef2aSThomas Huth } 1568fcf5ef2aSThomas Huth } 1569fcf5ef2aSThomas Huth } 
1570fcf5ef2aSThomas Huth 15713c385a93SMark Cave-Ayland r->VsrD(1) = prod[0].VsrD(1) ^ prod[1].VsrD(1); 15723c385a93SMark Cave-Ayland r->VsrD(0) = prod[0].VsrD(0) ^ prod[1].VsrD(0); 1573fcf5ef2aSThomas Huth #endif 1574fcf5ef2aSThomas Huth } 1575fcf5ef2aSThomas Huth 1576fcf5ef2aSThomas Huth 1577fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1578fcf5ef2aSThomas Huth #define PKBIG 1 1579fcf5ef2aSThomas Huth #else 1580fcf5ef2aSThomas Huth #define PKBIG 0 1581fcf5ef2aSThomas Huth #endif 1582fcf5ef2aSThomas Huth void helper_vpkpx(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1583fcf5ef2aSThomas Huth { 1584fcf5ef2aSThomas Huth int i, j; 1585fcf5ef2aSThomas Huth ppc_avr_t result; 1586fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1587fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { a, b }; 1588fcf5ef2aSThomas Huth #else 1589fcf5ef2aSThomas Huth const ppc_avr_t *x[2] = { b, a }; 1590fcf5ef2aSThomas Huth #endif 1591fcf5ef2aSThomas Huth 1592fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u64) { 1593fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(j, u32) { 1594fcf5ef2aSThomas Huth uint32_t e = x[i]->u32[j]; 1595fcf5ef2aSThomas Huth 1596fcf5ef2aSThomas Huth result.u16[4*i+j] = (((e >> 9) & 0xfc00) | 1597fcf5ef2aSThomas Huth ((e >> 6) & 0x3e0) | 1598fcf5ef2aSThomas Huth ((e >> 3) & 0x1f)); 1599fcf5ef2aSThomas Huth } 1600fcf5ef2aSThomas Huth } 1601fcf5ef2aSThomas Huth *r = result; 1602fcf5ef2aSThomas Huth } 1603fcf5ef2aSThomas Huth 1604fcf5ef2aSThomas Huth #define VPK(suffix, from, to, cvt, dosat) \ 1605fcf5ef2aSThomas Huth void helper_vpk##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1606fcf5ef2aSThomas Huth ppc_avr_t *a, ppc_avr_t *b) \ 1607fcf5ef2aSThomas Huth { \ 1608fcf5ef2aSThomas Huth int i; \ 1609fcf5ef2aSThomas Huth int sat = 0; \ 1610fcf5ef2aSThomas Huth ppc_avr_t result; \ 1611fcf5ef2aSThomas Huth ppc_avr_t *a0 = PKBIG ? a : b; \ 1612fcf5ef2aSThomas Huth ppc_avr_t *a1 = PKBIG ? 
b : a; \ 1613fcf5ef2aSThomas Huth \ 1614fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, from) { \ 1615fcf5ef2aSThomas Huth result.to[i] = cvt(a0->from[i], &sat); \ 1616fcf5ef2aSThomas Huth result.to[i+ARRAY_SIZE(r->from)] = cvt(a1->from[i], &sat); \ 1617fcf5ef2aSThomas Huth } \ 1618fcf5ef2aSThomas Huth *r = result; \ 1619fcf5ef2aSThomas Huth if (dosat && sat) { \ 1620fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); \ 1621fcf5ef2aSThomas Huth } \ 1622fcf5ef2aSThomas Huth } 1623fcf5ef2aSThomas Huth #define I(x, y) (x) 1624fcf5ef2aSThomas Huth VPK(shss, s16, s8, cvtshsb, 1) 1625fcf5ef2aSThomas Huth VPK(shus, s16, u8, cvtshub, 1) 1626fcf5ef2aSThomas Huth VPK(swss, s32, s16, cvtswsh, 1) 1627fcf5ef2aSThomas Huth VPK(swus, s32, u16, cvtswuh, 1) 1628fcf5ef2aSThomas Huth VPK(sdss, s64, s32, cvtsdsw, 1) 1629fcf5ef2aSThomas Huth VPK(sdus, s64, u32, cvtsduw, 1) 1630fcf5ef2aSThomas Huth VPK(uhus, u16, u8, cvtuhub, 1) 1631fcf5ef2aSThomas Huth VPK(uwus, u32, u16, cvtuwuh, 1) 1632fcf5ef2aSThomas Huth VPK(udus, u64, u32, cvtuduw, 1) 1633fcf5ef2aSThomas Huth VPK(uhum, u16, u8, I, 0) 1634fcf5ef2aSThomas Huth VPK(uwum, u32, u16, I, 0) 1635fcf5ef2aSThomas Huth VPK(udum, u64, u32, I, 0) 1636fcf5ef2aSThomas Huth #undef I 1637fcf5ef2aSThomas Huth #undef VPK 1638fcf5ef2aSThomas Huth #undef PKBIG 1639fcf5ef2aSThomas Huth 1640fcf5ef2aSThomas Huth void helper_vrefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1641fcf5ef2aSThomas Huth { 1642fcf5ef2aSThomas Huth int i; 1643fcf5ef2aSThomas Huth 164405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 164505ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, b->f32[i], &env->vec_status); 1646fcf5ef2aSThomas Huth } 1647fcf5ef2aSThomas Huth } 1648fcf5ef2aSThomas Huth 1649fcf5ef2aSThomas Huth #define VRFI(suffix, rounding) \ 1650fcf5ef2aSThomas Huth void helper_vrfi##suffix(CPUPPCState *env, ppc_avr_t *r, \ 1651fcf5ef2aSThomas Huth ppc_avr_t *b) \ 1652fcf5ef2aSThomas Huth { \ 1653fcf5ef2aSThomas Huth int i; \ 
1654fcf5ef2aSThomas Huth float_status s = env->vec_status; \ 1655fcf5ef2aSThomas Huth \ 1656fcf5ef2aSThomas Huth set_float_rounding_mode(rounding, &s); \ 165705ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { \ 165805ee3e8aSMark Cave-Ayland r->f32[i] = float32_round_to_int (b->f32[i], &s); \ 1659fcf5ef2aSThomas Huth } \ 1660fcf5ef2aSThomas Huth } 1661fcf5ef2aSThomas Huth VRFI(n, float_round_nearest_even) 1662fcf5ef2aSThomas Huth VRFI(m, float_round_down) 1663fcf5ef2aSThomas Huth VRFI(p, float_round_up) 1664fcf5ef2aSThomas Huth VRFI(z, float_round_to_zero) 1665fcf5ef2aSThomas Huth #undef VRFI 1666fcf5ef2aSThomas Huth 1667fcf5ef2aSThomas Huth #define VROTATE(suffix, element, mask) \ 1668fcf5ef2aSThomas Huth void helper_vrl##suffix(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1669fcf5ef2aSThomas Huth { \ 1670fcf5ef2aSThomas Huth int i; \ 1671fcf5ef2aSThomas Huth \ 1672fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1673fcf5ef2aSThomas Huth unsigned int shift = b->element[i] & mask; \ 1674fcf5ef2aSThomas Huth r->element[i] = (a->element[i] << shift) | \ 1675fcf5ef2aSThomas Huth (a->element[i] >> (sizeof(a->element[0]) * 8 - shift)); \ 1676fcf5ef2aSThomas Huth } \ 1677fcf5ef2aSThomas Huth } 1678fcf5ef2aSThomas Huth VROTATE(b, u8, 0x7) 1679fcf5ef2aSThomas Huth VROTATE(h, u16, 0xF) 1680fcf5ef2aSThomas Huth VROTATE(w, u32, 0x1F) 1681fcf5ef2aSThomas Huth VROTATE(d, u64, 0x3F) 1682fcf5ef2aSThomas Huth #undef VROTATE 1683fcf5ef2aSThomas Huth 1684fcf5ef2aSThomas Huth void helper_vrsqrtefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1685fcf5ef2aSThomas Huth { 1686fcf5ef2aSThomas Huth int i; 1687fcf5ef2aSThomas Huth 168805ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 168905ee3e8aSMark Cave-Ayland float32 t = float32_sqrt(b->f32[i], &env->vec_status); 1690fcf5ef2aSThomas Huth 169105ee3e8aSMark Cave-Ayland r->f32[i] = float32_div(float32_one, t, &env->vec_status); 1692fcf5ef2aSThomas Huth } 1693fcf5ef2aSThomas Huth } 
1694fcf5ef2aSThomas Huth 1695fcf5ef2aSThomas Huth #define VRLMI(name, size, element, insert) \ 1696fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1697fcf5ef2aSThomas Huth { \ 1698fcf5ef2aSThomas Huth int i; \ 1699fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1700fcf5ef2aSThomas Huth uint##size##_t src1 = a->element[i]; \ 1701fcf5ef2aSThomas Huth uint##size##_t src2 = b->element[i]; \ 1702fcf5ef2aSThomas Huth uint##size##_t src3 = r->element[i]; \ 1703fcf5ef2aSThomas Huth uint##size##_t begin, end, shift, mask, rot_val; \ 1704fcf5ef2aSThomas Huth \ 1705fcf5ef2aSThomas Huth shift = extract##size(src2, 0, 6); \ 1706fcf5ef2aSThomas Huth end = extract##size(src2, 8, 6); \ 1707fcf5ef2aSThomas Huth begin = extract##size(src2, 16, 6); \ 1708fcf5ef2aSThomas Huth rot_val = rol##size(src1, shift); \ 1709fcf5ef2aSThomas Huth mask = mask_u##size(begin, end); \ 1710fcf5ef2aSThomas Huth if (insert) { \ 1711fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask) | (src3 & ~mask); \ 1712fcf5ef2aSThomas Huth } else { \ 1713fcf5ef2aSThomas Huth r->element[i] = (rot_val & mask); \ 1714fcf5ef2aSThomas Huth } \ 1715fcf5ef2aSThomas Huth } \ 1716fcf5ef2aSThomas Huth } 1717fcf5ef2aSThomas Huth 1718fcf5ef2aSThomas Huth VRLMI(vrldmi, 64, u64, 1); 1719fcf5ef2aSThomas Huth VRLMI(vrlwmi, 32, u32, 1); 1720fcf5ef2aSThomas Huth VRLMI(vrldnm, 64, u64, 0); 1721fcf5ef2aSThomas Huth VRLMI(vrlwnm, 32, u32, 0); 1722fcf5ef2aSThomas Huth 1723fcf5ef2aSThomas Huth void helper_vsel(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, 1724fcf5ef2aSThomas Huth ppc_avr_t *c) 1725fcf5ef2aSThomas Huth { 1726fcf5ef2aSThomas Huth r->u64[0] = (a->u64[0] & ~c->u64[0]) | (b->u64[0] & c->u64[0]); 1727fcf5ef2aSThomas Huth r->u64[1] = (a->u64[1] & ~c->u64[1]) | (b->u64[1] & c->u64[1]); 1728fcf5ef2aSThomas Huth } 1729fcf5ef2aSThomas Huth 1730fcf5ef2aSThomas Huth void helper_vexptefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1731fcf5ef2aSThomas Huth { 
1732fcf5ef2aSThomas Huth int i; 1733fcf5ef2aSThomas Huth 173405ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 173505ee3e8aSMark Cave-Ayland r->f32[i] = float32_exp2(b->f32[i], &env->vec_status); 1736fcf5ef2aSThomas Huth } 1737fcf5ef2aSThomas Huth } 1738fcf5ef2aSThomas Huth 1739fcf5ef2aSThomas Huth void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b) 1740fcf5ef2aSThomas Huth { 1741fcf5ef2aSThomas Huth int i; 1742fcf5ef2aSThomas Huth 174305ee3e8aSMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->f32); i++) { 174405ee3e8aSMark Cave-Ayland r->f32[i] = float32_log2(b->f32[i], &env->vec_status); 1745fcf5ef2aSThomas Huth } 1746fcf5ef2aSThomas Huth } 1747fcf5ef2aSThomas Huth 174860caf221SAvinesh Kumar #if defined(HOST_WORDS_BIGENDIAN) 174960caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 175060caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 175160caf221SAvinesh Kumar { \ 175260caf221SAvinesh Kumar int index; \ 175360caf221SAvinesh Kumar if (left) { \ 175460caf221SAvinesh Kumar index = (a & 0xf) * 8; \ 175560caf221SAvinesh Kumar } else { \ 175660caf221SAvinesh Kumar index = ((15 - (a & 0xf) + 1) * 8) - size; \ 175760caf221SAvinesh Kumar } \ 175860caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 175960caf221SAvinesh Kumar MAKE_64BIT_MASK(0, size); \ 176060caf221SAvinesh Kumar } 176160caf221SAvinesh Kumar #else 176260caf221SAvinesh Kumar #define VEXTU_X_DO(name, size, left) \ 176360caf221SAvinesh Kumar target_ulong glue(helper_, name)(target_ulong a, ppc_avr_t *b) \ 176460caf221SAvinesh Kumar { \ 176560caf221SAvinesh Kumar int index; \ 176660caf221SAvinesh Kumar if (left) { \ 176760caf221SAvinesh Kumar index = ((15 - (a & 0xf) + 1) * 8) - size; \ 176860caf221SAvinesh Kumar } else { \ 176960caf221SAvinesh Kumar index = (a & 0xf) * 8; \ 177060caf221SAvinesh Kumar } \ 177160caf221SAvinesh Kumar return int128_getlo(int128_rshift(b->s128, index)) & \ 177260caf221SAvinesh 
Kumar MAKE_64BIT_MASK(0, size); \ 177360caf221SAvinesh Kumar } 177460caf221SAvinesh Kumar #endif 177560caf221SAvinesh Kumar 177660caf221SAvinesh Kumar VEXTU_X_DO(vextublx, 8, 1) 177760caf221SAvinesh Kumar VEXTU_X_DO(vextuhlx, 16, 1) 177860caf221SAvinesh Kumar VEXTU_X_DO(vextuwlx, 32, 1) 177960caf221SAvinesh Kumar VEXTU_X_DO(vextubrx, 8, 0) 178060caf221SAvinesh Kumar VEXTU_X_DO(vextuhrx, 16, 0) 178160caf221SAvinesh Kumar VEXTU_X_DO(vextuwrx, 32, 0) 178260caf221SAvinesh Kumar #undef VEXTU_X_DO 178360caf221SAvinesh Kumar 1784fcf5ef2aSThomas Huth /* The specification says that the results are undefined if all of the 1785fcf5ef2aSThomas Huth * shift counts are not identical. We check to make sure that they are 1786fcf5ef2aSThomas Huth * to conform to what real hardware appears to do. */ 1787fcf5ef2aSThomas Huth #define VSHIFT(suffix, leftp) \ 1788fcf5ef2aSThomas Huth void helper_vs##suffix(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1789fcf5ef2aSThomas Huth { \ 17903c385a93SMark Cave-Ayland int shift = b->VsrB(15) & 0x7; \ 1791fcf5ef2aSThomas Huth int doit = 1; \ 1792fcf5ef2aSThomas Huth int i; \ 1793fcf5ef2aSThomas Huth \ 1794fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { \ 1795fcf5ef2aSThomas Huth doit = doit && ((b->u8[i] & 0x7) == shift); \ 1796fcf5ef2aSThomas Huth } \ 1797fcf5ef2aSThomas Huth if (doit) { \ 1798fcf5ef2aSThomas Huth if (shift == 0) { \ 1799fcf5ef2aSThomas Huth *r = *a; \ 1800fcf5ef2aSThomas Huth } else if (leftp) { \ 18013c385a93SMark Cave-Ayland uint64_t carry = a->VsrD(1) >> (64 - shift); \ 1802fcf5ef2aSThomas Huth \ 18033c385a93SMark Cave-Ayland r->VsrD(0) = (a->VsrD(0) << shift) | carry; \ 18043c385a93SMark Cave-Ayland r->VsrD(1) = a->VsrD(1) << shift; \ 1805fcf5ef2aSThomas Huth } else { \ 18063c385a93SMark Cave-Ayland uint64_t carry = a->VsrD(0) << (64 - shift); \ 1807fcf5ef2aSThomas Huth \ 18083c385a93SMark Cave-Ayland r->VsrD(1) = (a->VsrD(1) >> shift) | carry; \ 18093c385a93SMark Cave-Ayland r->VsrD(0) = a->VsrD(0) >> shift; \ 
1810fcf5ef2aSThomas Huth } \ 1811fcf5ef2aSThomas Huth } \ 1812fcf5ef2aSThomas Huth } 1813fcf5ef2aSThomas Huth VSHIFT(l, 1) 1814fcf5ef2aSThomas Huth VSHIFT(r, 0) 1815fcf5ef2aSThomas Huth #undef VSHIFT 1816fcf5ef2aSThomas Huth 1817fcf5ef2aSThomas Huth #define VSL(suffix, element, mask) \ 1818fcf5ef2aSThomas Huth void helper_vsl##suffix(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 1819fcf5ef2aSThomas Huth { \ 1820fcf5ef2aSThomas Huth int i; \ 1821fcf5ef2aSThomas Huth \ 1822fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1823fcf5ef2aSThomas Huth unsigned int shift = b->element[i] & mask; \ 1824fcf5ef2aSThomas Huth \ 1825fcf5ef2aSThomas Huth r->element[i] = a->element[i] << shift; \ 1826fcf5ef2aSThomas Huth } \ 1827fcf5ef2aSThomas Huth } 1828fcf5ef2aSThomas Huth VSL(b, u8, 0x7) 1829fcf5ef2aSThomas Huth VSL(h, u16, 0x0F) 1830fcf5ef2aSThomas Huth VSL(w, u32, 0x1F) 1831fcf5ef2aSThomas Huth VSL(d, u64, 0x3F) 1832fcf5ef2aSThomas Huth #undef VSL 1833fcf5ef2aSThomas Huth 1834fcf5ef2aSThomas Huth void helper_vslv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1835fcf5ef2aSThomas Huth { 1836fcf5ef2aSThomas Huth int i; 1837fcf5ef2aSThomas Huth unsigned int shift, bytes, size; 1838fcf5ef2aSThomas Huth 1839fcf5ef2aSThomas Huth size = ARRAY_SIZE(r->u8); 1840fcf5ef2aSThomas Huth for (i = 0; i < size; i++) { 1841fcf5ef2aSThomas Huth shift = b->u8[i] & 0x7; /* extract shift value */ 1842fcf5ef2aSThomas Huth bytes = (a->u8[i] << 8) + /* extract adjacent bytes */ 1843fcf5ef2aSThomas Huth (((i + 1) < size) ? 
a->u8[i + 1] : 0); 1844fcf5ef2aSThomas Huth r->u8[i] = (bytes << shift) >> 8; /* shift and store result */ 1845fcf5ef2aSThomas Huth } 1846fcf5ef2aSThomas Huth } 1847fcf5ef2aSThomas Huth 1848fcf5ef2aSThomas Huth void helper_vsrv(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1849fcf5ef2aSThomas Huth { 1850fcf5ef2aSThomas Huth int i; 1851fcf5ef2aSThomas Huth unsigned int shift, bytes; 1852fcf5ef2aSThomas Huth 1853fcf5ef2aSThomas Huth /* Use reverse order, as destination and source register can be same. Its 1854fcf5ef2aSThomas Huth * being modified in place saving temporary, reverse order will guarantee 1855fcf5ef2aSThomas Huth * that computed result is not fed back. 1856fcf5ef2aSThomas Huth */ 1857fcf5ef2aSThomas Huth for (i = ARRAY_SIZE(r->u8) - 1; i >= 0; i--) { 1858fcf5ef2aSThomas Huth shift = b->u8[i] & 0x7; /* extract shift value */ 1859fcf5ef2aSThomas Huth bytes = ((i ? a->u8[i - 1] : 0) << 8) + a->u8[i]; 1860fcf5ef2aSThomas Huth /* extract adjacent bytes */ 1861fcf5ef2aSThomas Huth r->u8[i] = (bytes >> shift) & 0xFF; /* shift and store result */ 1862fcf5ef2aSThomas Huth } 1863fcf5ef2aSThomas Huth } 1864fcf5ef2aSThomas Huth 1865fcf5ef2aSThomas Huth void helper_vsldoi(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t shift) 1866fcf5ef2aSThomas Huth { 1867fcf5ef2aSThomas Huth int sh = shift & 0xf; 1868fcf5ef2aSThomas Huth int i; 1869fcf5ef2aSThomas Huth ppc_avr_t result; 1870fcf5ef2aSThomas Huth 1871fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1872fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1873fcf5ef2aSThomas Huth int index = sh + i; 1874fcf5ef2aSThomas Huth if (index > 0xf) { 1875fcf5ef2aSThomas Huth result.u8[i] = b->u8[index - 0x10]; 1876fcf5ef2aSThomas Huth } else { 1877fcf5ef2aSThomas Huth result.u8[i] = a->u8[index]; 1878fcf5ef2aSThomas Huth } 1879fcf5ef2aSThomas Huth } 1880fcf5ef2aSThomas Huth #else 1881fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u8); i++) { 1882fcf5ef2aSThomas Huth int index = (16 - sh) + i; 
1883fcf5ef2aSThomas Huth if (index > 0xf) { 1884fcf5ef2aSThomas Huth result.u8[i] = a->u8[index - 0x10]; 1885fcf5ef2aSThomas Huth } else { 1886fcf5ef2aSThomas Huth result.u8[i] = b->u8[index]; 1887fcf5ef2aSThomas Huth } 1888fcf5ef2aSThomas Huth } 1889fcf5ef2aSThomas Huth #endif 1890fcf5ef2aSThomas Huth *r = result; 1891fcf5ef2aSThomas Huth } 1892fcf5ef2aSThomas Huth 1893fcf5ef2aSThomas Huth void helper_vslo(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 1894fcf5ef2aSThomas Huth { 18953c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 1896fcf5ef2aSThomas Huth 1897fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1898fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 1899fcf5ef2aSThomas Huth memset(&r->u8[16-sh], 0, sh); 1900fcf5ef2aSThomas Huth #else 1901fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 1902fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 1903fcf5ef2aSThomas Huth #endif 1904fcf5ef2aSThomas Huth } 1905fcf5ef2aSThomas Huth 1906fcf5ef2aSThomas Huth /* Experimental testing shows that hardware masks the immediate. 
*/ 1907fcf5ef2aSThomas Huth #define _SPLAT_MASKED(element) (splat & (ARRAY_SIZE(r->element) - 1)) 1908fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1909fcf5ef2aSThomas Huth #define SPLAT_ELEMENT(element) _SPLAT_MASKED(element) 1910fcf5ef2aSThomas Huth #else 1911fcf5ef2aSThomas Huth #define SPLAT_ELEMENT(element) \ 1912fcf5ef2aSThomas Huth (ARRAY_SIZE(r->element) - 1 - _SPLAT_MASKED(element)) 1913fcf5ef2aSThomas Huth #endif 1914fcf5ef2aSThomas Huth #define VSPLT(suffix, element) \ 1915fcf5ef2aSThomas Huth void helper_vsplt##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t splat) \ 1916fcf5ef2aSThomas Huth { \ 1917fcf5ef2aSThomas Huth uint32_t s = b->element[SPLAT_ELEMENT(element)]; \ 1918fcf5ef2aSThomas Huth int i; \ 1919fcf5ef2aSThomas Huth \ 1920fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 1921fcf5ef2aSThomas Huth r->element[i] = s; \ 1922fcf5ef2aSThomas Huth } \ 1923fcf5ef2aSThomas Huth } 1924fcf5ef2aSThomas Huth VSPLT(b, u8) 1925fcf5ef2aSThomas Huth VSPLT(h, u16) 1926fcf5ef2aSThomas Huth VSPLT(w, u32) 1927fcf5ef2aSThomas Huth #undef VSPLT 1928fcf5ef2aSThomas Huth #undef SPLAT_ELEMENT 1929fcf5ef2aSThomas Huth #undef _SPLAT_MASKED 1930fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1931fcf5ef2aSThomas Huth #define VINSERT(suffix, element) \ 1932fcf5ef2aSThomas Huth void helper_vinsert##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1933fcf5ef2aSThomas Huth { \ 19344fff7218SLaurent Vivier memmove(&r->u8[index], &b->u8[8 - sizeof(r->element[0])], \ 1935fcf5ef2aSThomas Huth sizeof(r->element[0])); \ 1936fcf5ef2aSThomas Huth } 1937fcf5ef2aSThomas Huth #else 1938fcf5ef2aSThomas Huth #define VINSERT(suffix, element) \ 1939fcf5ef2aSThomas Huth void helper_vinsert##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1940fcf5ef2aSThomas Huth { \ 1941fcf5ef2aSThomas Huth uint32_t d = (16 - index) - sizeof(r->element[0]); \ 1942fcf5ef2aSThomas Huth memmove(&r->u8[d], &b->u8[8], sizeof(r->element[0])); \ 1943fcf5ef2aSThomas Huth } 
1944fcf5ef2aSThomas Huth #endif 1945fcf5ef2aSThomas Huth VINSERT(b, u8) 1946fcf5ef2aSThomas Huth VINSERT(h, u16) 1947fcf5ef2aSThomas Huth VINSERT(w, u32) 1948fcf5ef2aSThomas Huth VINSERT(d, u64) 1949fcf5ef2aSThomas Huth #undef VINSERT 1950fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 1951fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1952fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1953fcf5ef2aSThomas Huth { \ 1954fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1955fcf5ef2aSThomas Huth memmove(&r->u8[8 - es], &b->u8[index], es); \ 1956fcf5ef2aSThomas Huth memset(&r->u8[8], 0, 8); \ 1957fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8 - es); \ 1958fcf5ef2aSThomas Huth } 1959fcf5ef2aSThomas Huth #else 1960fcf5ef2aSThomas Huth #define VEXTRACT(suffix, element) \ 1961fcf5ef2aSThomas Huth void helper_vextract##suffix(ppc_avr_t *r, ppc_avr_t *b, uint32_t index) \ 1962fcf5ef2aSThomas Huth { \ 1963fcf5ef2aSThomas Huth uint32_t es = sizeof(r->element[0]); \ 1964fcf5ef2aSThomas Huth uint32_t s = (16 - index) - es; \ 1965fcf5ef2aSThomas Huth memmove(&r->u8[8], &b->u8[s], es); \ 1966fcf5ef2aSThomas Huth memset(&r->u8[0], 0, 8); \ 1967fcf5ef2aSThomas Huth memset(&r->u8[8 + es], 0, 8 - es); \ 1968fcf5ef2aSThomas Huth } 1969fcf5ef2aSThomas Huth #endif 1970fcf5ef2aSThomas Huth VEXTRACT(ub, u8) 1971fcf5ef2aSThomas Huth VEXTRACT(uh, u16) 1972fcf5ef2aSThomas Huth VEXTRACT(uw, u32) 1973fcf5ef2aSThomas Huth VEXTRACT(d, u64) 1974fcf5ef2aSThomas Huth #undef VEXTRACT 1975fcf5ef2aSThomas Huth 19768ad901e5SNikunj A Dadhania void helper_xxextractuw(CPUPPCState *env, target_ulong xtn, 19778ad901e5SNikunj A Dadhania target_ulong xbn, uint32_t index) 19788ad901e5SNikunj A Dadhania { 19798ad901e5SNikunj A Dadhania ppc_vsr_t xt, xb; 19808ad901e5SNikunj A Dadhania size_t es = sizeof(uint32_t); 19818ad901e5SNikunj A Dadhania uint32_t ext_index; 19828ad901e5SNikunj A Dadhania int i; 19838ad901e5SNikunj A Dadhania 
19848ad901e5SNikunj A Dadhania getVSR(xbn, &xb, env); 19858ad901e5SNikunj A Dadhania memset(&xt, 0, sizeof(xt)); 19868ad901e5SNikunj A Dadhania 19878ad901e5SNikunj A Dadhania #if defined(HOST_WORDS_BIGENDIAN) 19888ad901e5SNikunj A Dadhania ext_index = index; 19898ad901e5SNikunj A Dadhania for (i = 0; i < es; i++, ext_index++) { 19908ad901e5SNikunj A Dadhania xt.u8[8 - es + i] = xb.u8[ext_index % 16]; 19918ad901e5SNikunj A Dadhania } 19928ad901e5SNikunj A Dadhania #else 19938ad901e5SNikunj A Dadhania ext_index = 15 - index; 19948ad901e5SNikunj A Dadhania for (i = es - 1; i >= 0; i--, ext_index--) { 19958ad901e5SNikunj A Dadhania xt.u8[8 + i] = xb.u8[ext_index % 16]; 19968ad901e5SNikunj A Dadhania } 19978ad901e5SNikunj A Dadhania #endif 19988ad901e5SNikunj A Dadhania 19998ad901e5SNikunj A Dadhania putVSR(xtn, &xt, env); 20008ad901e5SNikunj A Dadhania } 20018ad901e5SNikunj A Dadhania 20023398b742SNikunj A Dadhania void helper_xxinsertw(CPUPPCState *env, target_ulong xtn, 20033398b742SNikunj A Dadhania target_ulong xbn, uint32_t index) 20043398b742SNikunj A Dadhania { 20053398b742SNikunj A Dadhania ppc_vsr_t xt, xb; 20063398b742SNikunj A Dadhania size_t es = sizeof(uint32_t); 20073398b742SNikunj A Dadhania int ins_index, i = 0; 20083398b742SNikunj A Dadhania 20093398b742SNikunj A Dadhania getVSR(xbn, &xb, env); 20103398b742SNikunj A Dadhania getVSR(xtn, &xt, env); 20113398b742SNikunj A Dadhania 20123398b742SNikunj A Dadhania #if defined(HOST_WORDS_BIGENDIAN) 20133398b742SNikunj A Dadhania ins_index = index; 20143398b742SNikunj A Dadhania for (i = 0; i < es && ins_index < 16; i++, ins_index++) { 20153398b742SNikunj A Dadhania xt.u8[ins_index] = xb.u8[8 - es + i]; 20163398b742SNikunj A Dadhania } 20173398b742SNikunj A Dadhania #else 20183398b742SNikunj A Dadhania ins_index = 15 - index; 20193398b742SNikunj A Dadhania for (i = es - 1; i >= 0 && ins_index >= 0; i--, ins_index--) { 20203398b742SNikunj A Dadhania xt.u8[ins_index] = xb.u8[8 + i]; 20213398b742SNikunj A 
Dadhania } 20223398b742SNikunj A Dadhania #endif 20233398b742SNikunj A Dadhania 20243398b742SNikunj A Dadhania putVSR(xtn, &xt, env); 20253398b742SNikunj A Dadhania } 20263398b742SNikunj A Dadhania 2027fcf5ef2aSThomas Huth #define VEXT_SIGNED(name, element, mask, cast, recast) \ 2028fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 2029fcf5ef2aSThomas Huth { \ 2030fcf5ef2aSThomas Huth int i; \ 2031fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, element) { \ 2032fcf5ef2aSThomas Huth r->element[i] = (recast)((cast)(b->element[i] & mask)); \ 2033fcf5ef2aSThomas Huth } \ 2034fcf5ef2aSThomas Huth } 2035fcf5ef2aSThomas Huth VEXT_SIGNED(vextsb2w, s32, UINT8_MAX, int8_t, int32_t) 2036fcf5ef2aSThomas Huth VEXT_SIGNED(vextsb2d, s64, UINT8_MAX, int8_t, int64_t) 2037fcf5ef2aSThomas Huth VEXT_SIGNED(vextsh2w, s32, UINT16_MAX, int16_t, int32_t) 2038fcf5ef2aSThomas Huth VEXT_SIGNED(vextsh2d, s64, UINT16_MAX, int16_t, int64_t) 2039fcf5ef2aSThomas Huth VEXT_SIGNED(vextsw2d, s64, UINT32_MAX, int32_t, int64_t) 2040fcf5ef2aSThomas Huth #undef VEXT_SIGNED 2041fcf5ef2aSThomas Huth 2042fcf5ef2aSThomas Huth #define VNEG(name, element) \ 2043fcf5ef2aSThomas Huth void helper_##name(ppc_avr_t *r, ppc_avr_t *b) \ 2044fcf5ef2aSThomas Huth { \ 2045fcf5ef2aSThomas Huth int i; \ 2046fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, element) { \ 2047fcf5ef2aSThomas Huth r->element[i] = -b->element[i]; \ 2048fcf5ef2aSThomas Huth } \ 2049fcf5ef2aSThomas Huth } 2050fcf5ef2aSThomas Huth VNEG(vnegw, s32) 2051fcf5ef2aSThomas Huth VNEG(vnegd, s64) 2052fcf5ef2aSThomas Huth #undef VNEG 2053fcf5ef2aSThomas Huth 2054fcf5ef2aSThomas Huth #define VSPLTI(suffix, element, splat_type) \ 2055fcf5ef2aSThomas Huth void helper_vspltis##suffix(ppc_avr_t *r, uint32_t splat) \ 2056fcf5ef2aSThomas Huth { \ 2057fcf5ef2aSThomas Huth splat_type x = (int8_t)(splat << 3) >> 3; \ 2058fcf5ef2aSThomas Huth int i; \ 2059fcf5ef2aSThomas Huth \ 2060fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 
2061fcf5ef2aSThomas Huth r->element[i] = x; \ 2062fcf5ef2aSThomas Huth } \ 2063fcf5ef2aSThomas Huth } 2064fcf5ef2aSThomas Huth VSPLTI(b, s8, int8_t) 2065fcf5ef2aSThomas Huth VSPLTI(h, s16, int16_t) 2066fcf5ef2aSThomas Huth VSPLTI(w, s32, int32_t) 2067fcf5ef2aSThomas Huth #undef VSPLTI 2068fcf5ef2aSThomas Huth 2069fcf5ef2aSThomas Huth #define VSR(suffix, element, mask) \ 2070fcf5ef2aSThomas Huth void helper_vsr##suffix(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) \ 2071fcf5ef2aSThomas Huth { \ 2072fcf5ef2aSThomas Huth int i; \ 2073fcf5ef2aSThomas Huth \ 2074fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->element); i++) { \ 2075fcf5ef2aSThomas Huth unsigned int shift = b->element[i] & mask; \ 2076fcf5ef2aSThomas Huth r->element[i] = a->element[i] >> shift; \ 2077fcf5ef2aSThomas Huth } \ 2078fcf5ef2aSThomas Huth } 2079fcf5ef2aSThomas Huth VSR(ab, s8, 0x7) 2080fcf5ef2aSThomas Huth VSR(ah, s16, 0xF) 2081fcf5ef2aSThomas Huth VSR(aw, s32, 0x1F) 2082fcf5ef2aSThomas Huth VSR(ad, s64, 0x3F) 2083fcf5ef2aSThomas Huth VSR(b, u8, 0x7) 2084fcf5ef2aSThomas Huth VSR(h, u16, 0xF) 2085fcf5ef2aSThomas Huth VSR(w, u32, 0x1F) 2086fcf5ef2aSThomas Huth VSR(d, u64, 0x3F) 2087fcf5ef2aSThomas Huth #undef VSR 2088fcf5ef2aSThomas Huth 2089fcf5ef2aSThomas Huth void helper_vsro(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2090fcf5ef2aSThomas Huth { 20913c385a93SMark Cave-Ayland int sh = (b->VsrB(0xf) >> 3) & 0xf; 2092fcf5ef2aSThomas Huth 2093fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 2094fcf5ef2aSThomas Huth memmove(&r->u8[sh], &a->u8[0], 16 - sh); 2095fcf5ef2aSThomas Huth memset(&r->u8[0], 0, sh); 2096fcf5ef2aSThomas Huth #else 2097fcf5ef2aSThomas Huth memmove(&r->u8[0], &a->u8[sh], 16 - sh); 2098fcf5ef2aSThomas Huth memset(&r->u8[16 - sh], 0, sh); 2099fcf5ef2aSThomas Huth #endif 2100fcf5ef2aSThomas Huth } 2101fcf5ef2aSThomas Huth 2102fcf5ef2aSThomas Huth void helper_vsubcuw(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2103fcf5ef2aSThomas Huth { 2104fcf5ef2aSThomas Huth int i; 
2105fcf5ef2aSThomas Huth 2106fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 2107fcf5ef2aSThomas Huth r->u32[i] = a->u32[i] >= b->u32[i]; 2108fcf5ef2aSThomas Huth } 2109fcf5ef2aSThomas Huth } 2110fcf5ef2aSThomas Huth 2111fcf5ef2aSThomas Huth void helper_vsumsws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2112fcf5ef2aSThomas Huth { 2113fcf5ef2aSThomas Huth int64_t t; 2114fcf5ef2aSThomas Huth int i, upper; 2115fcf5ef2aSThomas Huth ppc_avr_t result; 2116fcf5ef2aSThomas Huth int sat = 0; 2117fcf5ef2aSThomas Huth 2118fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 2119fcf5ef2aSThomas Huth upper = ARRAY_SIZE(r->s32)-1; 2120fcf5ef2aSThomas Huth #else 2121fcf5ef2aSThomas Huth upper = 0; 2122fcf5ef2aSThomas Huth #endif 2123fcf5ef2aSThomas Huth t = (int64_t)b->s32[upper]; 2124fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 2125fcf5ef2aSThomas Huth t += a->s32[i]; 2126fcf5ef2aSThomas Huth result.s32[i] = 0; 2127fcf5ef2aSThomas Huth } 2128fcf5ef2aSThomas Huth result.s32[upper] = cvtsdsw(t, &sat); 2129fcf5ef2aSThomas Huth *r = result; 2130fcf5ef2aSThomas Huth 2131fcf5ef2aSThomas Huth if (sat) { 2132fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 2133fcf5ef2aSThomas Huth } 2134fcf5ef2aSThomas Huth } 2135fcf5ef2aSThomas Huth 2136fcf5ef2aSThomas Huth void helper_vsum2sws(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2137fcf5ef2aSThomas Huth { 2138fcf5ef2aSThomas Huth int i, j, upper; 2139fcf5ef2aSThomas Huth ppc_avr_t result; 2140fcf5ef2aSThomas Huth int sat = 0; 2141fcf5ef2aSThomas Huth 2142fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 2143fcf5ef2aSThomas Huth upper = 1; 2144fcf5ef2aSThomas Huth #else 2145fcf5ef2aSThomas Huth upper = 0; 2146fcf5ef2aSThomas Huth #endif 2147fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 2148fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[upper + i * 2]; 2149fcf5ef2aSThomas Huth 2150fcf5ef2aSThomas Huth result.u64[i] = 0; 2151fcf5ef2aSThomas Huth for 
(j = 0; j < ARRAY_SIZE(r->u64); j++) { 2152fcf5ef2aSThomas Huth t += a->s32[2 * i + j]; 2153fcf5ef2aSThomas Huth } 2154fcf5ef2aSThomas Huth result.s32[upper + i * 2] = cvtsdsw(t, &sat); 2155fcf5ef2aSThomas Huth } 2156fcf5ef2aSThomas Huth 2157fcf5ef2aSThomas Huth *r = result; 2158fcf5ef2aSThomas Huth if (sat) { 2159fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 2160fcf5ef2aSThomas Huth } 2161fcf5ef2aSThomas Huth } 2162fcf5ef2aSThomas Huth 2163fcf5ef2aSThomas Huth void helper_vsum4sbs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2164fcf5ef2aSThomas Huth { 2165fcf5ef2aSThomas Huth int i, j; 2166fcf5ef2aSThomas Huth int sat = 0; 2167fcf5ef2aSThomas Huth 2168fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 2169fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 2170fcf5ef2aSThomas Huth 2171fcf5ef2aSThomas Huth for (j = 0; j < ARRAY_SIZE(r->s32); j++) { 2172fcf5ef2aSThomas Huth t += a->s8[4 * i + j]; 2173fcf5ef2aSThomas Huth } 2174fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 2175fcf5ef2aSThomas Huth } 2176fcf5ef2aSThomas Huth 2177fcf5ef2aSThomas Huth if (sat) { 2178fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 2179fcf5ef2aSThomas Huth } 2180fcf5ef2aSThomas Huth } 2181fcf5ef2aSThomas Huth 2182fcf5ef2aSThomas Huth void helper_vsum4shs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2183fcf5ef2aSThomas Huth { 2184fcf5ef2aSThomas Huth int sat = 0; 2185fcf5ef2aSThomas Huth int i; 2186fcf5ef2aSThomas Huth 2187fcf5ef2aSThomas Huth for (i = 0; i < ARRAY_SIZE(r->s32); i++) { 2188fcf5ef2aSThomas Huth int64_t t = (int64_t)b->s32[i]; 2189fcf5ef2aSThomas Huth 2190fcf5ef2aSThomas Huth t += a->s16[2 * i] + a->s16[2 * i + 1]; 2191fcf5ef2aSThomas Huth r->s32[i] = cvtsdsw(t, &sat); 2192fcf5ef2aSThomas Huth } 2193fcf5ef2aSThomas Huth 2194fcf5ef2aSThomas Huth if (sat) { 2195fcf5ef2aSThomas Huth env->vscr |= (1 << VSCR_SAT); 2196fcf5ef2aSThomas Huth } 2197fcf5ef2aSThomas Huth } 2198fcf5ef2aSThomas Huth 2199fcf5ef2aSThomas Huth void 
helper_vsum4ubs(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
{
    /*
     * For each word: add the four unsigned bytes of a that share the word to
     * the unsigned word of b, saturate through cvtuduw() and store into r.
     * VSCR[SAT] is set when cvtuduw() reports saturation.
     */
    int i, j;
    int sat = 0;

    for (i = 0; i < ARRAY_SIZE(r->u32); i++) {
        uint64_t t = (uint64_t)b->u32[i];

        for (j = 0; j < ARRAY_SIZE(r->u32); j++) {
            t += a->u8[4 * i + j];
        }
        r->u32[i] = cvtuduw(t, &sat);
    }

    if (sat) {
        env->vscr |= (1 << VSCR_SAT);
    }
}

/*
 * UPKHI / UPKLO: value of the `hi` macro argument that selects the "high"
 * or "low" unpack variant; the two swap with host byte order because `hi`
 * picks the lower-indexed half of the source array.
 */
#if defined(HOST_WORDS_BIGENDIAN)
#define UPKHI 1
#define UPKLO 0
#else
#define UPKHI 0
#define UPKLO 1
#endif
/*
 * VUPKPX(suffix, hi) defines helper_vupk<suffix>(): expand four 16-bit
 * pixels (1 + 5 + 5 + 5 bits) from one half of b into four 32-bit words of
 * r.  The top bit becomes 0xff or 0x00 in bits 24..31; the three 5-bit
 * fields land in the low bits of the next three bytes.
 *
 * The channel temporaries are uint32_t so that shifting 0xff left by 24
 * does not overflow a promoted int, and they no longer reuse the names of
 * the r and b parameters.
 */
#define VUPKPX(suffix, hi)                                              \
    void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
    {                                                                   \
        int i;                                                          \
        ppc_avr_t result;                                               \
                                                                        \
        for (i = 0; i < ARRAY_SIZE(r->u32); i++) {                      \
            uint16_t px = b->u16[hi ? i : i + 4];                       \
            uint32_t alpha = (px >> 15) ? 0xff : 0;                     \
            uint32_t red = (px >> 10) & 0x1f;                           \
            uint32_t green = (px >> 5) & 0x1f;                          \
            uint32_t blue = px & 0x1f;                                  \
                                                                        \
            result.u32[i] = (alpha << 24) | (red << 16) |               \
                            (green << 8) | blue;                        \
        }                                                               \
        *r = result;                                                    \
    }
VUPKPX(lpx, UPKLO)
VUPKPX(hpx, UPKHI)
#undef VUPKPX

/*
 * VUPK(suffix, unpacked, packee, hi) defines helper_vupk<suffix>(): widen
 * the narrow `packee` elements from one half of b into the `unpacked`
 * elements of r.  `hi` selects the lower-indexed half of b->packee[],
 * otherwise the remaining elements are used.  The result is built in a
 * temporary so r and b may be the same register.
 */
#define VUPK(suffix, unpacked, packee, hi)                              \
    void helper_vupk##suffix(ppc_avr_t *r, ppc_avr_t *b)                \
    {                                                                   \
        int i;                                                          \
        ppc_avr_t result;                                               \
                                                                        \
        if (hi) {                                                       \
            for (i = 0; i < ARRAY_SIZE(r->unpacked); i++) {             \
                result.unpacked[i] = b->packee[i];                      \
            }                                                           \
        } else {                                                        \
            for (i = ARRAY_SIZE(r->unpacked); i < ARRAY_SIZE(r->packee); \
                 i++) {                                                 \
                result.unpacked[i - ARRAY_SIZE(r->unpacked)] = b->packee[i]; \
            }                                                           \
        }                                                               \
        *r = result;                                                    \
    }
VUPK(hsb, s16, s8, UPKHI)
VUPK(hsh, s32, s16, UPKHI)
VUPK(hsw, s64, s32, UPKHI)
VUPK(lsb, s16, s8, UPKLO)
VUPK(lsh, s32, s16, UPKLO)
VUPK(lsw, s64, s32, UPKLO)
#undef VUPK
#undef UPKHI
#undef UPKLO

#define VGENERIC_DO(name, element)                                      \
    void helper_v##name(ppc_avr_t *r, ppc_avr_t *b)                     \
{ \ 2277fcf5ef2aSThomas Huth int i; \ 2278fcf5ef2aSThomas Huth \ 2279fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, element) { \ 2280fcf5ef2aSThomas Huth r->element[i] = name(b->element[i]); \ 2281fcf5ef2aSThomas Huth } \ 2282fcf5ef2aSThomas Huth } 2283fcf5ef2aSThomas Huth 2284fcf5ef2aSThomas Huth #define clzb(v) ((v) ? clz32((uint32_t)(v) << 24) : 8) 2285fcf5ef2aSThomas Huth #define clzh(v) ((v) ? clz32((uint32_t)(v) << 16) : 16) 2286fcf5ef2aSThomas Huth #define clzw(v) clz32((v)) 2287fcf5ef2aSThomas Huth #define clzd(v) clz64((v)) 2288fcf5ef2aSThomas Huth 2289fcf5ef2aSThomas Huth VGENERIC_DO(clzb, u8) 2290fcf5ef2aSThomas Huth VGENERIC_DO(clzh, u16) 2291fcf5ef2aSThomas Huth VGENERIC_DO(clzw, u32) 2292fcf5ef2aSThomas Huth VGENERIC_DO(clzd, u64) 2293fcf5ef2aSThomas Huth 2294fcf5ef2aSThomas Huth #undef clzb 2295fcf5ef2aSThomas Huth #undef clzh 2296fcf5ef2aSThomas Huth #undef clzw 2297fcf5ef2aSThomas Huth #undef clzd 2298fcf5ef2aSThomas Huth 2299fcf5ef2aSThomas Huth #define ctzb(v) ((v) ? ctz32(v) : 8) 2300fcf5ef2aSThomas Huth #define ctzh(v) ((v) ? 
ctz32(v) : 16) 2301fcf5ef2aSThomas Huth #define ctzw(v) ctz32((v)) 2302fcf5ef2aSThomas Huth #define ctzd(v) ctz64((v)) 2303fcf5ef2aSThomas Huth 2304fcf5ef2aSThomas Huth VGENERIC_DO(ctzb, u8) 2305fcf5ef2aSThomas Huth VGENERIC_DO(ctzh, u16) 2306fcf5ef2aSThomas Huth VGENERIC_DO(ctzw, u32) 2307fcf5ef2aSThomas Huth VGENERIC_DO(ctzd, u64) 2308fcf5ef2aSThomas Huth 2309fcf5ef2aSThomas Huth #undef ctzb 2310fcf5ef2aSThomas Huth #undef ctzh 2311fcf5ef2aSThomas Huth #undef ctzw 2312fcf5ef2aSThomas Huth #undef ctzd 2313fcf5ef2aSThomas Huth 2314fcf5ef2aSThomas Huth #define popcntb(v) ctpop8(v) 2315fcf5ef2aSThomas Huth #define popcnth(v) ctpop16(v) 2316fcf5ef2aSThomas Huth #define popcntw(v) ctpop32(v) 2317fcf5ef2aSThomas Huth #define popcntd(v) ctpop64(v) 2318fcf5ef2aSThomas Huth 2319fcf5ef2aSThomas Huth VGENERIC_DO(popcntb, u8) 2320fcf5ef2aSThomas Huth VGENERIC_DO(popcnth, u16) 2321fcf5ef2aSThomas Huth VGENERIC_DO(popcntw, u32) 2322fcf5ef2aSThomas Huth VGENERIC_DO(popcntd, u64) 2323fcf5ef2aSThomas Huth 2324fcf5ef2aSThomas Huth #undef popcntb 2325fcf5ef2aSThomas Huth #undef popcnth 2326fcf5ef2aSThomas Huth #undef popcntw 2327fcf5ef2aSThomas Huth #undef popcntd 2328fcf5ef2aSThomas Huth 2329fcf5ef2aSThomas Huth #undef VGENERIC_DO 2330fcf5ef2aSThomas Huth 2331fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 2332fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 0, 1 } } 2333fcf5ef2aSThomas Huth #else 2334fcf5ef2aSThomas Huth #define QW_ONE { .u64 = { 1, 0 } } 2335fcf5ef2aSThomas Huth #endif 2336fcf5ef2aSThomas Huth 2337fcf5ef2aSThomas Huth #ifndef CONFIG_INT128 2338fcf5ef2aSThomas Huth 2339fcf5ef2aSThomas Huth static inline void avr_qw_not(ppc_avr_t *t, ppc_avr_t a) 2340fcf5ef2aSThomas Huth { 2341fcf5ef2aSThomas Huth t->u64[0] = ~a.u64[0]; 2342fcf5ef2aSThomas Huth t->u64[1] = ~a.u64[1]; 2343fcf5ef2aSThomas Huth } 2344fcf5ef2aSThomas Huth 2345fcf5ef2aSThomas Huth static int avr_qw_cmpu(ppc_avr_t a, ppc_avr_t b) 2346fcf5ef2aSThomas Huth { 23473c385a93SMark Cave-Ayland if (a.VsrD(0) 
< b.VsrD(0)) { 2348fcf5ef2aSThomas Huth return -1; 23493c385a93SMark Cave-Ayland } else if (a.VsrD(0) > b.VsrD(0)) { 2350fcf5ef2aSThomas Huth return 1; 23513c385a93SMark Cave-Ayland } else if (a.VsrD(1) < b.VsrD(1)) { 2352fcf5ef2aSThomas Huth return -1; 23533c385a93SMark Cave-Ayland } else if (a.VsrD(1) > b.VsrD(1)) { 2354fcf5ef2aSThomas Huth return 1; 2355fcf5ef2aSThomas Huth } else { 2356fcf5ef2aSThomas Huth return 0; 2357fcf5ef2aSThomas Huth } 2358fcf5ef2aSThomas Huth } 2359fcf5ef2aSThomas Huth 2360fcf5ef2aSThomas Huth static void avr_qw_add(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 2361fcf5ef2aSThomas Huth { 23623c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 23633c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 23643c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 2365fcf5ef2aSThomas Huth } 2366fcf5ef2aSThomas Huth 2367fcf5ef2aSThomas Huth static int avr_qw_addc(ppc_avr_t *t, ppc_avr_t a, ppc_avr_t b) 2368fcf5ef2aSThomas Huth { 2369fcf5ef2aSThomas Huth ppc_avr_t not_a; 23703c385a93SMark Cave-Ayland t->VsrD(1) = a.VsrD(1) + b.VsrD(1); 23713c385a93SMark Cave-Ayland t->VsrD(0) = a.VsrD(0) + b.VsrD(0) + 23723c385a93SMark Cave-Ayland (~a.VsrD(1) < b.VsrD(1)); 2373fcf5ef2aSThomas Huth avr_qw_not(¬_a, a); 2374fcf5ef2aSThomas Huth return avr_qw_cmpu(not_a, b) < 0; 2375fcf5ef2aSThomas Huth } 2376fcf5ef2aSThomas Huth 2377fcf5ef2aSThomas Huth #endif 2378fcf5ef2aSThomas Huth 2379fcf5ef2aSThomas Huth void helper_vadduqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2380fcf5ef2aSThomas Huth { 2381fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2382fcf5ef2aSThomas Huth r->u128 = a->u128 + b->u128; 2383fcf5ef2aSThomas Huth #else 2384fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 2385fcf5ef2aSThomas Huth #endif 2386fcf5ef2aSThomas Huth } 2387fcf5ef2aSThomas Huth 2388fcf5ef2aSThomas Huth void helper_vaddeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2389fcf5ef2aSThomas Huth { 2390fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2391fcf5ef2aSThomas Huth 
r->u128 = a->u128 + b->u128 + (c->u128 & 1); 2392fcf5ef2aSThomas Huth #else 2393fcf5ef2aSThomas Huth 23943c385a93SMark Cave-Ayland if (c->VsrD(1) & 1) { 2395fcf5ef2aSThomas Huth ppc_avr_t tmp; 2396fcf5ef2aSThomas Huth 23973c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 23983c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 2399fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 2400fcf5ef2aSThomas Huth avr_qw_add(r, tmp, *b); 2401fcf5ef2aSThomas Huth } else { 2402fcf5ef2aSThomas Huth avr_qw_add(r, *a, *b); 2403fcf5ef2aSThomas Huth } 2404fcf5ef2aSThomas Huth #endif 2405fcf5ef2aSThomas Huth } 2406fcf5ef2aSThomas Huth 2407fcf5ef2aSThomas Huth void helper_vaddcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2408fcf5ef2aSThomas Huth { 2409fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2410fcf5ef2aSThomas Huth r->u128 = (~a->u128 < b->u128); 2411fcf5ef2aSThomas Huth #else 2412fcf5ef2aSThomas Huth ppc_avr_t not_a; 2413fcf5ef2aSThomas Huth 2414fcf5ef2aSThomas Huth avr_qw_not(¬_a, *a); 2415fcf5ef2aSThomas Huth 24163c385a93SMark Cave-Ayland r->VsrD(0) = 0; 24173c385a93SMark Cave-Ayland r->VsrD(1) = (avr_qw_cmpu(not_a, *b) < 0); 2418fcf5ef2aSThomas Huth #endif 2419fcf5ef2aSThomas Huth } 2420fcf5ef2aSThomas Huth 2421fcf5ef2aSThomas Huth void helper_vaddecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2422fcf5ef2aSThomas Huth { 2423fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2424fcf5ef2aSThomas Huth int carry_out = (~a->u128 < b->u128); 2425fcf5ef2aSThomas Huth if (!carry_out && (c->u128 & 1)) { 2426fcf5ef2aSThomas Huth carry_out = ((a->u128 + b->u128 + 1) == 0) && 2427fcf5ef2aSThomas Huth ((a->u128 != 0) || (b->u128 != 0)); 2428fcf5ef2aSThomas Huth } 2429fcf5ef2aSThomas Huth r->u128 = carry_out; 2430fcf5ef2aSThomas Huth #else 2431fcf5ef2aSThomas Huth 24323c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 2433fcf5ef2aSThomas Huth int carry_out = 0; 2434fcf5ef2aSThomas Huth ppc_avr_t tmp; 2435fcf5ef2aSThomas Huth 2436fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, *a, 
*b); 2437fcf5ef2aSThomas Huth 2438fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2439fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 2440fcf5ef2aSThomas Huth carry_out = avr_qw_addc(&tmp, tmp, one); 2441fcf5ef2aSThomas Huth } 24423c385a93SMark Cave-Ayland r->VsrD(0) = 0; 24433c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2444fcf5ef2aSThomas Huth #endif 2445fcf5ef2aSThomas Huth } 2446fcf5ef2aSThomas Huth 2447fcf5ef2aSThomas Huth void helper_vsubuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2448fcf5ef2aSThomas Huth { 2449fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2450fcf5ef2aSThomas Huth r->u128 = a->u128 - b->u128; 2451fcf5ef2aSThomas Huth #else 2452fcf5ef2aSThomas Huth ppc_avr_t tmp; 2453fcf5ef2aSThomas Huth ppc_avr_t one = QW_ONE; 2454fcf5ef2aSThomas Huth 2455fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2456fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 2457fcf5ef2aSThomas Huth avr_qw_add(r, tmp, one); 2458fcf5ef2aSThomas Huth #endif 2459fcf5ef2aSThomas Huth } 2460fcf5ef2aSThomas Huth 2461fcf5ef2aSThomas Huth void helper_vsubeuqm(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2462fcf5ef2aSThomas Huth { 2463fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2464fcf5ef2aSThomas Huth r->u128 = a->u128 + ~b->u128 + (c->u128 & 1); 2465fcf5ef2aSThomas Huth #else 2466fcf5ef2aSThomas Huth ppc_avr_t tmp, sum; 2467fcf5ef2aSThomas Huth 2468fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2469fcf5ef2aSThomas Huth avr_qw_add(&sum, *a, tmp); 2470fcf5ef2aSThomas Huth 24713c385a93SMark Cave-Ayland tmp.VsrD(0) = 0; 24723c385a93SMark Cave-Ayland tmp.VsrD(1) = c->VsrD(1) & 1; 2473fcf5ef2aSThomas Huth avr_qw_add(r, sum, tmp); 2474fcf5ef2aSThomas Huth #endif 2475fcf5ef2aSThomas Huth } 2476fcf5ef2aSThomas Huth 2477fcf5ef2aSThomas Huth void helper_vsubcuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 2478fcf5ef2aSThomas Huth { 2479fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2480fcf5ef2aSThomas Huth r->u128 = (~a->u128 < ~b->u128) || 2481fcf5ef2aSThomas Huth (a->u128 + ~b->u128 == 
(__uint128_t)-1); 2482fcf5ef2aSThomas Huth #else 2483fcf5ef2aSThomas Huth int carry = (avr_qw_cmpu(*a, *b) > 0); 2484fcf5ef2aSThomas Huth if (!carry) { 2485fcf5ef2aSThomas Huth ppc_avr_t tmp; 2486fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2487fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 24883c385a93SMark Cave-Ayland carry = ((tmp.VsrSD(0) == -1ull) && (tmp.VsrSD(1) == -1ull)); 2489fcf5ef2aSThomas Huth } 24903c385a93SMark Cave-Ayland r->VsrD(0) = 0; 24913c385a93SMark Cave-Ayland r->VsrD(1) = carry; 2492fcf5ef2aSThomas Huth #endif 2493fcf5ef2aSThomas Huth } 2494fcf5ef2aSThomas Huth 2495fcf5ef2aSThomas Huth void helper_vsubecuq(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 2496fcf5ef2aSThomas Huth { 2497fcf5ef2aSThomas Huth #ifdef CONFIG_INT128 2498fcf5ef2aSThomas Huth r->u128 = 2499fcf5ef2aSThomas Huth (~a->u128 < ~b->u128) || 2500fcf5ef2aSThomas Huth ((c->u128 & 1) && (a->u128 + ~b->u128 == (__uint128_t)-1)); 2501fcf5ef2aSThomas Huth #else 25023c385a93SMark Cave-Ayland int carry_in = c->VsrD(1) & 1; 2503fcf5ef2aSThomas Huth int carry_out = (avr_qw_cmpu(*a, *b) > 0); 2504fcf5ef2aSThomas Huth if (!carry_out && carry_in) { 2505fcf5ef2aSThomas Huth ppc_avr_t tmp; 2506fcf5ef2aSThomas Huth avr_qw_not(&tmp, *b); 2507fcf5ef2aSThomas Huth avr_qw_add(&tmp, *a, tmp); 25083c385a93SMark Cave-Ayland carry_out = ((tmp.VsrD(0) == -1ull) && (tmp.VsrD(1) == -1ull)); 2509fcf5ef2aSThomas Huth } 2510fcf5ef2aSThomas Huth 25113c385a93SMark Cave-Ayland r->VsrD(0) = 0; 25123c385a93SMark Cave-Ayland r->VsrD(1) = carry_out; 2513fcf5ef2aSThomas Huth #endif 2514fcf5ef2aSThomas Huth } 2515fcf5ef2aSThomas Huth 2516fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_1 0xC 2517fcf5ef2aSThomas Huth #define BCD_PLUS_PREF_2 0xF 2518fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_1 0xA 2519fcf5ef2aSThomas Huth #define BCD_NEG_PREF 0xD 2520fcf5ef2aSThomas Huth #define BCD_NEG_ALT 0xB 2521fcf5ef2aSThomas Huth #define BCD_PLUS_ALT_2 0xE 2522fcf5ef2aSThomas Huth #define NATIONAL_PLUS 0x2B 2523fcf5ef2aSThomas 
Huth #define NATIONAL_NEG 0x2D 2524fcf5ef2aSThomas Huth 2525fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 2526365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) (15 - ((n) / 2)) 2527fcf5ef2aSThomas Huth #else 2528365206aeSJose Ricardo Ziviani #define BCD_DIG_BYTE(n) ((n) / 2) 2529fcf5ef2aSThomas Huth #endif 2530fcf5ef2aSThomas Huth 2531fcf5ef2aSThomas Huth static int bcd_get_sgn(ppc_avr_t *bcd) 2532fcf5ef2aSThomas Huth { 2533fcf5ef2aSThomas Huth switch (bcd->u8[BCD_DIG_BYTE(0)] & 0xF) { 2534fcf5ef2aSThomas Huth case BCD_PLUS_PREF_1: 2535fcf5ef2aSThomas Huth case BCD_PLUS_PREF_2: 2536fcf5ef2aSThomas Huth case BCD_PLUS_ALT_1: 2537fcf5ef2aSThomas Huth case BCD_PLUS_ALT_2: 2538fcf5ef2aSThomas Huth { 2539fcf5ef2aSThomas Huth return 1; 2540fcf5ef2aSThomas Huth } 2541fcf5ef2aSThomas Huth 2542fcf5ef2aSThomas Huth case BCD_NEG_PREF: 2543fcf5ef2aSThomas Huth case BCD_NEG_ALT: 2544fcf5ef2aSThomas Huth { 2545fcf5ef2aSThomas Huth return -1; 2546fcf5ef2aSThomas Huth } 2547fcf5ef2aSThomas Huth 2548fcf5ef2aSThomas Huth default: 2549fcf5ef2aSThomas Huth { 2550fcf5ef2aSThomas Huth return 0; 2551fcf5ef2aSThomas Huth } 2552fcf5ef2aSThomas Huth } 2553fcf5ef2aSThomas Huth } 2554fcf5ef2aSThomas Huth 2555fcf5ef2aSThomas Huth static int bcd_preferred_sgn(int sgn, int ps) 2556fcf5ef2aSThomas Huth { 2557fcf5ef2aSThomas Huth if (sgn >= 0) { 2558fcf5ef2aSThomas Huth return (ps == 0) ? 
BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2; 2559fcf5ef2aSThomas Huth } else { 2560fcf5ef2aSThomas Huth return BCD_NEG_PREF; 2561fcf5ef2aSThomas Huth } 2562fcf5ef2aSThomas Huth } 2563fcf5ef2aSThomas Huth 2564fcf5ef2aSThomas Huth static uint8_t bcd_get_digit(ppc_avr_t *bcd, int n, int *invalid) 2565fcf5ef2aSThomas Huth { 2566fcf5ef2aSThomas Huth uint8_t result; 2567fcf5ef2aSThomas Huth if (n & 1) { 2568fcf5ef2aSThomas Huth result = bcd->u8[BCD_DIG_BYTE(n)] >> 4; 2569fcf5ef2aSThomas Huth } else { 2570fcf5ef2aSThomas Huth result = bcd->u8[BCD_DIG_BYTE(n)] & 0xF; 2571fcf5ef2aSThomas Huth } 2572fcf5ef2aSThomas Huth 2573fcf5ef2aSThomas Huth if (unlikely(result > 9)) { 2574fcf5ef2aSThomas Huth *invalid = true; 2575fcf5ef2aSThomas Huth } 2576fcf5ef2aSThomas Huth return result; 2577fcf5ef2aSThomas Huth } 2578fcf5ef2aSThomas Huth 2579fcf5ef2aSThomas Huth static void bcd_put_digit(ppc_avr_t *bcd, uint8_t digit, int n) 2580fcf5ef2aSThomas Huth { 2581fcf5ef2aSThomas Huth if (n & 1) { 2582fcf5ef2aSThomas Huth bcd->u8[BCD_DIG_BYTE(n)] &= 0x0F; 2583fcf5ef2aSThomas Huth bcd->u8[BCD_DIG_BYTE(n)] |= (digit<<4); 2584fcf5ef2aSThomas Huth } else { 2585fcf5ef2aSThomas Huth bcd->u8[BCD_DIG_BYTE(n)] &= 0xF0; 2586fcf5ef2aSThomas Huth bcd->u8[BCD_DIG_BYTE(n)] |= digit; 2587fcf5ef2aSThomas Huth } 2588fcf5ef2aSThomas Huth } 2589fcf5ef2aSThomas Huth 2590071663dfSJose Ricardo Ziviani static bool bcd_is_valid(ppc_avr_t *bcd) 2591071663dfSJose Ricardo Ziviani { 2592071663dfSJose Ricardo Ziviani int i; 2593071663dfSJose Ricardo Ziviani int invalid = 0; 2594071663dfSJose Ricardo Ziviani 2595071663dfSJose Ricardo Ziviani if (bcd_get_sgn(bcd) == 0) { 2596071663dfSJose Ricardo Ziviani return false; 2597071663dfSJose Ricardo Ziviani } 2598071663dfSJose Ricardo Ziviani 2599071663dfSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 2600071663dfSJose Ricardo Ziviani bcd_get_digit(bcd, i, &invalid); 2601071663dfSJose Ricardo Ziviani if (unlikely(invalid)) { 2602071663dfSJose Ricardo Ziviani return false; 
2603071663dfSJose Ricardo Ziviani } 2604071663dfSJose Ricardo Ziviani } 2605071663dfSJose Ricardo Ziviani return true; 2606071663dfSJose Ricardo Ziviani } 2607071663dfSJose Ricardo Ziviani 2608fcf5ef2aSThomas Huth static int bcd_cmp_zero(ppc_avr_t *bcd) 2609fcf5ef2aSThomas Huth { 26103c385a93SMark Cave-Ayland if (bcd->VsrD(0) == 0 && (bcd->VsrD(1) >> 4) == 0) { 2611efa73196SNikunj A Dadhania return CRF_EQ; 2612fcf5ef2aSThomas Huth } else { 2613efa73196SNikunj A Dadhania return (bcd_get_sgn(bcd) == 1) ? CRF_GT : CRF_LT; 2614fcf5ef2aSThomas Huth } 2615fcf5ef2aSThomas Huth } 2616fcf5ef2aSThomas Huth 2617fcf5ef2aSThomas Huth static uint16_t get_national_digit(ppc_avr_t *reg, int n) 2618fcf5ef2aSThomas Huth { 2619fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 2620fcf5ef2aSThomas Huth return reg->u16[7 - n]; 2621fcf5ef2aSThomas Huth #else 2622fcf5ef2aSThomas Huth return reg->u16[n]; 2623fcf5ef2aSThomas Huth #endif 2624fcf5ef2aSThomas Huth } 2625fcf5ef2aSThomas Huth 2626fcf5ef2aSThomas Huth static void set_national_digit(ppc_avr_t *reg, uint8_t val, int n) 2627fcf5ef2aSThomas Huth { 2628fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 2629fcf5ef2aSThomas Huth reg->u16[7 - n] = val; 2630fcf5ef2aSThomas Huth #else 2631fcf5ef2aSThomas Huth reg->u16[n] = val; 2632fcf5ef2aSThomas Huth #endif 2633fcf5ef2aSThomas Huth } 2634fcf5ef2aSThomas Huth 2635fcf5ef2aSThomas Huth static int bcd_cmp_mag(ppc_avr_t *a, ppc_avr_t *b) 2636fcf5ef2aSThomas Huth { 2637fcf5ef2aSThomas Huth int i; 2638fcf5ef2aSThomas Huth int invalid = 0; 2639fcf5ef2aSThomas Huth for (i = 31; i > 0; i--) { 2640fcf5ef2aSThomas Huth uint8_t dig_a = bcd_get_digit(a, i, &invalid); 2641fcf5ef2aSThomas Huth uint8_t dig_b = bcd_get_digit(b, i, &invalid); 2642fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2643fcf5ef2aSThomas Huth return 0; /* doesn't matter */ 2644fcf5ef2aSThomas Huth } else if (dig_a > dig_b) { 2645fcf5ef2aSThomas Huth return 1; 2646fcf5ef2aSThomas Huth } else if (dig_a < dig_b) { 
2647fcf5ef2aSThomas Huth return -1; 2648fcf5ef2aSThomas Huth } 2649fcf5ef2aSThomas Huth } 2650fcf5ef2aSThomas Huth 2651fcf5ef2aSThomas Huth return 0; 2652fcf5ef2aSThomas Huth } 2653fcf5ef2aSThomas Huth 2654d03b174aSYasmin Beatriz static void bcd_add_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2655fcf5ef2aSThomas Huth int *overflow) 2656fcf5ef2aSThomas Huth { 2657fcf5ef2aSThomas Huth int carry = 0; 2658fcf5ef2aSThomas Huth int i; 2659fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2660fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) + 2661fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2662fcf5ef2aSThomas Huth if (digit > 9) { 2663fcf5ef2aSThomas Huth carry = 1; 2664fcf5ef2aSThomas Huth digit -= 10; 2665fcf5ef2aSThomas Huth } else { 2666fcf5ef2aSThomas Huth carry = 0; 2667fcf5ef2aSThomas Huth } 2668fcf5ef2aSThomas Huth 2669fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2670fcf5ef2aSThomas Huth } 2671fcf5ef2aSThomas Huth 2672fcf5ef2aSThomas Huth *overflow = carry; 2673fcf5ef2aSThomas Huth } 2674fcf5ef2aSThomas Huth 2675d03b174aSYasmin Beatriz static void bcd_sub_mag(ppc_avr_t *t, ppc_avr_t *a, ppc_avr_t *b, int *invalid, 2676fcf5ef2aSThomas Huth int *overflow) 2677fcf5ef2aSThomas Huth { 2678fcf5ef2aSThomas Huth int carry = 0; 2679fcf5ef2aSThomas Huth int i; 2680d03b174aSYasmin Beatriz 2681fcf5ef2aSThomas Huth for (i = 1; i <= 31; i++) { 2682fcf5ef2aSThomas Huth uint8_t digit = bcd_get_digit(a, i, invalid) - 2683fcf5ef2aSThomas Huth bcd_get_digit(b, i, invalid) + carry; 2684fcf5ef2aSThomas Huth if (digit & 0x80) { 2685fcf5ef2aSThomas Huth carry = -1; 2686fcf5ef2aSThomas Huth digit += 10; 2687fcf5ef2aSThomas Huth } else { 2688fcf5ef2aSThomas Huth carry = 0; 2689fcf5ef2aSThomas Huth } 2690fcf5ef2aSThomas Huth 2691fcf5ef2aSThomas Huth bcd_put_digit(t, digit, i); 2692fcf5ef2aSThomas Huth } 2693fcf5ef2aSThomas Huth 2694fcf5ef2aSThomas Huth *overflow = carry; 2695fcf5ef2aSThomas Huth } 2696fcf5ef2aSThomas Huth 
2697fcf5ef2aSThomas Huth uint32_t helper_bcdadd(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2698fcf5ef2aSThomas Huth { 2699fcf5ef2aSThomas Huth 2700fcf5ef2aSThomas Huth int sgna = bcd_get_sgn(a); 2701fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2702fcf5ef2aSThomas Huth int invalid = (sgna == 0) || (sgnb == 0); 2703fcf5ef2aSThomas Huth int overflow = 0; 2704fcf5ef2aSThomas Huth uint32_t cr = 0; 2705fcf5ef2aSThomas Huth ppc_avr_t result = { .u64 = { 0, 0 } }; 2706fcf5ef2aSThomas Huth 2707fcf5ef2aSThomas Huth if (!invalid) { 2708fcf5ef2aSThomas Huth if (sgna == sgnb) { 2709fcf5ef2aSThomas Huth result.u8[BCD_DIG_BYTE(0)] = bcd_preferred_sgn(sgna, ps); 2710d03b174aSYasmin Beatriz bcd_add_mag(&result, a, b, &invalid, &overflow); 2711d03b174aSYasmin Beatriz cr = bcd_cmp_zero(&result); 2712fcf5ef2aSThomas Huth } else { 2713d03b174aSYasmin Beatriz int magnitude = bcd_cmp_mag(a, b); 2714d03b174aSYasmin Beatriz if (magnitude > 0) { 2715d03b174aSYasmin Beatriz result.u8[BCD_DIG_BYTE(0)] = bcd_preferred_sgn(sgna, ps); 2716d03b174aSYasmin Beatriz bcd_sub_mag(&result, a, b, &invalid, &overflow); 2717d03b174aSYasmin Beatriz cr = (sgna > 0) ? CRF_GT : CRF_LT; 2718d03b174aSYasmin Beatriz } else if (magnitude < 0) { 2719fcf5ef2aSThomas Huth result.u8[BCD_DIG_BYTE(0)] = bcd_preferred_sgn(sgnb, ps); 2720d03b174aSYasmin Beatriz bcd_sub_mag(&result, b, a, &invalid, &overflow); 2721efa73196SNikunj A Dadhania cr = (sgnb > 0) ? 
CRF_GT : CRF_LT; 2722d03b174aSYasmin Beatriz } else { 2723d03b174aSYasmin Beatriz result.u8[BCD_DIG_BYTE(0)] = bcd_preferred_sgn(0, ps); 2724d03b174aSYasmin Beatriz cr = CRF_EQ; 2725d03b174aSYasmin Beatriz } 2726fcf5ef2aSThomas Huth } 2727fcf5ef2aSThomas Huth } 2728fcf5ef2aSThomas Huth 2729fcf5ef2aSThomas Huth if (unlikely(invalid)) { 27303c385a93SMark Cave-Ayland result.VsrD(0) = result.VsrD(1) = -1; 2731efa73196SNikunj A Dadhania cr = CRF_SO; 2732fcf5ef2aSThomas Huth } else if (overflow) { 2733efa73196SNikunj A Dadhania cr |= CRF_SO; 2734fcf5ef2aSThomas Huth } 2735fcf5ef2aSThomas Huth 2736fcf5ef2aSThomas Huth *r = result; 2737fcf5ef2aSThomas Huth 2738fcf5ef2aSThomas Huth return cr; 2739fcf5ef2aSThomas Huth } 2740fcf5ef2aSThomas Huth 2741fcf5ef2aSThomas Huth uint32_t helper_bcdsub(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2742fcf5ef2aSThomas Huth { 2743fcf5ef2aSThomas Huth ppc_avr_t bcopy = *b; 2744fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2745fcf5ef2aSThomas Huth if (sgnb < 0) { 2746fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_PLUS_PREF_1, 0); 2747fcf5ef2aSThomas Huth } else if (sgnb > 0) { 2748fcf5ef2aSThomas Huth bcd_put_digit(&bcopy, BCD_NEG_PREF, 0); 2749fcf5ef2aSThomas Huth } 2750fcf5ef2aSThomas Huth /* else invalid ... 
defer to bcdadd code for proper handling */ 2751fcf5ef2aSThomas Huth 2752fcf5ef2aSThomas Huth return helper_bcdadd(r, a, &bcopy, ps); 2753fcf5ef2aSThomas Huth } 2754fcf5ef2aSThomas Huth 2755fcf5ef2aSThomas Huth uint32_t helper_bcdcfn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2756fcf5ef2aSThomas Huth { 2757fcf5ef2aSThomas Huth int i; 2758fcf5ef2aSThomas Huth int cr = 0; 2759fcf5ef2aSThomas Huth uint16_t national = 0; 2760fcf5ef2aSThomas Huth uint16_t sgnb = get_national_digit(b, 0); 2761fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2762fcf5ef2aSThomas Huth int invalid = (sgnb != NATIONAL_PLUS && sgnb != NATIONAL_NEG); 2763fcf5ef2aSThomas Huth 2764fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2765fcf5ef2aSThomas Huth national = get_national_digit(b, i); 2766fcf5ef2aSThomas Huth if (unlikely(national < 0x30 || national > 0x39)) { 2767fcf5ef2aSThomas Huth invalid = 1; 2768fcf5ef2aSThomas Huth break; 2769fcf5ef2aSThomas Huth } 2770fcf5ef2aSThomas Huth 2771fcf5ef2aSThomas Huth bcd_put_digit(&ret, national & 0xf, i); 2772fcf5ef2aSThomas Huth } 2773fcf5ef2aSThomas Huth 2774fcf5ef2aSThomas Huth if (sgnb == NATIONAL_PLUS) { 2775fcf5ef2aSThomas Huth bcd_put_digit(&ret, (ps == 0) ? 
BCD_PLUS_PREF_1 : BCD_PLUS_PREF_2, 0); 2776fcf5ef2aSThomas Huth } else { 2777fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2778fcf5ef2aSThomas Huth } 2779fcf5ef2aSThomas Huth 2780fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2781fcf5ef2aSThomas Huth 2782fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2783efa73196SNikunj A Dadhania cr = CRF_SO; 2784fcf5ef2aSThomas Huth } 2785fcf5ef2aSThomas Huth 2786fcf5ef2aSThomas Huth *r = ret; 2787fcf5ef2aSThomas Huth 2788fcf5ef2aSThomas Huth return cr; 2789fcf5ef2aSThomas Huth } 2790fcf5ef2aSThomas Huth 2791fcf5ef2aSThomas Huth uint32_t helper_bcdctn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2792fcf5ef2aSThomas Huth { 2793fcf5ef2aSThomas Huth int i; 2794fcf5ef2aSThomas Huth int cr = 0; 2795fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2796fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2797fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2798fcf5ef2aSThomas Huth 27993c385a93SMark Cave-Ayland int ox_flag = (b->VsrD(0) != 0) || ((b->VsrD(1) >> 32) != 0); 2800fcf5ef2aSThomas Huth 2801fcf5ef2aSThomas Huth for (i = 1; i < 8; i++) { 2802fcf5ef2aSThomas Huth set_national_digit(&ret, 0x30 + bcd_get_digit(b, i, &invalid), i); 2803fcf5ef2aSThomas Huth 2804fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2805fcf5ef2aSThomas Huth break; 2806fcf5ef2aSThomas Huth } 2807fcf5ef2aSThomas Huth } 2808fcf5ef2aSThomas Huth set_national_digit(&ret, (sgnb == -1) ? 
NATIONAL_NEG : NATIONAL_PLUS, 0); 2809fcf5ef2aSThomas Huth 2810fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2811fcf5ef2aSThomas Huth 2812fcf5ef2aSThomas Huth if (ox_flag) { 2813efa73196SNikunj A Dadhania cr |= CRF_SO; 2814fcf5ef2aSThomas Huth } 2815fcf5ef2aSThomas Huth 2816fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2817efa73196SNikunj A Dadhania cr = CRF_SO; 2818fcf5ef2aSThomas Huth } 2819fcf5ef2aSThomas Huth 2820fcf5ef2aSThomas Huth *r = ret; 2821fcf5ef2aSThomas Huth 2822fcf5ef2aSThomas Huth return cr; 2823fcf5ef2aSThomas Huth } 2824fcf5ef2aSThomas Huth 2825fcf5ef2aSThomas Huth uint32_t helper_bcdcfz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2826fcf5ef2aSThomas Huth { 2827fcf5ef2aSThomas Huth int i; 2828fcf5ef2aSThomas Huth int cr = 0; 2829fcf5ef2aSThomas Huth int invalid = 0; 2830fcf5ef2aSThomas Huth int zone_digit = 0; 2831fcf5ef2aSThomas Huth int zone_lead = ps ? 0xF : 0x3; 2832fcf5ef2aSThomas Huth int digit = 0; 2833fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2834fcf5ef2aSThomas Huth int sgnb = b->u8[BCD_DIG_BYTE(0)] >> 4; 2835fcf5ef2aSThomas Huth 2836fcf5ef2aSThomas Huth if (unlikely((sgnb < 0xA) && ps)) { 2837fcf5ef2aSThomas Huth invalid = 1; 2838fcf5ef2aSThomas Huth } 2839fcf5ef2aSThomas Huth 2840fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2841365206aeSJose Ricardo Ziviani zone_digit = i ? 
b->u8[BCD_DIG_BYTE(i * 2)] >> 4 : zone_lead; 2842fcf5ef2aSThomas Huth digit = b->u8[BCD_DIG_BYTE(i * 2)] & 0xF; 2843fcf5ef2aSThomas Huth if (unlikely(zone_digit != zone_lead || digit > 0x9)) { 2844fcf5ef2aSThomas Huth invalid = 1; 2845fcf5ef2aSThomas Huth break; 2846fcf5ef2aSThomas Huth } 2847fcf5ef2aSThomas Huth 2848fcf5ef2aSThomas Huth bcd_put_digit(&ret, digit, i + 1); 2849fcf5ef2aSThomas Huth } 2850fcf5ef2aSThomas Huth 2851fcf5ef2aSThomas Huth if ((ps && (sgnb == 0xB || sgnb == 0xD)) || 2852fcf5ef2aSThomas Huth (!ps && (sgnb & 0x4))) { 2853fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_NEG_PREF, 0); 2854fcf5ef2aSThomas Huth } else { 2855fcf5ef2aSThomas Huth bcd_put_digit(&ret, BCD_PLUS_PREF_1, 0); 2856fcf5ef2aSThomas Huth } 2857fcf5ef2aSThomas Huth 2858fcf5ef2aSThomas Huth cr = bcd_cmp_zero(&ret); 2859fcf5ef2aSThomas Huth 2860fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2861efa73196SNikunj A Dadhania cr = CRF_SO; 2862fcf5ef2aSThomas Huth } 2863fcf5ef2aSThomas Huth 2864fcf5ef2aSThomas Huth *r = ret; 2865fcf5ef2aSThomas Huth 2866fcf5ef2aSThomas Huth return cr; 2867fcf5ef2aSThomas Huth } 2868fcf5ef2aSThomas Huth 2869fcf5ef2aSThomas Huth uint32_t helper_bcdctz(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2870fcf5ef2aSThomas Huth { 2871fcf5ef2aSThomas Huth int i; 2872fcf5ef2aSThomas Huth int cr = 0; 2873fcf5ef2aSThomas Huth uint8_t digit = 0; 2874fcf5ef2aSThomas Huth int sgnb = bcd_get_sgn(b); 2875fcf5ef2aSThomas Huth int zone_lead = (ps) ? 
0xF0 : 0x30; 2876fcf5ef2aSThomas Huth int invalid = (sgnb == 0); 2877fcf5ef2aSThomas Huth ppc_avr_t ret = { .u64 = { 0, 0 } }; 2878fcf5ef2aSThomas Huth 28793c385a93SMark Cave-Ayland int ox_flag = ((b->VsrD(0) >> 4) != 0); 2880fcf5ef2aSThomas Huth 2881fcf5ef2aSThomas Huth for (i = 0; i < 16; i++) { 2882fcf5ef2aSThomas Huth digit = bcd_get_digit(b, i + 1, &invalid); 2883fcf5ef2aSThomas Huth 2884fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2885fcf5ef2aSThomas Huth break; 2886fcf5ef2aSThomas Huth } 2887fcf5ef2aSThomas Huth 2888fcf5ef2aSThomas Huth ret.u8[BCD_DIG_BYTE(i * 2)] = zone_lead + digit; 2889fcf5ef2aSThomas Huth } 2890fcf5ef2aSThomas Huth 2891fcf5ef2aSThomas Huth if (ps) { 2892fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0xC : 0xD, 1); 2893fcf5ef2aSThomas Huth } else { 2894fcf5ef2aSThomas Huth bcd_put_digit(&ret, (sgnb == 1) ? 0x3 : 0x7, 1); 2895fcf5ef2aSThomas Huth } 2896fcf5ef2aSThomas Huth 2897fcf5ef2aSThomas Huth cr = bcd_cmp_zero(b); 2898fcf5ef2aSThomas Huth 2899fcf5ef2aSThomas Huth if (ox_flag) { 2900efa73196SNikunj A Dadhania cr |= CRF_SO; 2901fcf5ef2aSThomas Huth } 2902fcf5ef2aSThomas Huth 2903fcf5ef2aSThomas Huth if (unlikely(invalid)) { 2904efa73196SNikunj A Dadhania cr = CRF_SO; 2905fcf5ef2aSThomas Huth } 2906fcf5ef2aSThomas Huth 2907fcf5ef2aSThomas Huth *r = ret; 2908fcf5ef2aSThomas Huth 2909fcf5ef2aSThomas Huth return cr; 2910fcf5ef2aSThomas Huth } 2911fcf5ef2aSThomas Huth 2912a406c058SJose Ricardo Ziviani uint32_t helper_bcdcfsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2913a406c058SJose Ricardo Ziviani { 2914a406c058SJose Ricardo Ziviani int i; 2915a406c058SJose Ricardo Ziviani int cr = 0; 2916a406c058SJose Ricardo Ziviani uint64_t lo_value; 2917a406c058SJose Ricardo Ziviani uint64_t hi_value; 2918a406c058SJose Ricardo Ziviani ppc_avr_t ret = { .u64 = { 0, 0 } }; 2919a406c058SJose Ricardo Ziviani 29203c385a93SMark Cave-Ayland if (b->VsrSD(0) < 0) { 29213c385a93SMark Cave-Ayland lo_value = -b->VsrSD(1); 29223c385a93SMark Cave-Ayland 
hi_value = ~b->VsrD(0) + !lo_value; 2923a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, 0xD, 0); 2924a406c058SJose Ricardo Ziviani } else { 29253c385a93SMark Cave-Ayland lo_value = b->VsrD(1); 29263c385a93SMark Cave-Ayland hi_value = b->VsrD(0); 2927a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(0, ps), 0); 2928a406c058SJose Ricardo Ziviani } 2929a406c058SJose Ricardo Ziviani 2930a406c058SJose Ricardo Ziviani if (divu128(&lo_value, &hi_value, 1000000000000000ULL) || 2931a406c058SJose Ricardo Ziviani lo_value > 9999999999999999ULL) { 2932a406c058SJose Ricardo Ziviani cr = CRF_SO; 2933a406c058SJose Ricardo Ziviani } 2934a406c058SJose Ricardo Ziviani 2935a406c058SJose Ricardo Ziviani for (i = 1; i < 16; hi_value /= 10, i++) { 2936a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, hi_value % 10, i); 2937a406c058SJose Ricardo Ziviani } 2938a406c058SJose Ricardo Ziviani 2939a406c058SJose Ricardo Ziviani for (; i < 32; lo_value /= 10, i++) { 2940a406c058SJose Ricardo Ziviani bcd_put_digit(&ret, lo_value % 10, i); 2941a406c058SJose Ricardo Ziviani } 2942a406c058SJose Ricardo Ziviani 2943a406c058SJose Ricardo Ziviani cr |= bcd_cmp_zero(&ret); 2944a406c058SJose Ricardo Ziviani 2945a406c058SJose Ricardo Ziviani *r = ret; 2946a406c058SJose Ricardo Ziviani 2947a406c058SJose Ricardo Ziviani return cr; 2948a406c058SJose Ricardo Ziviani } 2949a406c058SJose Ricardo Ziviani 2950c85bc7ddSJose Ricardo Ziviani uint32_t helper_bcdctsq(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 2951c85bc7ddSJose Ricardo Ziviani { 2952c85bc7ddSJose Ricardo Ziviani uint8_t i; 2953c85bc7ddSJose Ricardo Ziviani int cr; 2954c85bc7ddSJose Ricardo Ziviani uint64_t carry; 2955c85bc7ddSJose Ricardo Ziviani uint64_t unused; 2956c85bc7ddSJose Ricardo Ziviani uint64_t lo_value; 2957c85bc7ddSJose Ricardo Ziviani uint64_t hi_value = 0; 2958c85bc7ddSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 2959c85bc7ddSJose Ricardo Ziviani int invalid = (sgnb == 0); 2960c85bc7ddSJose Ricardo Ziviani 
2961c85bc7ddSJose Ricardo Ziviani lo_value = bcd_get_digit(b, 31, &invalid); 2962c85bc7ddSJose Ricardo Ziviani for (i = 30; i > 0; i--) { 2963c85bc7ddSJose Ricardo Ziviani mulu64(&lo_value, &carry, lo_value, 10ULL); 2964c85bc7ddSJose Ricardo Ziviani mulu64(&hi_value, &unused, hi_value, 10ULL); 2965c85bc7ddSJose Ricardo Ziviani lo_value += bcd_get_digit(b, i, &invalid); 2966c85bc7ddSJose Ricardo Ziviani hi_value += carry; 2967c85bc7ddSJose Ricardo Ziviani 2968c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2969c85bc7ddSJose Ricardo Ziviani break; 2970c85bc7ddSJose Ricardo Ziviani } 2971c85bc7ddSJose Ricardo Ziviani } 2972c85bc7ddSJose Ricardo Ziviani 2973c85bc7ddSJose Ricardo Ziviani if (sgnb == -1) { 29743c385a93SMark Cave-Ayland r->VsrSD(1) = -lo_value; 29753c385a93SMark Cave-Ayland r->VsrSD(0) = ~hi_value + !r->VsrSD(1); 2976c85bc7ddSJose Ricardo Ziviani } else { 29773c385a93SMark Cave-Ayland r->VsrSD(1) = lo_value; 29783c385a93SMark Cave-Ayland r->VsrSD(0) = hi_value; 2979c85bc7ddSJose Ricardo Ziviani } 2980c85bc7ddSJose Ricardo Ziviani 2981c85bc7ddSJose Ricardo Ziviani cr = bcd_cmp_zero(b); 2982c85bc7ddSJose Ricardo Ziviani 2983c85bc7ddSJose Ricardo Ziviani if (unlikely(invalid)) { 2984c85bc7ddSJose Ricardo Ziviani cr = CRF_SO; 2985c85bc7ddSJose Ricardo Ziviani } 2986c85bc7ddSJose Ricardo Ziviani 2987c85bc7ddSJose Ricardo Ziviani return cr; 2988c85bc7ddSJose Ricardo Ziviani } 2989c85bc7ddSJose Ricardo Ziviani 2990c3025c3bSJose Ricardo Ziviani uint32_t helper_bcdcpsgn(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 2991c3025c3bSJose Ricardo Ziviani { 2992c3025c3bSJose Ricardo Ziviani int i; 2993c3025c3bSJose Ricardo Ziviani int invalid = 0; 2994c3025c3bSJose Ricardo Ziviani 2995c3025c3bSJose Ricardo Ziviani if (bcd_get_sgn(a) == 0 || bcd_get_sgn(b) == 0) { 2996c3025c3bSJose Ricardo Ziviani return CRF_SO; 2997c3025c3bSJose Ricardo Ziviani } 2998c3025c3bSJose Ricardo Ziviani 2999c3025c3bSJose Ricardo Ziviani *r = *a; 3000c3025c3bSJose Ricardo Ziviani 
bcd_put_digit(r, b->u8[BCD_DIG_BYTE(0)] & 0xF, 0); 3001c3025c3bSJose Ricardo Ziviani 3002c3025c3bSJose Ricardo Ziviani for (i = 1; i < 32; i++) { 3003c3025c3bSJose Ricardo Ziviani bcd_get_digit(a, i, &invalid); 3004c3025c3bSJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 3005c3025c3bSJose Ricardo Ziviani if (unlikely(invalid)) { 3006c3025c3bSJose Ricardo Ziviani return CRF_SO; 3007c3025c3bSJose Ricardo Ziviani } 3008c3025c3bSJose Ricardo Ziviani } 3009c3025c3bSJose Ricardo Ziviani 3010c3025c3bSJose Ricardo Ziviani return bcd_cmp_zero(r); 3011c3025c3bSJose Ricardo Ziviani } 3012c3025c3bSJose Ricardo Ziviani 3013466a3f9cSJose Ricardo Ziviani uint32_t helper_bcdsetsgn(ppc_avr_t *r, ppc_avr_t *b, uint32_t ps) 3014466a3f9cSJose Ricardo Ziviani { 3015466a3f9cSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 3016466a3f9cSJose Ricardo Ziviani 3017466a3f9cSJose Ricardo Ziviani *r = *b; 3018466a3f9cSJose Ricardo Ziviani bcd_put_digit(r, bcd_preferred_sgn(sgnb, ps), 0); 3019466a3f9cSJose Ricardo Ziviani 3020071663dfSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 3021466a3f9cSJose Ricardo Ziviani return CRF_SO; 3022466a3f9cSJose Ricardo Ziviani } 3023466a3f9cSJose Ricardo Ziviani 3024466a3f9cSJose Ricardo Ziviani return bcd_cmp_zero(r); 3025466a3f9cSJose Ricardo Ziviani } 3026466a3f9cSJose Ricardo Ziviani 3027e04797f7SJose Ricardo Ziviani uint32_t helper_bcds(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 3028e04797f7SJose Ricardo Ziviani { 3029e04797f7SJose Ricardo Ziviani int cr; 3030e04797f7SJose Ricardo Ziviani #if defined(HOST_WORDS_BIGENDIAN) 3031e04797f7SJose Ricardo Ziviani int i = a->s8[7]; 3032e04797f7SJose Ricardo Ziviani #else 3033e04797f7SJose Ricardo Ziviani int i = a->s8[8]; 3034e04797f7SJose Ricardo Ziviani #endif 3035e04797f7SJose Ricardo Ziviani bool ox_flag = false; 3036e04797f7SJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 3037e04797f7SJose Ricardo Ziviani ppc_avr_t ret = *b; 30383c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 
3039e04797f7SJose Ricardo Ziviani 3040e04797f7SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 3041e04797f7SJose Ricardo Ziviani return CRF_SO; 3042e04797f7SJose Ricardo Ziviani } 3043e04797f7SJose Ricardo Ziviani 3044e04797f7SJose Ricardo Ziviani if (unlikely(i > 31)) { 3045e04797f7SJose Ricardo Ziviani i = 31; 3046e04797f7SJose Ricardo Ziviani } else if (unlikely(i < -31)) { 3047e04797f7SJose Ricardo Ziviani i = -31; 3048e04797f7SJose Ricardo Ziviani } 3049e04797f7SJose Ricardo Ziviani 3050e04797f7SJose Ricardo Ziviani if (i > 0) { 30513c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 3052e04797f7SJose Ricardo Ziviani } else { 30533c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 3054e04797f7SJose Ricardo Ziviani } 3055e04797f7SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 3056e04797f7SJose Ricardo Ziviani 3057e04797f7SJose Ricardo Ziviani *r = ret; 3058e04797f7SJose Ricardo Ziviani 3059e04797f7SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 3060e04797f7SJose Ricardo Ziviani if (ox_flag) { 3061e04797f7SJose Ricardo Ziviani cr |= CRF_SO; 3062e04797f7SJose Ricardo Ziviani } 3063e04797f7SJose Ricardo Ziviani 3064e04797f7SJose Ricardo Ziviani return cr; 3065e04797f7SJose Ricardo Ziviani } 3066e04797f7SJose Ricardo Ziviani 3067a49a95e9SJose Ricardo Ziviani uint32_t helper_bcdus(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 3068a49a95e9SJose Ricardo Ziviani { 3069a49a95e9SJose Ricardo Ziviani int cr; 3070a49a95e9SJose Ricardo Ziviani int i; 3071a49a95e9SJose Ricardo Ziviani int invalid = 0; 3072a49a95e9SJose Ricardo Ziviani bool ox_flag = false; 3073a49a95e9SJose Ricardo Ziviani ppc_avr_t ret = *b; 3074a49a95e9SJose Ricardo Ziviani 3075a49a95e9SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 3076a49a95e9SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 3077a49a95e9SJose Ricardo Ziviani 3078a49a95e9SJose Ricardo Ziviani if (unlikely(invalid)) { 3079a49a95e9SJose Ricardo Ziviani 
return CRF_SO; 3080a49a95e9SJose Ricardo Ziviani } 3081a49a95e9SJose Ricardo Ziviani } 3082a49a95e9SJose Ricardo Ziviani 3083a49a95e9SJose Ricardo Ziviani #if defined(HOST_WORDS_BIGENDIAN) 3084a49a95e9SJose Ricardo Ziviani i = a->s8[7]; 3085a49a95e9SJose Ricardo Ziviani #else 3086a49a95e9SJose Ricardo Ziviani i = a->s8[8]; 3087a49a95e9SJose Ricardo Ziviani #endif 3088a49a95e9SJose Ricardo Ziviani if (i >= 32) { 3089a49a95e9SJose Ricardo Ziviani ox_flag = true; 30903c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 3091a49a95e9SJose Ricardo Ziviani } else if (i <= -32) { 30923c385a93SMark Cave-Ayland ret.VsrD(1) = ret.VsrD(0) = 0; 3093a49a95e9SJose Ricardo Ziviani } else if (i > 0) { 30943c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 3095a49a95e9SJose Ricardo Ziviani } else { 30963c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 3097a49a95e9SJose Ricardo Ziviani } 3098a49a95e9SJose Ricardo Ziviani *r = ret; 3099a49a95e9SJose Ricardo Ziviani 3100a49a95e9SJose Ricardo Ziviani cr = bcd_cmp_zero(r); 3101a49a95e9SJose Ricardo Ziviani if (ox_flag) { 3102a49a95e9SJose Ricardo Ziviani cr |= CRF_SO; 3103a49a95e9SJose Ricardo Ziviani } 3104a49a95e9SJose Ricardo Ziviani 3105a49a95e9SJose Ricardo Ziviani return cr; 3106a49a95e9SJose Ricardo Ziviani } 3107a49a95e9SJose Ricardo Ziviani 3108a54238adSJose Ricardo Ziviani uint32_t helper_bcdsr(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 3109a54238adSJose Ricardo Ziviani { 3110a54238adSJose Ricardo Ziviani int cr; 3111a54238adSJose Ricardo Ziviani int unused = 0; 3112a54238adSJose Ricardo Ziviani int invalid = 0; 3113a54238adSJose Ricardo Ziviani bool ox_flag = false; 3114a54238adSJose Ricardo Ziviani int sgnb = bcd_get_sgn(b); 3115a54238adSJose Ricardo Ziviani ppc_avr_t ret = *b; 31163c385a93SMark Cave-Ayland ret.VsrD(1) &= ~0xf; 3117a54238adSJose Ricardo Ziviani 3118a54238adSJose Ricardo Ziviani #if defined(HOST_WORDS_BIGENDIAN) 3119a54238adSJose Ricardo Ziviani 
int i = a->s8[7]; 3120a54238adSJose Ricardo Ziviani ppc_avr_t bcd_one = { .u64 = { 0, 0x10 } }; 3121a54238adSJose Ricardo Ziviani #else 3122a54238adSJose Ricardo Ziviani int i = a->s8[8]; 3123a54238adSJose Ricardo Ziviani ppc_avr_t bcd_one = { .u64 = { 0x10, 0 } }; 3124a54238adSJose Ricardo Ziviani #endif 3125a54238adSJose Ricardo Ziviani 3126a54238adSJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 3127a54238adSJose Ricardo Ziviani return CRF_SO; 3128a54238adSJose Ricardo Ziviani } 3129a54238adSJose Ricardo Ziviani 3130a54238adSJose Ricardo Ziviani if (unlikely(i > 31)) { 3131a54238adSJose Ricardo Ziviani i = 31; 3132a54238adSJose Ricardo Ziviani } else if (unlikely(i < -31)) { 3133a54238adSJose Ricardo Ziviani i = -31; 3134a54238adSJose Ricardo Ziviani } 3135a54238adSJose Ricardo Ziviani 3136a54238adSJose Ricardo Ziviani if (i > 0) { 31373c385a93SMark Cave-Ayland ulshift(&ret.VsrD(1), &ret.VsrD(0), i * 4, &ox_flag); 3138a54238adSJose Ricardo Ziviani } else { 31393c385a93SMark Cave-Ayland urshift(&ret.VsrD(1), &ret.VsrD(0), -i * 4); 3140a54238adSJose Ricardo Ziviani 3141a54238adSJose Ricardo Ziviani if (bcd_get_digit(&ret, 0, &invalid) >= 5) { 3142a54238adSJose Ricardo Ziviani bcd_add_mag(&ret, &ret, &bcd_one, &invalid, &unused); 3143a54238adSJose Ricardo Ziviani } 3144a54238adSJose Ricardo Ziviani } 3145a54238adSJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(sgnb, ps), 0); 3146a54238adSJose Ricardo Ziviani 3147a54238adSJose Ricardo Ziviani cr = bcd_cmp_zero(&ret); 3148a54238adSJose Ricardo Ziviani if (ox_flag) { 3149a54238adSJose Ricardo Ziviani cr |= CRF_SO; 3150a54238adSJose Ricardo Ziviani } 3151a54238adSJose Ricardo Ziviani *r = ret; 3152a54238adSJose Ricardo Ziviani 3153a54238adSJose Ricardo Ziviani return cr; 3154a54238adSJose Ricardo Ziviani } 3155a54238adSJose Ricardo Ziviani 315631bc4d11SJose Ricardo Ziviani uint32_t helper_bcdtrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 315731bc4d11SJose Ricardo Ziviani { 
315831bc4d11SJose Ricardo Ziviani uint64_t mask; 315931bc4d11SJose Ricardo Ziviani uint32_t ox_flag = 0; 316031bc4d11SJose Ricardo Ziviani #if defined(HOST_WORDS_BIGENDIAN) 316131bc4d11SJose Ricardo Ziviani int i = a->s16[3] + 1; 316231bc4d11SJose Ricardo Ziviani #else 316331bc4d11SJose Ricardo Ziviani int i = a->s16[4] + 1; 316431bc4d11SJose Ricardo Ziviani #endif 316531bc4d11SJose Ricardo Ziviani ppc_avr_t ret = *b; 316631bc4d11SJose Ricardo Ziviani 316731bc4d11SJose Ricardo Ziviani if (bcd_is_valid(b) == false) { 316831bc4d11SJose Ricardo Ziviani return CRF_SO; 316931bc4d11SJose Ricardo Ziviani } 317031bc4d11SJose Ricardo Ziviani 317131bc4d11SJose Ricardo Ziviani if (i > 16 && i < 32) { 317231bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 31733c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 317431bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 317531bc4d11SJose Ricardo Ziviani } 317631bc4d11SJose Ricardo Ziviani 31773c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 317831bc4d11SJose Ricardo Ziviani } else if (i >= 0 && i <= 16) { 317931bc4d11SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 31803c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 318131bc4d11SJose Ricardo Ziviani ox_flag = CRF_SO; 318231bc4d11SJose Ricardo Ziviani } 318331bc4d11SJose Ricardo Ziviani 31843c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 31853c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 318631bc4d11SJose Ricardo Ziviani } 318731bc4d11SJose Ricardo Ziviani bcd_put_digit(&ret, bcd_preferred_sgn(bcd_get_sgn(b), ps), 0); 318831bc4d11SJose Ricardo Ziviani *r = ret; 318931bc4d11SJose Ricardo Ziviani 319031bc4d11SJose Ricardo Ziviani return bcd_cmp_zero(&ret) | ox_flag; 319131bc4d11SJose Ricardo Ziviani } 319231bc4d11SJose Ricardo Ziviani 31935c32e2e4SJose Ricardo Ziviani uint32_t helper_bcdutrunc(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, uint32_t ps) 31945c32e2e4SJose Ricardo Ziviani { 31955c32e2e4SJose Ricardo Ziviani int i; 31965c32e2e4SJose 
Ricardo Ziviani uint64_t mask; 31975c32e2e4SJose Ricardo Ziviani uint32_t ox_flag = 0; 31985c32e2e4SJose Ricardo Ziviani int invalid = 0; 31995c32e2e4SJose Ricardo Ziviani ppc_avr_t ret = *b; 32005c32e2e4SJose Ricardo Ziviani 32015c32e2e4SJose Ricardo Ziviani for (i = 0; i < 32; i++) { 32025c32e2e4SJose Ricardo Ziviani bcd_get_digit(b, i, &invalid); 32035c32e2e4SJose Ricardo Ziviani 32045c32e2e4SJose Ricardo Ziviani if (unlikely(invalid)) { 32055c32e2e4SJose Ricardo Ziviani return CRF_SO; 32065c32e2e4SJose Ricardo Ziviani } 32075c32e2e4SJose Ricardo Ziviani } 32085c32e2e4SJose Ricardo Ziviani 32095c32e2e4SJose Ricardo Ziviani #if defined(HOST_WORDS_BIGENDIAN) 32105c32e2e4SJose Ricardo Ziviani i = a->s16[3]; 32115c32e2e4SJose Ricardo Ziviani #else 32125c32e2e4SJose Ricardo Ziviani i = a->s16[4]; 32135c32e2e4SJose Ricardo Ziviani #endif 32145c32e2e4SJose Ricardo Ziviani if (i > 16 && i < 33) { 32155c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (128 - i * 4); 32163c385a93SMark Cave-Ayland if (ret.VsrD(0) & ~mask) { 32175c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 32185c32e2e4SJose Ricardo Ziviani } 32195c32e2e4SJose Ricardo Ziviani 32203c385a93SMark Cave-Ayland ret.VsrD(0) &= mask; 32215c32e2e4SJose Ricardo Ziviani } else if (i > 0 && i <= 16) { 32225c32e2e4SJose Ricardo Ziviani mask = (uint64_t)-1 >> (64 - i * 4); 32233c385a93SMark Cave-Ayland if (ret.VsrD(0) || (ret.VsrD(1) & ~mask)) { 32245c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 32255c32e2e4SJose Ricardo Ziviani } 32265c32e2e4SJose Ricardo Ziviani 32273c385a93SMark Cave-Ayland ret.VsrD(1) &= mask; 32283c385a93SMark Cave-Ayland ret.VsrD(0) = 0; 32295c32e2e4SJose Ricardo Ziviani } else if (i == 0) { 32303c385a93SMark Cave-Ayland if (ret.VsrD(0) || ret.VsrD(1)) { 32315c32e2e4SJose Ricardo Ziviani ox_flag = CRF_SO; 32325c32e2e4SJose Ricardo Ziviani } 32333c385a93SMark Cave-Ayland ret.VsrD(0) = ret.VsrD(1) = 0; 32345c32e2e4SJose Ricardo Ziviani } 32355c32e2e4SJose Ricardo Ziviani 32365c32e2e4SJose 
Ricardo Ziviani *r = ret; 32373c385a93SMark Cave-Ayland if (r->VsrD(0) == 0 && r->VsrD(1) == 0) { 32385c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_EQ; 32395c32e2e4SJose Ricardo Ziviani } 32405c32e2e4SJose Ricardo Ziviani 32415c32e2e4SJose Ricardo Ziviani return ox_flag | CRF_GT; 32425c32e2e4SJose Ricardo Ziviani } 32435c32e2e4SJose Ricardo Ziviani 3244fcf5ef2aSThomas Huth void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a) 3245fcf5ef2aSThomas Huth { 3246fcf5ef2aSThomas Huth int i; 3247fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 3248fcf5ef2aSThomas Huth r->u8[i] = AES_sbox[a->u8[i]]; 3249fcf5ef2aSThomas Huth } 3250fcf5ef2aSThomas Huth } 3251fcf5ef2aSThomas Huth 3252fcf5ef2aSThomas Huth void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 3253fcf5ef2aSThomas Huth { 3254fcf5ef2aSThomas Huth ppc_avr_t result; 3255fcf5ef2aSThomas Huth int i; 3256fcf5ef2aSThomas Huth 3257fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 32582dea57dbSMark Cave-Ayland result.VsrW(i) = b->VsrW(i) ^ 32592dea57dbSMark Cave-Ayland (AES_Te0[a->VsrB(AES_shifts[4 * i + 0])] ^ 32602dea57dbSMark Cave-Ayland AES_Te1[a->VsrB(AES_shifts[4 * i + 1])] ^ 32612dea57dbSMark Cave-Ayland AES_Te2[a->VsrB(AES_shifts[4 * i + 2])] ^ 32622dea57dbSMark Cave-Ayland AES_Te3[a->VsrB(AES_shifts[4 * i + 3])]); 3263fcf5ef2aSThomas Huth } 3264fcf5ef2aSThomas Huth *r = result; 3265fcf5ef2aSThomas Huth } 3266fcf5ef2aSThomas Huth 3267fcf5ef2aSThomas Huth void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 3268fcf5ef2aSThomas Huth { 3269fcf5ef2aSThomas Huth ppc_avr_t result; 3270fcf5ef2aSThomas Huth int i; 3271fcf5ef2aSThomas Huth 3272fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 32732dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_sbox[a->VsrB(AES_shifts[i])]); 3274fcf5ef2aSThomas Huth } 3275fcf5ef2aSThomas Huth *r = result; 3276fcf5ef2aSThomas Huth } 3277fcf5ef2aSThomas Huth 3278fcf5ef2aSThomas Huth void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 
3279fcf5ef2aSThomas Huth { 3280fcf5ef2aSThomas Huth /* This differs from what is written in ISA V2.07. The RTL is */ 3281fcf5ef2aSThomas Huth /* incorrect and will be fixed in V2.07B. */ 3282fcf5ef2aSThomas Huth int i; 3283fcf5ef2aSThomas Huth ppc_avr_t tmp; 3284fcf5ef2aSThomas Huth 3285fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 32862dea57dbSMark Cave-Ayland tmp.VsrB(i) = b->VsrB(i) ^ AES_isbox[a->VsrB(AES_ishifts[i])]; 3287fcf5ef2aSThomas Huth } 3288fcf5ef2aSThomas Huth 3289fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u32) { 32902dea57dbSMark Cave-Ayland r->VsrW(i) = 32912dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 0)][0] ^ 32922dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 1)][1] ^ 32932dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 2)][2] ^ 32942dea57dbSMark Cave-Ayland AES_imc[tmp.VsrB(4 * i + 3)][3]; 3295fcf5ef2aSThomas Huth } 3296fcf5ef2aSThomas Huth } 3297fcf5ef2aSThomas Huth 3298fcf5ef2aSThomas Huth void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b) 3299fcf5ef2aSThomas Huth { 3300fcf5ef2aSThomas Huth ppc_avr_t result; 3301fcf5ef2aSThomas Huth int i; 3302fcf5ef2aSThomas Huth 3303fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 33042dea57dbSMark Cave-Ayland result.VsrB(i) = b->VsrB(i) ^ (AES_isbox[a->VsrB(AES_ishifts[i])]); 3305fcf5ef2aSThomas Huth } 3306fcf5ef2aSThomas Huth *r = result; 3307fcf5ef2aSThomas Huth } 3308fcf5ef2aSThomas Huth 3309fcf5ef2aSThomas Huth #define ROTRu32(v, n) (((v) >> (n)) | ((v) << (32 - n))) 3310fcf5ef2aSThomas Huth 3311fcf5ef2aSThomas Huth void helper_vshasigmaw(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 3312fcf5ef2aSThomas Huth { 3313fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 3314fcf5ef2aSThomas Huth int six = st_six & 0xF; 3315fcf5ef2aSThomas Huth int i; 3316fcf5ef2aSThomas Huth 3317*730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u32); i++) { 3318fcf5ef2aSThomas Huth if (st == 0) { 3319fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 3320*730d2ca3SMark Cave-Ayland 
r->VsrW(i) = ROTRu32(a->VsrW(i), 7) ^ 3321*730d2ca3SMark Cave-Ayland ROTRu32(a->VsrW(i), 18) ^ 3322*730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 3); 3323fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 3324*730d2ca3SMark Cave-Ayland r->VsrW(i) = ROTRu32(a->VsrW(i), 17) ^ 3325*730d2ca3SMark Cave-Ayland ROTRu32(a->VsrW(i), 19) ^ 3326*730d2ca3SMark Cave-Ayland (a->VsrW(i) >> 10); 3327fcf5ef2aSThomas Huth } 3328fcf5ef2aSThomas Huth } else { /* st == 1 */ 3329fcf5ef2aSThomas Huth if ((six & (0x8 >> i)) == 0) { 3330*730d2ca3SMark Cave-Ayland r->VsrW(i) = ROTRu32(a->VsrW(i), 2) ^ 3331*730d2ca3SMark Cave-Ayland ROTRu32(a->VsrW(i), 13) ^ 3332*730d2ca3SMark Cave-Ayland ROTRu32(a->VsrW(i), 22); 3333fcf5ef2aSThomas Huth } else { /* six.bit[i] == 1 */ 3334*730d2ca3SMark Cave-Ayland r->VsrW(i) = ROTRu32(a->VsrW(i), 6) ^ 3335*730d2ca3SMark Cave-Ayland ROTRu32(a->VsrW(i), 11) ^ 3336*730d2ca3SMark Cave-Ayland ROTRu32(a->VsrW(i), 25); 3337fcf5ef2aSThomas Huth } 3338fcf5ef2aSThomas Huth } 3339fcf5ef2aSThomas Huth } 3340fcf5ef2aSThomas Huth } 3341fcf5ef2aSThomas Huth 3342fcf5ef2aSThomas Huth #undef ROTRu32 3343fcf5ef2aSThomas Huth 3344fcf5ef2aSThomas Huth #define ROTRu64(v, n) (((v) >> (n)) | ((v) << (64-n))) 3345fcf5ef2aSThomas Huth 3346fcf5ef2aSThomas Huth void helper_vshasigmad(ppc_avr_t *r, ppc_avr_t *a, uint32_t st_six) 3347fcf5ef2aSThomas Huth { 3348fcf5ef2aSThomas Huth int st = (st_six & 0x10) != 0; 3349fcf5ef2aSThomas Huth int six = st_six & 0xF; 3350fcf5ef2aSThomas Huth int i; 3351fcf5ef2aSThomas Huth 3352*730d2ca3SMark Cave-Ayland for (i = 0; i < ARRAY_SIZE(r->u64); i++) { 3353fcf5ef2aSThomas Huth if (st == 0) { 3354fcf5ef2aSThomas Huth if ((six & (0x8 >> (2*i))) == 0) { 3355*730d2ca3SMark Cave-Ayland r->VsrD(i) = ROTRu64(a->VsrD(i), 1) ^ 3356*730d2ca3SMark Cave-Ayland ROTRu64(a->VsrD(i), 8) ^ 3357*730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 7); 3358fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 3359*730d2ca3SMark Cave-Ayland r->VsrD(i) = ROTRu64(a->VsrD(i), 19) ^ 
3360*730d2ca3SMark Cave-Ayland ROTRu64(a->VsrD(i), 61) ^ 3361*730d2ca3SMark Cave-Ayland (a->VsrD(i) >> 6); 3362fcf5ef2aSThomas Huth } 3363fcf5ef2aSThomas Huth } else { /* st == 1 */ 3364fcf5ef2aSThomas Huth if ((six & (0x8 >> (2*i))) == 0) { 3365*730d2ca3SMark Cave-Ayland r->VsrD(i) = ROTRu64(a->VsrD(i), 28) ^ 3366*730d2ca3SMark Cave-Ayland ROTRu64(a->VsrD(i), 34) ^ 3367*730d2ca3SMark Cave-Ayland ROTRu64(a->VsrD(i), 39); 3368fcf5ef2aSThomas Huth } else { /* six.bit[2*i] == 1 */ 3369*730d2ca3SMark Cave-Ayland r->VsrD(i) = ROTRu64(a->VsrD(i), 14) ^ 3370*730d2ca3SMark Cave-Ayland ROTRu64(a->VsrD(i), 18) ^ 3371*730d2ca3SMark Cave-Ayland ROTRu64(a->VsrD(i), 41); 3372fcf5ef2aSThomas Huth } 3373fcf5ef2aSThomas Huth } 3374fcf5ef2aSThomas Huth } 3375fcf5ef2aSThomas Huth } 3376fcf5ef2aSThomas Huth 3377fcf5ef2aSThomas Huth #undef ROTRu64 3378fcf5ef2aSThomas Huth 3379fcf5ef2aSThomas Huth void helper_vpermxor(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c) 3380fcf5ef2aSThomas Huth { 3381fcf5ef2aSThomas Huth ppc_avr_t result; 3382fcf5ef2aSThomas Huth int i; 3383fcf5ef2aSThomas Huth 3384fcf5ef2aSThomas Huth VECTOR_FOR_INORDER_I(i, u8) { 3385fcf5ef2aSThomas Huth int indexA = c->u8[i] >> 4; 3386fcf5ef2aSThomas Huth int indexB = c->u8[i] & 0xF; 3387fcf5ef2aSThomas Huth #if defined(HOST_WORDS_BIGENDIAN) 3388fcf5ef2aSThomas Huth result.u8[i] = a->u8[indexA] ^ b->u8[indexB]; 3389fcf5ef2aSThomas Huth #else 3390fcf5ef2aSThomas Huth result.u8[i] = a->u8[15-indexA] ^ b->u8[15-indexB]; 3391fcf5ef2aSThomas Huth #endif 3392fcf5ef2aSThomas Huth } 3393fcf5ef2aSThomas Huth *r = result; 3394fcf5ef2aSThomas Huth } 3395fcf5ef2aSThomas Huth 3396fcf5ef2aSThomas Huth #undef VECTOR_FOR_INORDER_I 3397fcf5ef2aSThomas Huth 3398fcf5ef2aSThomas Huth /*****************************************************************************/ 3399fcf5ef2aSThomas Huth /* SPE extension helpers */ 3400fcf5ef2aSThomas Huth /* Use a table to make this quicker */ 3401fcf5ef2aSThomas Huth static const uint8_t hbrev[16] = 
{ 3402fcf5ef2aSThomas Huth 0x0, 0x8, 0x4, 0xC, 0x2, 0xA, 0x6, 0xE, 3403fcf5ef2aSThomas Huth 0x1, 0x9, 0x5, 0xD, 0x3, 0xB, 0x7, 0xF, 3404fcf5ef2aSThomas Huth }; 3405fcf5ef2aSThomas Huth 3406fcf5ef2aSThomas Huth static inline uint8_t byte_reverse(uint8_t val) 3407fcf5ef2aSThomas Huth { 3408fcf5ef2aSThomas Huth return hbrev[val >> 4] | (hbrev[val & 0xF] << 4); 3409fcf5ef2aSThomas Huth } 3410fcf5ef2aSThomas Huth 3411fcf5ef2aSThomas Huth static inline uint32_t word_reverse(uint32_t val) 3412fcf5ef2aSThomas Huth { 3413fcf5ef2aSThomas Huth return byte_reverse(val >> 24) | (byte_reverse(val >> 16) << 8) | 3414fcf5ef2aSThomas Huth (byte_reverse(val >> 8) << 16) | (byte_reverse(val) << 24); 3415fcf5ef2aSThomas Huth } 3416fcf5ef2aSThomas Huth 3417fcf5ef2aSThomas Huth #define MASKBITS 16 /* Random value - to be fixed (implementation dependent) */ 3418fcf5ef2aSThomas Huth target_ulong helper_brinc(target_ulong arg1, target_ulong arg2) 3419fcf5ef2aSThomas Huth { 3420fcf5ef2aSThomas Huth uint32_t a, b, d, mask; 3421fcf5ef2aSThomas Huth 3422fcf5ef2aSThomas Huth mask = UINT32_MAX >> (32 - MASKBITS); 3423fcf5ef2aSThomas Huth a = arg1 & mask; 3424fcf5ef2aSThomas Huth b = arg2 & mask; 3425fcf5ef2aSThomas Huth d = word_reverse(1 + word_reverse(a | ~b)); 3426fcf5ef2aSThomas Huth return (arg1 & ~mask) | (d & b); 3427fcf5ef2aSThomas Huth } 3428fcf5ef2aSThomas Huth 3429fcf5ef2aSThomas Huth uint32_t helper_cntlsw32(uint32_t val) 3430fcf5ef2aSThomas Huth { 3431fcf5ef2aSThomas Huth if (val & 0x80000000) { 3432fcf5ef2aSThomas Huth return clz32(~val); 3433fcf5ef2aSThomas Huth } else { 3434fcf5ef2aSThomas Huth return clz32(val); 3435fcf5ef2aSThomas Huth } 3436fcf5ef2aSThomas Huth } 3437fcf5ef2aSThomas Huth 3438fcf5ef2aSThomas Huth uint32_t helper_cntlzw32(uint32_t val) 3439fcf5ef2aSThomas Huth { 3440fcf5ef2aSThomas Huth return clz32(val); 3441fcf5ef2aSThomas Huth } 3442fcf5ef2aSThomas Huth 3443fcf5ef2aSThomas Huth /* 440 specific */ 3444fcf5ef2aSThomas Huth target_ulong helper_dlmzb(CPUPPCState 
*env, target_ulong high, 3445fcf5ef2aSThomas Huth target_ulong low, uint32_t update_Rc) 3446fcf5ef2aSThomas Huth { 3447fcf5ef2aSThomas Huth target_ulong mask; 3448fcf5ef2aSThomas Huth int i; 3449fcf5ef2aSThomas Huth 3450fcf5ef2aSThomas Huth i = 1; 3451fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3452fcf5ef2aSThomas Huth if ((high & mask) == 0) { 3453fcf5ef2aSThomas Huth if (update_Rc) { 3454fcf5ef2aSThomas Huth env->crf[0] = 0x4; 3455fcf5ef2aSThomas Huth } 3456fcf5ef2aSThomas Huth goto done; 3457fcf5ef2aSThomas Huth } 3458fcf5ef2aSThomas Huth i++; 3459fcf5ef2aSThomas Huth } 3460fcf5ef2aSThomas Huth for (mask = 0xFF000000; mask != 0; mask = mask >> 8) { 3461fcf5ef2aSThomas Huth if ((low & mask) == 0) { 3462fcf5ef2aSThomas Huth if (update_Rc) { 3463fcf5ef2aSThomas Huth env->crf[0] = 0x8; 3464fcf5ef2aSThomas Huth } 3465fcf5ef2aSThomas Huth goto done; 3466fcf5ef2aSThomas Huth } 3467fcf5ef2aSThomas Huth i++; 3468fcf5ef2aSThomas Huth } 3469fcf5ef2aSThomas Huth i = 8; 3470fcf5ef2aSThomas Huth if (update_Rc) { 3471fcf5ef2aSThomas Huth env->crf[0] = 0x2; 3472fcf5ef2aSThomas Huth } 3473fcf5ef2aSThomas Huth done: 3474fcf5ef2aSThomas Huth env->xer = (env->xer & ~0x7F) | i; 3475fcf5ef2aSThomas Huth if (update_Rc) { 3476fcf5ef2aSThomas Huth env->crf[0] |= xer_so; 3477fcf5ef2aSThomas Huth } 3478fcf5ef2aSThomas Huth return i; 3479fcf5ef2aSThomas Huth } 3480