/* * RISC-V translation routines for the RV64M Standard Extension. * * Copyright (c) 2016-2017 Sagar Karandikar, sagark@eecs.berkeley.edu * Copyright (c) 2018 Peer Adelt, peer.adelt@hni.uni-paderborn.de * Bastian Koppelmann, kbastian@mail.uni-paderborn.de * * This program is free software; you can redistribute it and/or modify it * under the terms and conditions of the GNU General Public License, * version 2 or later, as published by the Free Software Foundation. * * This program is distributed in the hope it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for * more details. * * You should have received a copy of the GNU General Public License along with * this program. If not, see . */ #define REQUIRE_M_OR_ZMMUL(ctx) do { \ if (!ctx->cfg_ptr->ext_zmmul && !has_ext(ctx, RVM)) { \ return false; \ } \ } while (0) static void gen_mulhu_i128(TCGv r2, TCGv r3, TCGv al, TCGv ah, TCGv bl, TCGv bh) { TCGv tmpl = tcg_temp_new(); TCGv tmph = tcg_temp_new(); TCGv r0 = tcg_temp_new(); TCGv r1 = tcg_temp_new(); TCGv zero = tcg_constant_tl(0); tcg_gen_mulu2_tl(r0, r1, al, bl); tcg_gen_mulu2_tl(tmpl, tmph, al, bh); tcg_gen_add2_tl(r1, r2, r1, zero, tmpl, tmph); tcg_gen_mulu2_tl(tmpl, tmph, ah, bl); tcg_gen_add2_tl(r1, tmph, r1, r2, tmpl, tmph); /* Overflow detection into r3 */ tcg_gen_setcond_tl(TCG_COND_LTU, r3, tmph, r2); tcg_gen_mov_tl(r2, tmph); tcg_gen_mulu2_tl(tmpl, tmph, ah, bh); tcg_gen_add2_tl(r2, r3, r2, r3, tmpl, tmph); } static void gen_mul_i128(TCGv rl, TCGv rh, TCGv rs1l, TCGv rs1h, TCGv rs2l, TCGv rs2h) { TCGv tmpl = tcg_temp_new(); TCGv tmph = tcg_temp_new(); TCGv tmpx = tcg_temp_new(); TCGv zero = tcg_constant_tl(0); tcg_gen_mulu2_tl(rl, rh, rs1l, rs2l); tcg_gen_mulu2_tl(tmpl, tmph, rs1l, rs2h); tcg_gen_add2_tl(rh, tmpx, rh, zero, tmpl, tmph); tcg_gen_mulu2_tl(tmpl, tmph, rs1h, rs2l); tcg_gen_add2_tl(rh, tmph, rh, tmpx, tmpl, tmph); } static bool trans_mul(DisasContext *ctx, arg_mul *a) { REQUIRE_M_OR_ZMMUL(ctx); return gen_arith(ctx, a, EXT_NONE, tcg_gen_mul_tl, gen_mul_i128); } static void gen_mulh_i128(TCGv rl, TCGv rh, TCGv rs1l, TCGv rs1h, TCGv rs2l, TCGv rs2h) { TCGv t0l = tcg_temp_new(); TCGv t0h = tcg_temp_new(); TCGv t1l = tcg_temp_new(); TCGv t1h = tcg_temp_new(); gen_mulhu_i128(rl, rh, rs1l, rs1h, rs2l, rs2h); tcg_gen_sari_tl(t0h, rs1h, 63); tcg_gen_and_tl(t0l, t0h, rs2l); tcg_gen_and_tl(t0h, t0h, rs2h); tcg_gen_sari_tl(t1h, rs2h, 63); tcg_gen_and_tl(t1l, t1h, rs1l); tcg_gen_and_tl(t1h, t1h, rs1h); tcg_gen_sub2_tl(t0l, t0h, rl, rh, t0l, t0h); tcg_gen_sub2_tl(rl, rh, t0l, t0h, t1l, t1h); } static void gen_mulh(TCGv ret, TCGv s1, TCGv s2) { TCGv discard = tcg_temp_new(); tcg_gen_muls2_tl(discard, ret, s1, s2); } static void gen_mulh_w(TCGv ret, TCGv s1, TCGv s2) { tcg_gen_mul_tl(ret, s1, s2); tcg_gen_sari_tl(ret, ret, 32); } static bool trans_mulh(DisasContext *ctx, arg_mulh *a) { REQUIRE_M_OR_ZMMUL(ctx); return gen_arith_per_ol(ctx, a, EXT_SIGN, gen_mulh, gen_mulh_w, gen_mulh_i128); } static void gen_mulhsu_i128(TCGv rl, TCGv rh, TCGv rs1l, TCGv rs1h, TCGv rs2l, TCGv rs2h) { TCGv t0l = tcg_temp_new(); TCGv t0h = tcg_temp_new(); gen_mulhu_i128(rl, rh, rs1l, rs1h, rs2l, rs2h); tcg_gen_sari_tl(t0h, rs1h, 63); tcg_gen_and_tl(t0l, t0h, rs2l); tcg_gen_and_tl(t0h, t0h, rs2h); tcg_gen_sub2_tl(rl, rh, rl, rh, t0l, t0h); } static void gen_mulhsu(TCGv ret, TCGv arg1, TCGv arg2) { TCGv rl = tcg_temp_new(); TCGv rh = tcg_temp_new(); tcg_gen_mulu2_tl(rl, rh, arg1, arg2); /* fix up for one negative */ tcg_gen_sari_tl(rl, arg1, TARGET_LONG_BITS - 1); tcg_gen_and_tl(rl, rl, arg2); tcg_gen_sub_tl(ret, rh, rl); } static void gen_mulhsu_w(TCGv ret, TCGv arg1, TCGv arg2) { TCGv t1 = tcg_temp_new(); TCGv t2 = tcg_temp_new(); tcg_gen_ext32s_tl(t1, arg1); tcg_gen_ext32u_tl(t2, arg2); tcg_gen_mul_tl(ret, t1, t2); tcg_gen_sari_tl(ret, ret, 32); } static bool trans_mulhsu(DisasContext *ctx, arg_mulhsu *a) { REQUIRE_M_OR_ZMMUL(ctx); return gen_arith_per_ol(ctx, a, EXT_NONE, gen_mulhsu, gen_mulhsu_w, gen_mulhsu_i128); } static void gen_mulhu(TCGv ret, TCGv s1, TCGv s2) { TCGv discard = tcg_temp_new(); tcg_gen_mulu2_tl(discard, ret, s1, s2); } static bool trans_mulhu(DisasContext *ctx, arg_mulhu *a) { REQUIRE_M_OR_ZMMUL(ctx); /* gen_mulh_w works for either sign as input. */ return gen_arith_per_ol(ctx, a, EXT_ZERO, gen_mulhu, gen_mulh_w, gen_mulhu_i128); } static void gen_div_i128(TCGv rdl, TCGv rdh, TCGv rs1l, TCGv rs1h, TCGv rs2l, TCGv rs2h) { gen_helper_divs_i128(rdl, cpu_env, rs1l, rs1h, rs2l, rs2h); tcg_gen_ld_tl(rdh, cpu_env, offsetof(CPURISCVState, retxh)); } static void gen_div(TCGv ret, TCGv source1, TCGv source2) { TCGv temp1, temp2, zero, one, mone, min; temp1 = tcg_temp_new(); temp2 = tcg_temp_new(); zero = tcg_constant_tl(0); one = tcg_constant_tl(1); mone = tcg_constant_tl(-1); min = tcg_constant_tl(1ull << (TARGET_LONG_BITS - 1)); /* * If overflow, set temp2 to 1, else source2. * This produces the required result of min. */ tcg_gen_setcond_tl(TCG_COND_EQ, temp1, source1, min); tcg_gen_setcond_tl(TCG_COND_EQ, temp2, source2, mone); tcg_gen_and_tl(temp1, temp1, temp2); tcg_gen_movcond_tl(TCG_COND_NE, temp2, temp1, zero, one, source2); /* * If div by zero, set temp1 to -1 and temp2 to 1 to * produce the required result of -1. */ tcg_gen_movcond_tl(TCG_COND_EQ, temp1, source2, zero, mone, source1); tcg_gen_movcond_tl(TCG_COND_EQ, temp2, source2, zero, one, temp2); tcg_gen_div_tl(ret, temp1, temp2); } static bool trans_div(DisasContext *ctx, arg_div *a) { REQUIRE_EXT(ctx, RVM); return gen_arith(ctx, a, EXT_SIGN, gen_div, gen_div_i128); } static void gen_divu_i128(TCGv rdl, TCGv rdh, TCGv rs1l, TCGv rs1h, TCGv rs2l, TCGv rs2h) { gen_helper_divu_i128(rdl, cpu_env, rs1l, rs1h, rs2l, rs2h); tcg_gen_ld_tl(rdh, cpu_env, offsetof(CPURISCVState, retxh)); } static void gen_divu(TCGv ret, TCGv source1, TCGv source2) { TCGv temp1, temp2, zero, one, max; temp1 = tcg_temp_new(); temp2 = tcg_temp_new(); zero = tcg_constant_tl(0); one = tcg_constant_tl(1); max = tcg_constant_tl(~0); /* * If div by zero, set temp1 to max and temp2 to 1 to * produce the required result of max. */ tcg_gen_movcond_tl(TCG_COND_EQ, temp1, source2, zero, max, source1); tcg_gen_movcond_tl(TCG_COND_EQ, temp2, source2, zero, one, source2); tcg_gen_divu_tl(ret, temp1, temp2); } static bool trans_divu(DisasContext *ctx, arg_divu *a) { REQUIRE_EXT(ctx, RVM); return gen_arith(ctx, a, EXT_ZERO, gen_divu, gen_divu_i128); } static void gen_rem_i128(TCGv rdl, TCGv rdh, TCGv rs1l, TCGv rs1h, TCGv rs2l, TCGv rs2h) { gen_helper_rems_i128(rdl, cpu_env, rs1l, rs1h, rs2l, rs2h); tcg_gen_ld_tl(rdh, cpu_env, offsetof(CPURISCVState, retxh)); } static void gen_rem(TCGv ret, TCGv source1, TCGv source2) { TCGv temp1, temp2, zero, one, mone, min; temp1 = tcg_temp_new(); temp2 = tcg_temp_new(); zero = tcg_constant_tl(0); one = tcg_constant_tl(1); mone = tcg_constant_tl(-1); min = tcg_constant_tl(1ull << (TARGET_LONG_BITS - 1)); /* * If overflow, set temp1 to 0, else source1. * This avoids a possible host trap, and produces the required result of 0. */ tcg_gen_setcond_tl(TCG_COND_EQ, temp1, source1, min); tcg_gen_setcond_tl(TCG_COND_EQ, temp2, source2, mone); tcg_gen_and_tl(temp1, temp1, temp2); tcg_gen_movcond_tl(TCG_COND_NE, temp1, temp1, zero, zero, source1); /* * If div by zero, set temp2 to 1, else source2. * This avoids a possible host trap, but produces an incorrect result. */ tcg_gen_movcond_tl(TCG_COND_EQ, temp2, source2, zero, one, source2); tcg_gen_rem_tl(temp1, temp1, temp2); /* If div by zero, the required result is the original dividend. */ tcg_gen_movcond_tl(TCG_COND_EQ, ret, source2, zero, source1, temp1); } static bool trans_rem(DisasContext *ctx, arg_rem *a) { REQUIRE_EXT(ctx, RVM); return gen_arith(ctx, a, EXT_SIGN, gen_rem, gen_rem_i128); } static void gen_remu_i128(TCGv rdl, TCGv rdh, TCGv rs1l, TCGv rs1h, TCGv rs2l, TCGv rs2h) { gen_helper_remu_i128(rdl, cpu_env, rs1l, rs1h, rs2l, rs2h); tcg_gen_ld_tl(rdh, cpu_env, offsetof(CPURISCVState, retxh)); } static void gen_remu(TCGv ret, TCGv source1, TCGv source2) { TCGv temp, zero, one; temp = tcg_temp_new(); zero = tcg_constant_tl(0); one = tcg_constant_tl(1); /* * If div by zero, set temp to 1, else source2. * This avoids a possible host trap, but produces an incorrect result. */ tcg_gen_movcond_tl(TCG_COND_EQ, temp, source2, zero, one, source2); tcg_gen_remu_tl(temp, source1, temp); /* If div by zero, the required result is the original dividend. */ tcg_gen_movcond_tl(TCG_COND_EQ, ret, source2, zero, source1, temp); } static bool trans_remu(DisasContext *ctx, arg_remu *a) { REQUIRE_EXT(ctx, RVM); return gen_arith(ctx, a, EXT_ZERO, gen_remu, gen_remu_i128); } static bool trans_mulw(DisasContext *ctx, arg_mulw *a) { REQUIRE_64_OR_128BIT(ctx); REQUIRE_M_OR_ZMMUL(ctx); ctx->ol = MXL_RV32; return gen_arith(ctx, a, EXT_NONE, tcg_gen_mul_tl, NULL); } static bool trans_divw(DisasContext *ctx, arg_divw *a) { REQUIRE_64_OR_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV32; return gen_arith(ctx, a, EXT_SIGN, gen_div, NULL); } static bool trans_divuw(DisasContext *ctx, arg_divuw *a) { REQUIRE_64_OR_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV32; return gen_arith(ctx, a, EXT_ZERO, gen_divu, NULL); } static bool trans_remw(DisasContext *ctx, arg_remw *a) { REQUIRE_64_OR_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV32; return gen_arith(ctx, a, EXT_SIGN, gen_rem, NULL); } static bool trans_remuw(DisasContext *ctx, arg_remuw *a) { REQUIRE_64_OR_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV32; return gen_arith(ctx, a, EXT_ZERO, gen_remu, NULL); } static bool trans_muld(DisasContext *ctx, arg_muld *a) { REQUIRE_128BIT(ctx); REQUIRE_M_OR_ZMMUL(ctx); ctx->ol = MXL_RV64; return gen_arith(ctx, a, EXT_SIGN, tcg_gen_mul_tl, NULL); } static bool trans_divd(DisasContext *ctx, arg_divd *a) { REQUIRE_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV64; return gen_arith(ctx, a, EXT_SIGN, gen_div, NULL); } static bool trans_divud(DisasContext *ctx, arg_divud *a) { REQUIRE_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV64; return gen_arith(ctx, a, EXT_ZERO, gen_divu, NULL); } static bool trans_remd(DisasContext *ctx, arg_remd *a) { REQUIRE_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV64; return gen_arith(ctx, a, EXT_SIGN, gen_rem, NULL); } static bool trans_remud(DisasContext *ctx, arg_remud *a) { REQUIRE_128BIT(ctx); REQUIRE_EXT(ctx, RVM); ctx->ol = MXL_RV64; return gen_arith(ctx, a, EXT_ZERO, gen_remu, NULL); }