1/* 2 * RISC-V translation routines for the RV64F Standard Extension. 3 * 4 * Copyright (c) 2016-2017 Sagar Karandikar, sagark@eecs.berkeley.edu 5 * Copyright (c) 2018 Peer Adelt, peer.adelt@hni.uni-paderborn.de 6 * Bastian Koppelmann, kbastian@mail.uni-paderborn.de 7 * 8 * This program is free software; you can redistribute it and/or modify it 9 * under the terms and conditions of the GNU General Public License, 10 * version 2 or later, as published by the Free Software Foundation. 11 * 12 * This program is distributed in the hope it will be useful, but WITHOUT 13 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 14 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 15 * more details. 16 * 17 * You should have received a copy of the GNU General Public License along with 18 * this program. If not, see <http://www.gnu.org/licenses/>. 19 */ 20 21#define REQUIRE_FPU do {\ 22 if (ctx->mstatus_fs == 0) \ 23 return false; \ 24} while (0) 25 26static bool trans_flw(DisasContext *ctx, arg_flw *a) 27{ 28 REQUIRE_FPU; 29 REQUIRE_EXT(ctx, RVF); 30 TCGv t0 = tcg_temp_new(); 31 gen_get_gpr(t0, a->rs1); 32 tcg_gen_addi_tl(t0, t0, a->imm); 33 34 tcg_gen_qemu_ld_i64(cpu_fpr[a->rd], t0, ctx->mem_idx, MO_TEUL); 35 gen_nanbox_s(cpu_fpr[a->rd], cpu_fpr[a->rd]); 36 37 tcg_temp_free(t0); 38 mark_fs_dirty(ctx); 39 return true; 40} 41 42static bool trans_fsw(DisasContext *ctx, arg_fsw *a) 43{ 44 REQUIRE_FPU; 45 REQUIRE_EXT(ctx, RVF); 46 TCGv t0 = tcg_temp_new(); 47 gen_get_gpr(t0, a->rs1); 48 49 tcg_gen_addi_tl(t0, t0, a->imm); 50 51 tcg_gen_qemu_st_i64(cpu_fpr[a->rs2], t0, ctx->mem_idx, MO_TEUL); 52 53 tcg_temp_free(t0); 54 return true; 55} 56 57static bool trans_fmadd_s(DisasContext *ctx, arg_fmadd_s *a) 58{ 59 REQUIRE_FPU; 60 REQUIRE_EXT(ctx, RVF); 61 gen_set_rm(ctx, a->rm); 62 gen_helper_fmadd_s(cpu_fpr[a->rd], cpu_env, cpu_fpr[a->rs1], 63 cpu_fpr[a->rs2], cpu_fpr[a->rs3]); 64 mark_fs_dirty(ctx); 65 return true; 66} 67 68static bool trans_fmsub_s(DisasContext *ctx, arg_fmsub_s *a) 69{ 70 REQUIRE_FPU; 71 REQUIRE_EXT(ctx, RVF); 72 gen_set_rm(ctx, a->rm); 73 gen_helper_fmsub_s(cpu_fpr[a->rd], cpu_env, cpu_fpr[a->rs1], 74 cpu_fpr[a->rs2], cpu_fpr[a->rs3]); 75 mark_fs_dirty(ctx); 76 return true; 77} 78 79static bool trans_fnmsub_s(DisasContext *ctx, arg_fnmsub_s *a) 80{ 81 REQUIRE_FPU; 82 REQUIRE_EXT(ctx, RVF); 83 gen_set_rm(ctx, a->rm); 84 gen_helper_fnmsub_s(cpu_fpr[a->rd], cpu_env, cpu_fpr[a->rs1], 85 cpu_fpr[a->rs2], cpu_fpr[a->rs3]); 86 mark_fs_dirty(ctx); 87 return true; 88} 89 90static bool trans_fnmadd_s(DisasContext *ctx, arg_fnmadd_s *a) 91{ 92 REQUIRE_FPU; 93 REQUIRE_EXT(ctx, RVF); 94 gen_set_rm(ctx, a->rm); 95 gen_helper_fnmadd_s(cpu_fpr[a->rd], cpu_env, cpu_fpr[a->rs1], 96 cpu_fpr[a->rs2], cpu_fpr[a->rs3]); 97 mark_fs_dirty(ctx); 98 return true; 99} 100 101static bool trans_fadd_s(DisasContext *ctx, arg_fadd_s *a) 102{ 103 REQUIRE_FPU; 104 REQUIRE_EXT(ctx, RVF); 105 106 gen_set_rm(ctx, a->rm); 107 gen_helper_fadd_s(cpu_fpr[a->rd], cpu_env, 108 cpu_fpr[a->rs1], cpu_fpr[a->rs2]); 109 mark_fs_dirty(ctx); 110 return true; 111} 112 113static bool trans_fsub_s(DisasContext *ctx, arg_fsub_s *a) 114{ 115 REQUIRE_FPU; 116 REQUIRE_EXT(ctx, RVF); 117 118 gen_set_rm(ctx, a->rm); 119 gen_helper_fsub_s(cpu_fpr[a->rd], cpu_env, 120 cpu_fpr[a->rs1], cpu_fpr[a->rs2]); 121 mark_fs_dirty(ctx); 122 return true; 123} 124 125static bool trans_fmul_s(DisasContext *ctx, arg_fmul_s *a) 126{ 127 REQUIRE_FPU; 128 REQUIRE_EXT(ctx, RVF); 129 130 gen_set_rm(ctx, a->rm); 131 gen_helper_fmul_s(cpu_fpr[a->rd], cpu_env, 132 cpu_fpr[a->rs1], cpu_fpr[a->rs2]); 133 mark_fs_dirty(ctx); 134 return true; 135} 136 137static bool trans_fdiv_s(DisasContext *ctx, arg_fdiv_s *a) 138{ 139 REQUIRE_FPU; 140 REQUIRE_EXT(ctx, RVF); 141 142 gen_set_rm(ctx, a->rm); 143 gen_helper_fdiv_s(cpu_fpr[a->rd], cpu_env, 144 cpu_fpr[a->rs1], cpu_fpr[a->rs2]); 145 mark_fs_dirty(ctx); 146 return true; 147} 148 149static bool trans_fsqrt_s(DisasContext *ctx, arg_fsqrt_s *a) 150{ 151 REQUIRE_FPU; 152 REQUIRE_EXT(ctx, RVF); 153 154 gen_set_rm(ctx, a->rm); 155 gen_helper_fsqrt_s(cpu_fpr[a->rd], cpu_env, cpu_fpr[a->rs1]); 156 mark_fs_dirty(ctx); 157 return true; 158} 159 160static bool trans_fsgnj_s(DisasContext *ctx, arg_fsgnj_s *a) 161{ 162 REQUIRE_FPU; 163 REQUIRE_EXT(ctx, RVF); 164 165 if (a->rs1 == a->rs2) { /* FMOV */ 166 gen_check_nanbox_s(cpu_fpr[a->rd], cpu_fpr[a->rs1]); 167 } else { /* FSGNJ */ 168 TCGv_i64 rs1 = tcg_temp_new_i64(); 169 TCGv_i64 rs2 = tcg_temp_new_i64(); 170 171 gen_check_nanbox_s(rs1, cpu_fpr[a->rs1]); 172 gen_check_nanbox_s(rs2, cpu_fpr[a->rs2]); 173 174 /* This formulation retains the nanboxing of rs2. */ 175 tcg_gen_deposit_i64(cpu_fpr[a->rd], rs2, rs1, 0, 31); 176 tcg_temp_free_i64(rs1); 177 tcg_temp_free_i64(rs2); 178 } 179 mark_fs_dirty(ctx); 180 return true; 181} 182 183static bool trans_fsgnjn_s(DisasContext *ctx, arg_fsgnjn_s *a) 184{ 185 TCGv_i64 rs1, rs2, mask; 186 187 REQUIRE_FPU; 188 REQUIRE_EXT(ctx, RVF); 189 190 rs1 = tcg_temp_new_i64(); 191 gen_check_nanbox_s(rs1, cpu_fpr[a->rs1]); 192 193 if (a->rs1 == a->rs2) { /* FNEG */ 194 tcg_gen_xori_i64(cpu_fpr[a->rd], rs1, MAKE_64BIT_MASK(31, 1)); 195 } else { 196 rs2 = tcg_temp_new_i64(); 197 gen_check_nanbox_s(rs2, cpu_fpr[a->rs2]); 198 199 /* 200 * Replace bit 31 in rs1 with inverse in rs2. 201 * This formulation retains the nanboxing of rs1. 202 */ 203 mask = tcg_const_i64(~MAKE_64BIT_MASK(31, 1)); 204 tcg_gen_nor_i64(rs2, rs2, mask); 205 tcg_gen_and_i64(rs1, mask, rs1); 206 tcg_gen_or_i64(cpu_fpr[a->rd], rs1, rs2); 207 208 tcg_temp_free_i64(mask); 209 tcg_temp_free_i64(rs2); 210 } 211 tcg_temp_free_i64(rs1); 212 213 mark_fs_dirty(ctx); 214 return true; 215} 216 217static bool trans_fsgnjx_s(DisasContext *ctx, arg_fsgnjx_s *a) 218{ 219 TCGv_i64 rs1, rs2; 220 221 REQUIRE_FPU; 222 REQUIRE_EXT(ctx, RVF); 223 224 rs1 = tcg_temp_new_i64(); 225 gen_check_nanbox_s(rs1, cpu_fpr[a->rs1]); 226 227 if (a->rs1 == a->rs2) { /* FABS */ 228 tcg_gen_andi_i64(cpu_fpr[a->rd], rs1, ~MAKE_64BIT_MASK(31, 1)); 229 } else { 230 rs2 = tcg_temp_new_i64(); 231 gen_check_nanbox_s(rs2, cpu_fpr[a->rs2]); 232 233 /* 234 * Xor bit 31 in rs1 with that in rs2. 235 * This formulation retains the nanboxing of rs1. 236 */ 237 tcg_gen_andi_i64(rs2, rs2, MAKE_64BIT_MASK(31, 1)); 238 tcg_gen_xor_i64(cpu_fpr[a->rd], rs1, rs2); 239 240 tcg_temp_free_i64(rs2); 241 } 242 tcg_temp_free_i64(rs1); 243 244 mark_fs_dirty(ctx); 245 return true; 246} 247 248static bool trans_fmin_s(DisasContext *ctx, arg_fmin_s *a) 249{ 250 REQUIRE_FPU; 251 REQUIRE_EXT(ctx, RVF); 252 253 gen_helper_fmin_s(cpu_fpr[a->rd], cpu_env, cpu_fpr[a->rs1], 254 cpu_fpr[a->rs2]); 255 mark_fs_dirty(ctx); 256 return true; 257} 258 259static bool trans_fmax_s(DisasContext *ctx, arg_fmax_s *a) 260{ 261 REQUIRE_FPU; 262 REQUIRE_EXT(ctx, RVF); 263 264 gen_helper_fmax_s(cpu_fpr[a->rd], cpu_env, cpu_fpr[a->rs1], 265 cpu_fpr[a->rs2]); 266 mark_fs_dirty(ctx); 267 return true; 268} 269 270static bool trans_fcvt_w_s(DisasContext *ctx, arg_fcvt_w_s *a) 271{ 272 REQUIRE_FPU; 273 REQUIRE_EXT(ctx, RVF); 274 275 TCGv t0 = tcg_temp_new(); 276 gen_set_rm(ctx, a->rm); 277 gen_helper_fcvt_w_s(t0, cpu_env, cpu_fpr[a->rs1]); 278 gen_set_gpr(a->rd, t0); 279 tcg_temp_free(t0); 280 281 return true; 282} 283 284static bool trans_fcvt_wu_s(DisasContext *ctx, arg_fcvt_wu_s *a) 285{ 286 REQUIRE_FPU; 287 REQUIRE_EXT(ctx, RVF); 288 289 TCGv t0 = tcg_temp_new(); 290 gen_set_rm(ctx, a->rm); 291 gen_helper_fcvt_wu_s(t0, cpu_env, cpu_fpr[a->rs1]); 292 gen_set_gpr(a->rd, t0); 293 tcg_temp_free(t0); 294 295 return true; 296} 297 298static bool trans_fmv_x_w(DisasContext *ctx, arg_fmv_x_w *a) 299{ 300 /* NOTE: This was FMV.X.S in an earlier version of the ISA spec! */ 301 REQUIRE_FPU; 302 REQUIRE_EXT(ctx, RVF); 303 304 TCGv t0 = tcg_temp_new(); 305 306#if defined(TARGET_RISCV64) 307 tcg_gen_ext32s_tl(t0, cpu_fpr[a->rs1]); 308#else 309 tcg_gen_extrl_i64_i32(t0, cpu_fpr[a->rs1]); 310#endif 311 312 gen_set_gpr(a->rd, t0); 313 tcg_temp_free(t0); 314 315 return true; 316} 317 318static bool trans_feq_s(DisasContext *ctx, arg_feq_s *a) 319{ 320 REQUIRE_FPU; 321 REQUIRE_EXT(ctx, RVF); 322 TCGv t0 = tcg_temp_new(); 323 gen_helper_feq_s(t0, cpu_env, cpu_fpr[a->rs1], cpu_fpr[a->rs2]); 324 gen_set_gpr(a->rd, t0); 325 tcg_temp_free(t0); 326 return true; 327} 328 329static bool trans_flt_s(DisasContext *ctx, arg_flt_s *a) 330{ 331 REQUIRE_FPU; 332 REQUIRE_EXT(ctx, RVF); 333 TCGv t0 = tcg_temp_new(); 334 gen_helper_flt_s(t0, cpu_env, cpu_fpr[a->rs1], cpu_fpr[a->rs2]); 335 gen_set_gpr(a->rd, t0); 336 tcg_temp_free(t0); 337 return true; 338} 339 340static bool trans_fle_s(DisasContext *ctx, arg_fle_s *a) 341{ 342 REQUIRE_FPU; 343 REQUIRE_EXT(ctx, RVF); 344 TCGv t0 = tcg_temp_new(); 345 gen_helper_fle_s(t0, cpu_env, cpu_fpr[a->rs1], cpu_fpr[a->rs2]); 346 gen_set_gpr(a->rd, t0); 347 tcg_temp_free(t0); 348 return true; 349} 350 351static bool trans_fclass_s(DisasContext *ctx, arg_fclass_s *a) 352{ 353 REQUIRE_FPU; 354 REQUIRE_EXT(ctx, RVF); 355 356 TCGv t0 = tcg_temp_new(); 357 358 gen_helper_fclass_s(t0, cpu_fpr[a->rs1]); 359 360 gen_set_gpr(a->rd, t0); 361 tcg_temp_free(t0); 362 363 return true; 364} 365 366static bool trans_fcvt_s_w(DisasContext *ctx, arg_fcvt_s_w *a) 367{ 368 REQUIRE_FPU; 369 REQUIRE_EXT(ctx, RVF); 370 371 TCGv t0 = tcg_temp_new(); 372 gen_get_gpr(t0, a->rs1); 373 374 gen_set_rm(ctx, a->rm); 375 gen_helper_fcvt_s_w(cpu_fpr[a->rd], cpu_env, t0); 376 377 mark_fs_dirty(ctx); 378 tcg_temp_free(t0); 379 380 return true; 381} 382 383static bool trans_fcvt_s_wu(DisasContext *ctx, arg_fcvt_s_wu *a) 384{ 385 REQUIRE_FPU; 386 REQUIRE_EXT(ctx, RVF); 387 388 TCGv t0 = tcg_temp_new(); 389 gen_get_gpr(t0, a->rs1); 390 391 gen_set_rm(ctx, a->rm); 392 gen_helper_fcvt_s_wu(cpu_fpr[a->rd], cpu_env, t0); 393 394 mark_fs_dirty(ctx); 395 tcg_temp_free(t0); 396 397 return true; 398} 399 400static bool trans_fmv_w_x(DisasContext *ctx, arg_fmv_w_x *a) 401{ 402 /* NOTE: This was FMV.S.X in an earlier version of the ISA spec! */ 403 REQUIRE_FPU; 404 REQUIRE_EXT(ctx, RVF); 405 406 TCGv t0 = tcg_temp_new(); 407 gen_get_gpr(t0, a->rs1); 408 409 tcg_gen_extu_tl_i64(cpu_fpr[a->rd], t0); 410 gen_nanbox_s(cpu_fpr[a->rd], cpu_fpr[a->rd]); 411 412 mark_fs_dirty(ctx); 413 tcg_temp_free(t0); 414 415 return true; 416} 417 418static bool trans_fcvt_l_s(DisasContext *ctx, arg_fcvt_l_s *a) 419{ 420 REQUIRE_64BIT(ctx); 421 REQUIRE_FPU; 422 REQUIRE_EXT(ctx, RVF); 423 424 TCGv t0 = tcg_temp_new(); 425 gen_set_rm(ctx, a->rm); 426 gen_helper_fcvt_l_s(t0, cpu_env, cpu_fpr[a->rs1]); 427 gen_set_gpr(a->rd, t0); 428 tcg_temp_free(t0); 429 return true; 430} 431 432static bool trans_fcvt_lu_s(DisasContext *ctx, arg_fcvt_lu_s *a) 433{ 434 REQUIRE_64BIT(ctx); 435 REQUIRE_FPU; 436 REQUIRE_EXT(ctx, RVF); 437 438 TCGv t0 = tcg_temp_new(); 439 gen_set_rm(ctx, a->rm); 440 gen_helper_fcvt_lu_s(t0, cpu_env, cpu_fpr[a->rs1]); 441 gen_set_gpr(a->rd, t0); 442 tcg_temp_free(t0); 443 return true; 444} 445 446static bool trans_fcvt_s_l(DisasContext *ctx, arg_fcvt_s_l *a) 447{ 448 REQUIRE_64BIT(ctx); 449 REQUIRE_FPU; 450 REQUIRE_EXT(ctx, RVF); 451 452 TCGv t0 = tcg_temp_new(); 453 gen_get_gpr(t0, a->rs1); 454 455 gen_set_rm(ctx, a->rm); 456 gen_helper_fcvt_s_l(cpu_fpr[a->rd], cpu_env, t0); 457 458 mark_fs_dirty(ctx); 459 tcg_temp_free(t0); 460 return true; 461} 462 463static bool trans_fcvt_s_lu(DisasContext *ctx, arg_fcvt_s_lu *a) 464{ 465 REQUIRE_64BIT(ctx); 466 REQUIRE_FPU; 467 REQUIRE_EXT(ctx, RVF); 468 469 TCGv t0 = tcg_temp_new(); 470 gen_get_gpr(t0, a->rs1); 471 472 gen_set_rm(ctx, a->rm); 473 gen_helper_fcvt_s_lu(cpu_fpr[a->rd], cpu_env, t0); 474 475 mark_fs_dirty(ctx); 476 tcg_temp_free(t0); 477 return true; 478} 479