/*
 * RISC-V Crypto Emulation Helpers for QEMU.
 *
 * Copyright (c) 2021 Ruibo Lu, luruibo2000@163.com
 * Copyright (c) 2021 Zewen Ye, lustrew@foxmail.com
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2 or later, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 */
1968d19b58SWeiwei Li
2068d19b58SWeiwei Li #include "qemu/osdep.h"
2168d19b58SWeiwei Li #include "cpu.h"
2268d19b58SWeiwei Li #include "exec/exec-all.h"
2368d19b58SWeiwei Li #include "exec/helper-proto.h"
2468d19b58SWeiwei Li #include "crypto/aes.h"
25cad26538SRichard Henderson #include "crypto/aes-round.h"
2668d19b58SWeiwei Li #include "crypto/sm4.h"
2768d19b58SWeiwei Li
/*
 * Truncate x to a signed 32-bit value, then convert it to target_ulong,
 * which sign-extends it when target_ulong is wider than 32 bits.
 *
 * The whole expansion is parenthesized so the macro behaves as a single
 * operand wherever it is used (e.g. as the operand of sizeof or next to a
 * postfix operator).
 */
#define sext32_xlen(x) ((target_ulong)(int32_t)(x))
2968d19b58SWeiwei Li
/*
 * Shared body of the aes32* helpers.
 *
 * The 8-bit value of rs2 found at bit offset shamt is used as an index into
 * one of four AES tables:
 *   enc &&  mix -> AES_Te0   (32-bit entry, passed through be32_to_cpu())
 *   enc && !mix -> AES_sbox  (8-bit entry)
 *  !enc &&  mix -> AES_Td0   (32-bit entry, passed through be32_to_cpu())
 *  !enc && !mix -> AES_isbox (8-bit entry)
 *
 * The looked-up value is rotated left by shamt and XORed into rs1; the low
 * 32 bits of that result are returned, sign-extended to target_ulong.
 */
static inline target_ulong aes32_operation(target_ulong shamt,
                                           target_ulong rs1, target_ulong rs2,
                                           bool enc, bool mix)
{
    const uint8_t idx = rs2 >> shamt;
    uint32_t word;

    if (mix) {
        word = be32_to_cpu(enc ? AES_Te0[idx] : AES_Td0[idx]);
    } else {
        word = enc ? AES_sbox[idx] : AES_isbox[idx];
    }

    return sext32_xlen(rs1 ^ rol32(word, shamt));
}
5668d19b58SWeiwei Li
HELPER(aes32esmi)5768d19b58SWeiwei Li target_ulong HELPER(aes32esmi)(target_ulong rs1, target_ulong rs2,
5868d19b58SWeiwei Li target_ulong shamt)
5968d19b58SWeiwei Li {
6068d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, true);
6168d19b58SWeiwei Li }
6268d19b58SWeiwei Li
HELPER(aes32esi)6368d19b58SWeiwei Li target_ulong HELPER(aes32esi)(target_ulong rs1, target_ulong rs2,
6468d19b58SWeiwei Li target_ulong shamt)
6568d19b58SWeiwei Li {
6668d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, false);
6768d19b58SWeiwei Li }
6868d19b58SWeiwei Li
HELPER(aes32dsmi)6968d19b58SWeiwei Li target_ulong HELPER(aes32dsmi)(target_ulong rs1, target_ulong rs2,
7068d19b58SWeiwei Li target_ulong shamt)
7168d19b58SWeiwei Li {
7268d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, true);
7368d19b58SWeiwei Li }
7468d19b58SWeiwei Li
HELPER(aes32dsi)7568d19b58SWeiwei Li target_ulong HELPER(aes32dsi)(target_ulong rs1, target_ulong rs2,
7668d19b58SWeiwei Li target_ulong shamt)
7768d19b58SWeiwei Li {
7868d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, false);
7968d19b58SWeiwei Li }
809e33e175SWeiwei Li
81cad26538SRichard Henderson static const AESState aes_zero = { };
82cad26538SRichard Henderson
HELPER(aes64esm)839e33e175SWeiwei Li target_ulong HELPER(aes64esm)(target_ulong rs1, target_ulong rs2)
849e33e175SWeiwei Li {
85274f3376SRichard Henderson AESState t;
86274f3376SRichard Henderson
87274f3376SRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1;
88274f3376SRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2;
89274f3376SRichard Henderson aesenc_SB_SR_MC_AK(&t, &t, &aes_zero, false);
90274f3376SRichard Henderson return t.d[HOST_BIG_ENDIAN];
919e33e175SWeiwei Li }
929e33e175SWeiwei Li
HELPER(aes64es)939e33e175SWeiwei Li target_ulong HELPER(aes64es)(target_ulong rs1, target_ulong rs2)
949e33e175SWeiwei Li {
95cad26538SRichard Henderson AESState t;
96cad26538SRichard Henderson
97cad26538SRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1;
98cad26538SRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2;
99cad26538SRichard Henderson aesenc_SB_SR_AK(&t, &t, &aes_zero, false);
100cad26538SRichard Henderson return t.d[HOST_BIG_ENDIAN];
1019e33e175SWeiwei Li }
1029e33e175SWeiwei Li
HELPER(aes64ds)1039e33e175SWeiwei Li target_ulong HELPER(aes64ds)(target_ulong rs1, target_ulong rs2)
1049e33e175SWeiwei Li {
1057a70583aSRichard Henderson AESState t;
1067a70583aSRichard Henderson
1077a70583aSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1;
1087a70583aSRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2;
1097a70583aSRichard Henderson aesdec_ISB_ISR_AK(&t, &t, &aes_zero, false);
1107a70583aSRichard Henderson return t.d[HOST_BIG_ENDIAN];
1119e33e175SWeiwei Li }
1129e33e175SWeiwei Li
HELPER(aes64dsm)1139e33e175SWeiwei Li target_ulong HELPER(aes64dsm)(target_ulong rs1, target_ulong rs2)
1149e33e175SWeiwei Li {
1154ad6f9bfSRichard Henderson AESState t, z = { };
1164ad6f9bfSRichard Henderson
1174ad6f9bfSRichard Henderson /*
1184ad6f9bfSRichard Henderson * This instruction does not include a round key,
1194ad6f9bfSRichard Henderson * so supply a zero to our primitive.
1204ad6f9bfSRichard Henderson */
1214ad6f9bfSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1;
1224ad6f9bfSRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2;
1234ad6f9bfSRichard Henderson aesdec_ISB_ISR_IMC_AK(&t, &t, &z, false);
1244ad6f9bfSRichard Henderson return t.d[HOST_BIG_ENDIAN];
1259e33e175SWeiwei Li }
1269e33e175SWeiwei Li
HELPER(aes64ks2)1279e33e175SWeiwei Li target_ulong HELPER(aes64ks2)(target_ulong rs1, target_ulong rs2)
1289e33e175SWeiwei Li {
1299e33e175SWeiwei Li uint64_t RS1 = rs1;
1309e33e175SWeiwei Li uint64_t RS2 = rs2;
1319e33e175SWeiwei Li uint32_t rs1_hi = RS1 >> 32;
1329e33e175SWeiwei Li uint32_t rs2_lo = RS2;
1339e33e175SWeiwei Li uint32_t rs2_hi = RS2 >> 32;
1349e33e175SWeiwei Li
1359e33e175SWeiwei Li uint32_t r_lo = (rs1_hi ^ rs2_lo);
1369e33e175SWeiwei Li uint32_t r_hi = (rs1_hi ^ rs2_lo ^ rs2_hi);
1379e33e175SWeiwei Li target_ulong result = ((uint64_t)r_hi << 32) | r_lo;
1389e33e175SWeiwei Li
1399e33e175SWeiwei Li return result;
1409e33e175SWeiwei Li }
1419e33e175SWeiwei Li
HELPER(aes64ks1i)1429e33e175SWeiwei Li target_ulong HELPER(aes64ks1i)(target_ulong rs1, target_ulong rnum)
1439e33e175SWeiwei Li {
1449e33e175SWeiwei Li uint64_t RS1 = rs1;
1459e33e175SWeiwei Li static const uint8_t round_consts[10] = {
1469e33e175SWeiwei Li 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36
1479e33e175SWeiwei Li };
1489e33e175SWeiwei Li
1499e33e175SWeiwei Li uint8_t enc_rnum = rnum;
1509e33e175SWeiwei Li uint32_t temp = (RS1 >> 32) & 0xFFFFFFFF;
151*7d496bb5SArd Biesheuvel AESState t, rc = {};
1529e33e175SWeiwei Li
1539e33e175SWeiwei Li if (enc_rnum != 0xA) {
1549e33e175SWeiwei Li temp = ror32(temp, 8); /* Rotate right by 8 */
155*7d496bb5SArd Biesheuvel rc.w[0] = rc.w[1] = round_consts[enc_rnum];
1569e33e175SWeiwei Li }
1579e33e175SWeiwei Li
158*7d496bb5SArd Biesheuvel t.w[0] = t.w[1] = t.w[2] = t.w[3] = temp;
159*7d496bb5SArd Biesheuvel aesenc_SB_SR_AK(&t, &t, &rc, false);
1609e33e175SWeiwei Li
161*7d496bb5SArd Biesheuvel return t.d[0];
1629e33e175SWeiwei Li }
1639e33e175SWeiwei Li
HELPER(aes64im)1649e33e175SWeiwei Li target_ulong HELPER(aes64im)(target_ulong rs1)
1659e33e175SWeiwei Li {
166607a5f9dSRichard Henderson AESState t;
1679e33e175SWeiwei Li
168607a5f9dSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1;
169607a5f9dSRichard Henderson t.d[!HOST_BIG_ENDIAN] = 0;
170607a5f9dSRichard Henderson aesdec_IMC(&t, &t, false);
171607a5f9dSRichard Henderson return t.d[HOST_BIG_ENDIAN];
1729e33e175SWeiwei Li }
1730976083dSWeiwei Li
HELPER(sm4ed)1740976083dSWeiwei Li target_ulong HELPER(sm4ed)(target_ulong rs1, target_ulong rs2,
1750976083dSWeiwei Li target_ulong shamt)
1760976083dSWeiwei Li {
1770976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt);
1780976083dSWeiwei Li uint32_t sb_out = (uint32_t)sm4_sbox[sb_in];
1790976083dSWeiwei Li
1800976083dSWeiwei Li uint32_t x = sb_out ^ (sb_out << 8) ^ (sb_out << 2) ^ (sb_out << 18) ^
1810976083dSWeiwei Li ((sb_out & 0x3f) << 26) ^ ((sb_out & 0xC0) << 10);
1820976083dSWeiwei Li
1830976083dSWeiwei Li uint32_t rotl = rol32(x, shamt);
1840976083dSWeiwei Li
1850976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1);
1860976083dSWeiwei Li }
1870976083dSWeiwei Li
HELPER(sm4ks)1880976083dSWeiwei Li target_ulong HELPER(sm4ks)(target_ulong rs1, target_ulong rs2,
1890976083dSWeiwei Li target_ulong shamt)
1900976083dSWeiwei Li {
1910976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt);
1920976083dSWeiwei Li uint32_t sb_out = sm4_sbox[sb_in];
1930976083dSWeiwei Li
1940976083dSWeiwei Li uint32_t x = sb_out ^ ((sb_out & 0x07) << 29) ^ ((sb_out & 0xFE) << 7) ^
1950976083dSWeiwei Li ((sb_out & 0x01) << 23) ^ ((sb_out & 0xF8) << 13);
1960976083dSWeiwei Li
1970976083dSWeiwei Li uint32_t rotl = rol32(x, shamt);
1980976083dSWeiwei Li
1990976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1);
2000976083dSWeiwei Li }
20168d19b58SWeiwei Li #undef sext32_xlen
202