168d19b58SWeiwei Li /* 268d19b58SWeiwei Li * RISC-V Crypto Emulation Helpers for QEMU. 368d19b58SWeiwei Li * 468d19b58SWeiwei Li * Copyright (c) 2021 Ruibo Lu, luruibo2000@163.com 568d19b58SWeiwei Li * Copyright (c) 2021 Zewen Ye, lustrew@foxmail.com 668d19b58SWeiwei Li * 768d19b58SWeiwei Li * This program is free software; you can redistribute it and/or modify it 868d19b58SWeiwei Li * under the terms and conditions of the GNU General Public License, 968d19b58SWeiwei Li * version 2 or later, as published by the Free Software Foundation. 1068d19b58SWeiwei Li * 1168d19b58SWeiwei Li * This program is distributed in the hope it will be useful, but WITHOUT 1268d19b58SWeiwei Li * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 1368d19b58SWeiwei Li * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 1468d19b58SWeiwei Li * more details. 1568d19b58SWeiwei Li * 1668d19b58SWeiwei Li * You should have received a copy of the GNU General Public License along with 1768d19b58SWeiwei Li * this program. If not, see <http://www.gnu.org/licenses/>. 1868d19b58SWeiwei Li */ 1968d19b58SWeiwei Li 2068d19b58SWeiwei Li #include "qemu/osdep.h" 2168d19b58SWeiwei Li #include "cpu.h" 2268d19b58SWeiwei Li #include "exec/exec-all.h" 2368d19b58SWeiwei Li #include "exec/helper-proto.h" 2468d19b58SWeiwei Li #include "crypto/aes.h" 25cad26538SRichard Henderson #include "crypto/aes-round.h" 2668d19b58SWeiwei Li #include "crypto/sm4.h" 2768d19b58SWeiwei Li 2868d19b58SWeiwei Li #define sext32_xlen(x) (target_ulong)(int32_t)(x) 2968d19b58SWeiwei Li 3068d19b58SWeiwei Li static inline target_ulong aes32_operation(target_ulong shamt, 3168d19b58SWeiwei Li target_ulong rs1, target_ulong rs2, 3268d19b58SWeiwei Li bool enc, bool mix) 3368d19b58SWeiwei Li { 3468d19b58SWeiwei Li uint8_t si = rs2 >> shamt; 3568d19b58SWeiwei Li uint32_t mixed; 3668d19b58SWeiwei Li target_ulong res; 3768d19b58SWeiwei Li 3868d19b58SWeiwei Li if (enc) { 3968d19b58SWeiwei Li if (mix) { 40*9ea17007SArd Biesheuvel mixed = be32_to_cpu(AES_Te0[si]); 4168d19b58SWeiwei Li } else { 42*9ea17007SArd Biesheuvel mixed = AES_sbox[si]; 4368d19b58SWeiwei Li } 4468d19b58SWeiwei Li } else { 4568d19b58SWeiwei Li if (mix) { 46*9ea17007SArd Biesheuvel mixed = be32_to_cpu(AES_Td0[si]); 4768d19b58SWeiwei Li } else { 48*9ea17007SArd Biesheuvel mixed = AES_isbox[si]; 4968d19b58SWeiwei Li } 5068d19b58SWeiwei Li } 5168d19b58SWeiwei Li mixed = rol32(mixed, shamt); 5268d19b58SWeiwei Li res = rs1 ^ mixed; 5368d19b58SWeiwei Li 5468d19b58SWeiwei Li return sext32_xlen(res); 5568d19b58SWeiwei Li } 5668d19b58SWeiwei Li 5768d19b58SWeiwei Li target_ulong HELPER(aes32esmi)(target_ulong rs1, target_ulong rs2, 5868d19b58SWeiwei Li target_ulong shamt) 5968d19b58SWeiwei Li { 6068d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, true); 6168d19b58SWeiwei Li } 6268d19b58SWeiwei Li 6368d19b58SWeiwei Li target_ulong HELPER(aes32esi)(target_ulong rs1, target_ulong rs2, 6468d19b58SWeiwei Li target_ulong shamt) 6568d19b58SWeiwei Li { 6668d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, false); 6768d19b58SWeiwei Li } 6868d19b58SWeiwei Li 6968d19b58SWeiwei Li target_ulong HELPER(aes32dsmi)(target_ulong rs1, target_ulong rs2, 7068d19b58SWeiwei Li target_ulong shamt) 7168d19b58SWeiwei Li { 7268d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, true); 7368d19b58SWeiwei Li } 7468d19b58SWeiwei Li 7568d19b58SWeiwei Li target_ulong HELPER(aes32dsi)(target_ulong rs1, target_ulong rs2, 7668d19b58SWeiwei Li target_ulong shamt) 7768d19b58SWeiwei Li { 7868d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, false); 7968d19b58SWeiwei Li } 809e33e175SWeiwei Li 81cad26538SRichard Henderson static const AESState aes_zero = { }; 82cad26538SRichard Henderson 839e33e175SWeiwei Li target_ulong HELPER(aes64esm)(target_ulong rs1, target_ulong rs2) 849e33e175SWeiwei Li { 85274f3376SRichard Henderson AESState t; 86274f3376SRichard Henderson 87274f3376SRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 88274f3376SRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 89274f3376SRichard Henderson aesenc_SB_SR_MC_AK(&t, &t, &aes_zero, false); 90274f3376SRichard Henderson return t.d[HOST_BIG_ENDIAN]; 919e33e175SWeiwei Li } 929e33e175SWeiwei Li 939e33e175SWeiwei Li target_ulong HELPER(aes64es)(target_ulong rs1, target_ulong rs2) 949e33e175SWeiwei Li { 95cad26538SRichard Henderson AESState t; 96cad26538SRichard Henderson 97cad26538SRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 98cad26538SRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 99cad26538SRichard Henderson aesenc_SB_SR_AK(&t, &t, &aes_zero, false); 100cad26538SRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1019e33e175SWeiwei Li } 1029e33e175SWeiwei Li 1039e33e175SWeiwei Li target_ulong HELPER(aes64ds)(target_ulong rs1, target_ulong rs2) 1049e33e175SWeiwei Li { 1057a70583aSRichard Henderson AESState t; 1067a70583aSRichard Henderson 1077a70583aSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 1087a70583aSRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 1097a70583aSRichard Henderson aesdec_ISB_ISR_AK(&t, &t, &aes_zero, false); 1107a70583aSRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1119e33e175SWeiwei Li } 1129e33e175SWeiwei Li 1139e33e175SWeiwei Li target_ulong HELPER(aes64dsm)(target_ulong rs1, target_ulong rs2) 1149e33e175SWeiwei Li { 1154ad6f9bfSRichard Henderson AESState t, z = { }; 1164ad6f9bfSRichard Henderson 1174ad6f9bfSRichard Henderson /* 1184ad6f9bfSRichard Henderson * This instruction does not include a round key, 1194ad6f9bfSRichard Henderson * so supply a zero to our primitive. 1204ad6f9bfSRichard Henderson */ 1214ad6f9bfSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 1224ad6f9bfSRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 1234ad6f9bfSRichard Henderson aesdec_ISB_ISR_IMC_AK(&t, &t, &z, false); 1244ad6f9bfSRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1259e33e175SWeiwei Li } 1269e33e175SWeiwei Li 1279e33e175SWeiwei Li target_ulong HELPER(aes64ks2)(target_ulong rs1, target_ulong rs2) 1289e33e175SWeiwei Li { 1299e33e175SWeiwei Li uint64_t RS1 = rs1; 1309e33e175SWeiwei Li uint64_t RS2 = rs2; 1319e33e175SWeiwei Li uint32_t rs1_hi = RS1 >> 32; 1329e33e175SWeiwei Li uint32_t rs2_lo = RS2; 1339e33e175SWeiwei Li uint32_t rs2_hi = RS2 >> 32; 1349e33e175SWeiwei Li 1359e33e175SWeiwei Li uint32_t r_lo = (rs1_hi ^ rs2_lo); 1369e33e175SWeiwei Li uint32_t r_hi = (rs1_hi ^ rs2_lo ^ rs2_hi); 1379e33e175SWeiwei Li target_ulong result = ((uint64_t)r_hi << 32) | r_lo; 1389e33e175SWeiwei Li 1399e33e175SWeiwei Li return result; 1409e33e175SWeiwei Li } 1419e33e175SWeiwei Li 1429e33e175SWeiwei Li target_ulong HELPER(aes64ks1i)(target_ulong rs1, target_ulong rnum) 1439e33e175SWeiwei Li { 1449e33e175SWeiwei Li uint64_t RS1 = rs1; 1459e33e175SWeiwei Li static const uint8_t round_consts[10] = { 1469e33e175SWeiwei Li 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36 1479e33e175SWeiwei Li }; 1489e33e175SWeiwei Li 1499e33e175SWeiwei Li uint8_t enc_rnum = rnum; 1509e33e175SWeiwei Li uint32_t temp = (RS1 >> 32) & 0xFFFFFFFF; 1519e33e175SWeiwei Li uint8_t rcon_ = 0; 1529e33e175SWeiwei Li target_ulong result; 1539e33e175SWeiwei Li 1549e33e175SWeiwei Li if (enc_rnum != 0xA) { 1559e33e175SWeiwei Li temp = ror32(temp, 8); /* Rotate right by 8 */ 1569e33e175SWeiwei Li rcon_ = round_consts[enc_rnum]; 1579e33e175SWeiwei Li } 1589e33e175SWeiwei Li 1599e33e175SWeiwei Li temp = ((uint32_t)AES_sbox[(temp >> 24) & 0xFF] << 24) | 1609e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 16) & 0xFF] << 16) | 1619e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 8) & 0xFF] << 8) | 1629e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 0) & 0xFF] << 0); 1639e33e175SWeiwei Li 1649e33e175SWeiwei Li temp ^= rcon_; 1659e33e175SWeiwei Li 1669e33e175SWeiwei Li result = ((uint64_t)temp << 32) | temp; 1679e33e175SWeiwei Li 1689e33e175SWeiwei Li return result; 1699e33e175SWeiwei Li } 1709e33e175SWeiwei Li 1719e33e175SWeiwei Li target_ulong HELPER(aes64im)(target_ulong rs1) 1729e33e175SWeiwei Li { 173607a5f9dSRichard Henderson AESState t; 1749e33e175SWeiwei Li 175607a5f9dSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 176607a5f9dSRichard Henderson t.d[!HOST_BIG_ENDIAN] = 0; 177607a5f9dSRichard Henderson aesdec_IMC(&t, &t, false); 178607a5f9dSRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1799e33e175SWeiwei Li } 1800976083dSWeiwei Li 1810976083dSWeiwei Li target_ulong HELPER(sm4ed)(target_ulong rs1, target_ulong rs2, 1820976083dSWeiwei Li target_ulong shamt) 1830976083dSWeiwei Li { 1840976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt); 1850976083dSWeiwei Li uint32_t sb_out = (uint32_t)sm4_sbox[sb_in]; 1860976083dSWeiwei Li 1870976083dSWeiwei Li uint32_t x = sb_out ^ (sb_out << 8) ^ (sb_out << 2) ^ (sb_out << 18) ^ 1880976083dSWeiwei Li ((sb_out & 0x3f) << 26) ^ ((sb_out & 0xC0) << 10); 1890976083dSWeiwei Li 1900976083dSWeiwei Li uint32_t rotl = rol32(x, shamt); 1910976083dSWeiwei Li 1920976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1); 1930976083dSWeiwei Li } 1940976083dSWeiwei Li 1950976083dSWeiwei Li target_ulong HELPER(sm4ks)(target_ulong rs1, target_ulong rs2, 1960976083dSWeiwei Li target_ulong shamt) 1970976083dSWeiwei Li { 1980976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt); 1990976083dSWeiwei Li uint32_t sb_out = sm4_sbox[sb_in]; 2000976083dSWeiwei Li 2010976083dSWeiwei Li uint32_t x = sb_out ^ ((sb_out & 0x07) << 29) ^ ((sb_out & 0xFE) << 7) ^ 2020976083dSWeiwei Li ((sb_out & 0x01) << 23) ^ ((sb_out & 0xF8) << 13); 2030976083dSWeiwei Li 2040976083dSWeiwei Li uint32_t rotl = rol32(x, shamt); 2050976083dSWeiwei Li 2060976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1); 2070976083dSWeiwei Li } 20868d19b58SWeiwei Li #undef sext32_xlen 209