168d19b58SWeiwei Li /* 268d19b58SWeiwei Li * RISC-V Crypto Emulation Helpers for QEMU. 368d19b58SWeiwei Li * 468d19b58SWeiwei Li * Copyright (c) 2021 Ruibo Lu, luruibo2000@163.com 568d19b58SWeiwei Li * Copyright (c) 2021 Zewen Ye, lustrew@foxmail.com 668d19b58SWeiwei Li * 768d19b58SWeiwei Li * This program is free software; you can redistribute it and/or modify it 868d19b58SWeiwei Li * under the terms and conditions of the GNU General Public License, 968d19b58SWeiwei Li * version 2 or later, as published by the Free Software Foundation. 1068d19b58SWeiwei Li * 1168d19b58SWeiwei Li * This program is distributed in the hope it will be useful, but WITHOUT 1268d19b58SWeiwei Li * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 1368d19b58SWeiwei Li * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 1468d19b58SWeiwei Li * more details. 1568d19b58SWeiwei Li * 1668d19b58SWeiwei Li * You should have received a copy of the GNU General Public License along with 1768d19b58SWeiwei Li * this program. If not, see <http://www.gnu.org/licenses/>. 1868d19b58SWeiwei Li */ 1968d19b58SWeiwei Li 2068d19b58SWeiwei Li #include "qemu/osdep.h" 2168d19b58SWeiwei Li #include "cpu.h" 2268d19b58SWeiwei Li #include "exec/exec-all.h" 2368d19b58SWeiwei Li #include "exec/helper-proto.h" 2468d19b58SWeiwei Li #include "crypto/aes.h" 25cad26538SRichard Henderson #include "crypto/aes-round.h" 2668d19b58SWeiwei Li #include "crypto/sm4.h" 2768d19b58SWeiwei Li 2868d19b58SWeiwei Li #define AES_XTIME(a) \ 2968d19b58SWeiwei Li ((a << 1) ^ ((a & 0x80) ? 0x1b : 0)) 3068d19b58SWeiwei Li 3168d19b58SWeiwei Li #define AES_GFMUL(a, b) (( \ 3268d19b58SWeiwei Li (((b) & 0x1) ? (a) : 0) ^ \ 3368d19b58SWeiwei Li (((b) & 0x2) ? AES_XTIME(a) : 0) ^ \ 3468d19b58SWeiwei Li (((b) & 0x4) ? AES_XTIME(AES_XTIME(a)) : 0) ^ \ 3568d19b58SWeiwei Li (((b) & 0x8) ? AES_XTIME(AES_XTIME(AES_XTIME(a))) : 0)) & 0xFF) 3668d19b58SWeiwei Li 3768d19b58SWeiwei Li static inline uint32_t aes_mixcolumn_byte(uint8_t x, bool fwd) 3868d19b58SWeiwei Li { 3968d19b58SWeiwei Li uint32_t u; 4068d19b58SWeiwei Li 4168d19b58SWeiwei Li if (fwd) { 4268d19b58SWeiwei Li u = (AES_GFMUL(x, 3) << 24) | (x << 16) | (x << 8) | 4368d19b58SWeiwei Li (AES_GFMUL(x, 2) << 0); 4468d19b58SWeiwei Li } else { 4568d19b58SWeiwei Li u = (AES_GFMUL(x, 0xb) << 24) | (AES_GFMUL(x, 0xd) << 16) | 4668d19b58SWeiwei Li (AES_GFMUL(x, 0x9) << 8) | (AES_GFMUL(x, 0xe) << 0); 4768d19b58SWeiwei Li } 4868d19b58SWeiwei Li return u; 4968d19b58SWeiwei Li } 5068d19b58SWeiwei Li 5168d19b58SWeiwei Li #define sext32_xlen(x) (target_ulong)(int32_t)(x) 5268d19b58SWeiwei Li 5368d19b58SWeiwei Li static inline target_ulong aes32_operation(target_ulong shamt, 5468d19b58SWeiwei Li target_ulong rs1, target_ulong rs2, 5568d19b58SWeiwei Li bool enc, bool mix) 5668d19b58SWeiwei Li { 5768d19b58SWeiwei Li uint8_t si = rs2 >> shamt; 5868d19b58SWeiwei Li uint8_t so; 5968d19b58SWeiwei Li uint32_t mixed; 6068d19b58SWeiwei Li target_ulong res; 6168d19b58SWeiwei Li 6268d19b58SWeiwei Li if (enc) { 6368d19b58SWeiwei Li so = AES_sbox[si]; 6468d19b58SWeiwei Li if (mix) { 6568d19b58SWeiwei Li mixed = aes_mixcolumn_byte(so, true); 6668d19b58SWeiwei Li } else { 6768d19b58SWeiwei Li mixed = so; 6868d19b58SWeiwei Li } 6968d19b58SWeiwei Li } else { 7068d19b58SWeiwei Li so = AES_isbox[si]; 7168d19b58SWeiwei Li if (mix) { 7268d19b58SWeiwei Li mixed = aes_mixcolumn_byte(so, false); 7368d19b58SWeiwei Li } else { 7468d19b58SWeiwei Li mixed = so; 7568d19b58SWeiwei Li } 7668d19b58SWeiwei Li } 7768d19b58SWeiwei Li mixed = rol32(mixed, shamt); 7868d19b58SWeiwei Li res = rs1 ^ mixed; 7968d19b58SWeiwei Li 8068d19b58SWeiwei Li return sext32_xlen(res); 8168d19b58SWeiwei Li } 8268d19b58SWeiwei Li 8368d19b58SWeiwei Li target_ulong HELPER(aes32esmi)(target_ulong rs1, target_ulong rs2, 8468d19b58SWeiwei Li target_ulong shamt) 8568d19b58SWeiwei Li { 8668d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, true); 8768d19b58SWeiwei Li } 8868d19b58SWeiwei Li 8968d19b58SWeiwei Li target_ulong HELPER(aes32esi)(target_ulong rs1, target_ulong rs2, 9068d19b58SWeiwei Li target_ulong shamt) 9168d19b58SWeiwei Li { 9268d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, false); 9368d19b58SWeiwei Li } 9468d19b58SWeiwei Li 9568d19b58SWeiwei Li target_ulong HELPER(aes32dsmi)(target_ulong rs1, target_ulong rs2, 9668d19b58SWeiwei Li target_ulong shamt) 9768d19b58SWeiwei Li { 9868d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, true); 9968d19b58SWeiwei Li } 10068d19b58SWeiwei Li 10168d19b58SWeiwei Li target_ulong HELPER(aes32dsi)(target_ulong rs1, target_ulong rs2, 10268d19b58SWeiwei Li target_ulong shamt) 10368d19b58SWeiwei Li { 10468d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, false); 10568d19b58SWeiwei Li } 1069e33e175SWeiwei Li 107cad26538SRichard Henderson static const AESState aes_zero = { }; 108cad26538SRichard Henderson 1099e33e175SWeiwei Li target_ulong HELPER(aes64esm)(target_ulong rs1, target_ulong rs2) 1109e33e175SWeiwei Li { 111274f3376SRichard Henderson AESState t; 112274f3376SRichard Henderson 113274f3376SRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 114274f3376SRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 115274f3376SRichard Henderson aesenc_SB_SR_MC_AK(&t, &t, &aes_zero, false); 116274f3376SRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1179e33e175SWeiwei Li } 1189e33e175SWeiwei Li 1199e33e175SWeiwei Li target_ulong HELPER(aes64es)(target_ulong rs1, target_ulong rs2) 1209e33e175SWeiwei Li { 121cad26538SRichard Henderson AESState t; 122cad26538SRichard Henderson 123cad26538SRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 124cad26538SRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 125cad26538SRichard Henderson aesenc_SB_SR_AK(&t, &t, &aes_zero, false); 126cad26538SRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1279e33e175SWeiwei Li } 1289e33e175SWeiwei Li 1299e33e175SWeiwei Li target_ulong HELPER(aes64ds)(target_ulong rs1, target_ulong rs2) 1309e33e175SWeiwei Li { 1317a70583aSRichard Henderson AESState t; 1327a70583aSRichard Henderson 1337a70583aSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 1347a70583aSRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 1357a70583aSRichard Henderson aesdec_ISB_ISR_AK(&t, &t, &aes_zero, false); 1367a70583aSRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1379e33e175SWeiwei Li } 1389e33e175SWeiwei Li 1399e33e175SWeiwei Li target_ulong HELPER(aes64dsm)(target_ulong rs1, target_ulong rs2) 1409e33e175SWeiwei Li { 141*4ad6f9bfSRichard Henderson AESState t, z = { }; 142*4ad6f9bfSRichard Henderson 143*4ad6f9bfSRichard Henderson /* 144*4ad6f9bfSRichard Henderson * This instruction does not include a round key, 145*4ad6f9bfSRichard Henderson * so supply a zero to our primitive. 146*4ad6f9bfSRichard Henderson */ 147*4ad6f9bfSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 148*4ad6f9bfSRichard Henderson t.d[!HOST_BIG_ENDIAN] = rs2; 149*4ad6f9bfSRichard Henderson aesdec_ISB_ISR_IMC_AK(&t, &t, &z, false); 150*4ad6f9bfSRichard Henderson return t.d[HOST_BIG_ENDIAN]; 1519e33e175SWeiwei Li } 1529e33e175SWeiwei Li 1539e33e175SWeiwei Li target_ulong HELPER(aes64ks2)(target_ulong rs1, target_ulong rs2) 1549e33e175SWeiwei Li { 1559e33e175SWeiwei Li uint64_t RS1 = rs1; 1569e33e175SWeiwei Li uint64_t RS2 = rs2; 1579e33e175SWeiwei Li uint32_t rs1_hi = RS1 >> 32; 1589e33e175SWeiwei Li uint32_t rs2_lo = RS2; 1599e33e175SWeiwei Li uint32_t rs2_hi = RS2 >> 32; 1609e33e175SWeiwei Li 1619e33e175SWeiwei Li uint32_t r_lo = (rs1_hi ^ rs2_lo); 1629e33e175SWeiwei Li uint32_t r_hi = (rs1_hi ^ rs2_lo ^ rs2_hi); 1639e33e175SWeiwei Li target_ulong result = ((uint64_t)r_hi << 32) | r_lo; 1649e33e175SWeiwei Li 1659e33e175SWeiwei Li return result; 1669e33e175SWeiwei Li } 1679e33e175SWeiwei Li 1689e33e175SWeiwei Li target_ulong HELPER(aes64ks1i)(target_ulong rs1, target_ulong rnum) 1699e33e175SWeiwei Li { 1709e33e175SWeiwei Li uint64_t RS1 = rs1; 1719e33e175SWeiwei Li static const uint8_t round_consts[10] = { 1729e33e175SWeiwei Li 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36 1739e33e175SWeiwei Li }; 1749e33e175SWeiwei Li 1759e33e175SWeiwei Li uint8_t enc_rnum = rnum; 1769e33e175SWeiwei Li uint32_t temp = (RS1 >> 32) & 0xFFFFFFFF; 1779e33e175SWeiwei Li uint8_t rcon_ = 0; 1789e33e175SWeiwei Li target_ulong result; 1799e33e175SWeiwei Li 1809e33e175SWeiwei Li if (enc_rnum != 0xA) { 1819e33e175SWeiwei Li temp = ror32(temp, 8); /* Rotate right by 8 */ 1829e33e175SWeiwei Li rcon_ = round_consts[enc_rnum]; 1839e33e175SWeiwei Li } 1849e33e175SWeiwei Li 1859e33e175SWeiwei Li temp = ((uint32_t)AES_sbox[(temp >> 24) & 0xFF] << 24) | 1869e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 16) & 0xFF] << 16) | 1879e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 8) & 0xFF] << 8) | 1889e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 0) & 0xFF] << 0); 1899e33e175SWeiwei Li 1909e33e175SWeiwei Li temp ^= rcon_; 1919e33e175SWeiwei Li 1929e33e175SWeiwei Li result = ((uint64_t)temp << 32) | temp; 1939e33e175SWeiwei Li 1949e33e175SWeiwei Li return result; 1959e33e175SWeiwei Li } 1969e33e175SWeiwei Li 1979e33e175SWeiwei Li target_ulong HELPER(aes64im)(target_ulong rs1) 1989e33e175SWeiwei Li { 199607a5f9dSRichard Henderson AESState t; 2009e33e175SWeiwei Li 201607a5f9dSRichard Henderson t.d[HOST_BIG_ENDIAN] = rs1; 202607a5f9dSRichard Henderson t.d[!HOST_BIG_ENDIAN] = 0; 203607a5f9dSRichard Henderson aesdec_IMC(&t, &t, false); 204607a5f9dSRichard Henderson return t.d[HOST_BIG_ENDIAN]; 2059e33e175SWeiwei Li } 2060976083dSWeiwei Li 2070976083dSWeiwei Li target_ulong HELPER(sm4ed)(target_ulong rs1, target_ulong rs2, 2080976083dSWeiwei Li target_ulong shamt) 2090976083dSWeiwei Li { 2100976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt); 2110976083dSWeiwei Li uint32_t sb_out = (uint32_t)sm4_sbox[sb_in]; 2120976083dSWeiwei Li 2130976083dSWeiwei Li uint32_t x = sb_out ^ (sb_out << 8) ^ (sb_out << 2) ^ (sb_out << 18) ^ 2140976083dSWeiwei Li ((sb_out & 0x3f) << 26) ^ ((sb_out & 0xC0) << 10); 2150976083dSWeiwei Li 2160976083dSWeiwei Li uint32_t rotl = rol32(x, shamt); 2170976083dSWeiwei Li 2180976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1); 2190976083dSWeiwei Li } 2200976083dSWeiwei Li 2210976083dSWeiwei Li target_ulong HELPER(sm4ks)(target_ulong rs1, target_ulong rs2, 2220976083dSWeiwei Li target_ulong shamt) 2230976083dSWeiwei Li { 2240976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt); 2250976083dSWeiwei Li uint32_t sb_out = sm4_sbox[sb_in]; 2260976083dSWeiwei Li 2270976083dSWeiwei Li uint32_t x = sb_out ^ ((sb_out & 0x07) << 29) ^ ((sb_out & 0xFE) << 7) ^ 2280976083dSWeiwei Li ((sb_out & 0x01) << 23) ^ ((sb_out & 0xF8) << 13); 2290976083dSWeiwei Li 2300976083dSWeiwei Li uint32_t rotl = rol32(x, shamt); 2310976083dSWeiwei Li 2320976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1); 2330976083dSWeiwei Li } 23468d19b58SWeiwei Li #undef sext32_xlen 235