168d19b58SWeiwei Li /* 268d19b58SWeiwei Li * RISC-V Crypto Emulation Helpers for QEMU. 368d19b58SWeiwei Li * 468d19b58SWeiwei Li * Copyright (c) 2021 Ruibo Lu, luruibo2000@163.com 568d19b58SWeiwei Li * Copyright (c) 2021 Zewen Ye, lustrew@foxmail.com 668d19b58SWeiwei Li * 768d19b58SWeiwei Li * This program is free software; you can redistribute it and/or modify it 868d19b58SWeiwei Li * under the terms and conditions of the GNU General Public License, 968d19b58SWeiwei Li * version 2 or later, as published by the Free Software Foundation. 1068d19b58SWeiwei Li * 1168d19b58SWeiwei Li * This program is distributed in the hope it will be useful, but WITHOUT 1268d19b58SWeiwei Li * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 1368d19b58SWeiwei Li * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 1468d19b58SWeiwei Li * more details. 1568d19b58SWeiwei Li * 1668d19b58SWeiwei Li * You should have received a copy of the GNU General Public License along with 1768d19b58SWeiwei Li * this program. If not, see <http://www.gnu.org/licenses/>. 1868d19b58SWeiwei Li */ 1968d19b58SWeiwei Li 2068d19b58SWeiwei Li #include "qemu/osdep.h" 2168d19b58SWeiwei Li #include "cpu.h" 2268d19b58SWeiwei Li #include "exec/exec-all.h" 2368d19b58SWeiwei Li #include "exec/helper-proto.h" 2468d19b58SWeiwei Li #include "crypto/aes.h" 2568d19b58SWeiwei Li #include "crypto/sm4.h" 2668d19b58SWeiwei Li 2768d19b58SWeiwei Li #define AES_XTIME(a) \ 2868d19b58SWeiwei Li ((a << 1) ^ ((a & 0x80) ? 0x1b : 0)) 2968d19b58SWeiwei Li 3068d19b58SWeiwei Li #define AES_GFMUL(a, b) (( \ 3168d19b58SWeiwei Li (((b) & 0x1) ? (a) : 0) ^ \ 3268d19b58SWeiwei Li (((b) & 0x2) ? AES_XTIME(a) : 0) ^ \ 3368d19b58SWeiwei Li (((b) & 0x4) ? AES_XTIME(AES_XTIME(a)) : 0) ^ \ 3468d19b58SWeiwei Li (((b) & 0x8) ? AES_XTIME(AES_XTIME(AES_XTIME(a))) : 0)) & 0xFF) 3568d19b58SWeiwei Li 3668d19b58SWeiwei Li static inline uint32_t aes_mixcolumn_byte(uint8_t x, bool fwd) 3768d19b58SWeiwei Li { 3868d19b58SWeiwei Li uint32_t u; 3968d19b58SWeiwei Li 4068d19b58SWeiwei Li if (fwd) { 4168d19b58SWeiwei Li u = (AES_GFMUL(x, 3) << 24) | (x << 16) | (x << 8) | 4268d19b58SWeiwei Li (AES_GFMUL(x, 2) << 0); 4368d19b58SWeiwei Li } else { 4468d19b58SWeiwei Li u = (AES_GFMUL(x, 0xb) << 24) | (AES_GFMUL(x, 0xd) << 16) | 4568d19b58SWeiwei Li (AES_GFMUL(x, 0x9) << 8) | (AES_GFMUL(x, 0xe) << 0); 4668d19b58SWeiwei Li } 4768d19b58SWeiwei Li return u; 4868d19b58SWeiwei Li } 4968d19b58SWeiwei Li 5068d19b58SWeiwei Li #define sext32_xlen(x) (target_ulong)(int32_t)(x) 5168d19b58SWeiwei Li 5268d19b58SWeiwei Li static inline target_ulong aes32_operation(target_ulong shamt, 5368d19b58SWeiwei Li target_ulong rs1, target_ulong rs2, 5468d19b58SWeiwei Li bool enc, bool mix) 5568d19b58SWeiwei Li { 5668d19b58SWeiwei Li uint8_t si = rs2 >> shamt; 5768d19b58SWeiwei Li uint8_t so; 5868d19b58SWeiwei Li uint32_t mixed; 5968d19b58SWeiwei Li target_ulong res; 6068d19b58SWeiwei Li 6168d19b58SWeiwei Li if (enc) { 6268d19b58SWeiwei Li so = AES_sbox[si]; 6368d19b58SWeiwei Li if (mix) { 6468d19b58SWeiwei Li mixed = aes_mixcolumn_byte(so, true); 6568d19b58SWeiwei Li } else { 6668d19b58SWeiwei Li mixed = so; 6768d19b58SWeiwei Li } 6868d19b58SWeiwei Li } else { 6968d19b58SWeiwei Li so = AES_isbox[si]; 7068d19b58SWeiwei Li if (mix) { 7168d19b58SWeiwei Li mixed = aes_mixcolumn_byte(so, false); 7268d19b58SWeiwei Li } else { 7368d19b58SWeiwei Li mixed = so; 7468d19b58SWeiwei Li } 7568d19b58SWeiwei Li } 7668d19b58SWeiwei Li mixed = rol32(mixed, shamt); 7768d19b58SWeiwei Li res = rs1 ^ mixed; 7868d19b58SWeiwei Li 7968d19b58SWeiwei Li return sext32_xlen(res); 8068d19b58SWeiwei Li } 8168d19b58SWeiwei Li 8268d19b58SWeiwei Li target_ulong HELPER(aes32esmi)(target_ulong rs1, target_ulong rs2, 8368d19b58SWeiwei Li target_ulong shamt) 8468d19b58SWeiwei Li { 8568d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, true); 8668d19b58SWeiwei Li } 8768d19b58SWeiwei Li 8868d19b58SWeiwei Li target_ulong HELPER(aes32esi)(target_ulong rs1, target_ulong rs2, 8968d19b58SWeiwei Li target_ulong shamt) 9068d19b58SWeiwei Li { 9168d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, true, false); 9268d19b58SWeiwei Li } 9368d19b58SWeiwei Li 9468d19b58SWeiwei Li target_ulong HELPER(aes32dsmi)(target_ulong rs1, target_ulong rs2, 9568d19b58SWeiwei Li target_ulong shamt) 9668d19b58SWeiwei Li { 9768d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, true); 9868d19b58SWeiwei Li } 9968d19b58SWeiwei Li 10068d19b58SWeiwei Li target_ulong HELPER(aes32dsi)(target_ulong rs1, target_ulong rs2, 10168d19b58SWeiwei Li target_ulong shamt) 10268d19b58SWeiwei Li { 10368d19b58SWeiwei Li return aes32_operation(shamt, rs1, rs2, false, false); 10468d19b58SWeiwei Li } 1059e33e175SWeiwei Li 1069e33e175SWeiwei Li #define BY(X, I) ((X >> (8 * I)) & 0xFF) 1079e33e175SWeiwei Li 1089e33e175SWeiwei Li #define AES_SHIFROWS_LO(RS1, RS2) ( \ 1099e33e175SWeiwei Li (((RS1 >> 24) & 0xFF) << 56) | (((RS2 >> 48) & 0xFF) << 48) | \ 1109e33e175SWeiwei Li (((RS2 >> 8) & 0xFF) << 40) | (((RS1 >> 32) & 0xFF) << 32) | \ 1119e33e175SWeiwei Li (((RS2 >> 56) & 0xFF) << 24) | (((RS2 >> 16) & 0xFF) << 16) | \ 1129e33e175SWeiwei Li (((RS1 >> 40) & 0xFF) << 8) | (((RS1 >> 0) & 0xFF) << 0)) 1139e33e175SWeiwei Li 1149e33e175SWeiwei Li #define AES_INVSHIFROWS_LO(RS1, RS2) ( \ 1159e33e175SWeiwei Li (((RS2 >> 24) & 0xFF) << 56) | (((RS2 >> 48) & 0xFF) << 48) | \ 1169e33e175SWeiwei Li (((RS1 >> 8) & 0xFF) << 40) | (((RS1 >> 32) & 0xFF) << 32) | \ 1179e33e175SWeiwei Li (((RS1 >> 56) & 0xFF) << 24) | (((RS2 >> 16) & 0xFF) << 16) | \ 1189e33e175SWeiwei Li (((RS2 >> 40) & 0xFF) << 8) | (((RS1 >> 0) & 0xFF) << 0)) 1199e33e175SWeiwei Li 1209e33e175SWeiwei Li #define AES_MIXBYTE(COL, B0, B1, B2, B3) ( \ 1219e33e175SWeiwei Li BY(COL, B3) ^ BY(COL, B2) ^ AES_GFMUL(BY(COL, B1), 3) ^ \ 1229e33e175SWeiwei Li AES_GFMUL(BY(COL, B0), 2)) 1239e33e175SWeiwei Li 1249e33e175SWeiwei Li #define AES_MIXCOLUMN(COL) ( \ 1259e33e175SWeiwei Li AES_MIXBYTE(COL, 3, 0, 1, 2) << 24 | \ 1269e33e175SWeiwei Li AES_MIXBYTE(COL, 2, 3, 0, 1) << 16 | \ 1279e33e175SWeiwei Li AES_MIXBYTE(COL, 1, 2, 3, 0) << 8 | AES_MIXBYTE(COL, 0, 1, 2, 3) << 0) 1289e33e175SWeiwei Li 1299e33e175SWeiwei Li #define AES_INVMIXBYTE(COL, B0, B1, B2, B3) ( \ 1309e33e175SWeiwei Li AES_GFMUL(BY(COL, B3), 0x9) ^ AES_GFMUL(BY(COL, B2), 0xd) ^ \ 1319e33e175SWeiwei Li AES_GFMUL(BY(COL, B1), 0xb) ^ AES_GFMUL(BY(COL, B0), 0xe)) 1329e33e175SWeiwei Li 1339e33e175SWeiwei Li #define AES_INVMIXCOLUMN(COL) ( \ 1349e33e175SWeiwei Li AES_INVMIXBYTE(COL, 3, 0, 1, 2) << 24 | \ 1359e33e175SWeiwei Li AES_INVMIXBYTE(COL, 2, 3, 0, 1) << 16 | \ 1369e33e175SWeiwei Li AES_INVMIXBYTE(COL, 1, 2, 3, 0) << 8 | \ 1379e33e175SWeiwei Li AES_INVMIXBYTE(COL, 0, 1, 2, 3) << 0) 1389e33e175SWeiwei Li 1399e33e175SWeiwei Li static inline target_ulong aes64_operation(target_ulong rs1, target_ulong rs2, 1409e33e175SWeiwei Li bool enc, bool mix) 1419e33e175SWeiwei Li { 1429e33e175SWeiwei Li uint64_t RS1 = rs1; 1439e33e175SWeiwei Li uint64_t RS2 = rs2; 1449e33e175SWeiwei Li uint64_t result; 1459e33e175SWeiwei Li uint64_t temp; 1469e33e175SWeiwei Li uint32_t col_0; 1479e33e175SWeiwei Li uint32_t col_1; 1489e33e175SWeiwei Li 1499e33e175SWeiwei Li if (enc) { 1509e33e175SWeiwei Li temp = AES_SHIFROWS_LO(RS1, RS2); 1519e33e175SWeiwei Li temp = (((uint64_t)AES_sbox[(temp >> 0) & 0xFF] << 0) | 1529e33e175SWeiwei Li ((uint64_t)AES_sbox[(temp >> 8) & 0xFF] << 8) | 1539e33e175SWeiwei Li ((uint64_t)AES_sbox[(temp >> 16) & 0xFF] << 16) | 1549e33e175SWeiwei Li ((uint64_t)AES_sbox[(temp >> 24) & 0xFF] << 24) | 1559e33e175SWeiwei Li ((uint64_t)AES_sbox[(temp >> 32) & 0xFF] << 32) | 1569e33e175SWeiwei Li ((uint64_t)AES_sbox[(temp >> 40) & 0xFF] << 40) | 1579e33e175SWeiwei Li ((uint64_t)AES_sbox[(temp >> 48) & 0xFF] << 48) | 1589e33e175SWeiwei Li ((uint64_t)AES_sbox[(temp >> 56) & 0xFF] << 56)); 1599e33e175SWeiwei Li if (mix) { 1609e33e175SWeiwei Li col_0 = temp & 0xFFFFFFFF; 1619e33e175SWeiwei Li col_1 = temp >> 32; 1629e33e175SWeiwei Li 1639e33e175SWeiwei Li col_0 = AES_MIXCOLUMN(col_0); 1649e33e175SWeiwei Li col_1 = AES_MIXCOLUMN(col_1); 1659e33e175SWeiwei Li 1669e33e175SWeiwei Li result = ((uint64_t)col_1 << 32) | col_0; 1679e33e175SWeiwei Li } else { 1689e33e175SWeiwei Li result = temp; 1699e33e175SWeiwei Li } 1709e33e175SWeiwei Li } else { 1719e33e175SWeiwei Li temp = AES_INVSHIFROWS_LO(RS1, RS2); 1729e33e175SWeiwei Li temp = (((uint64_t)AES_isbox[(temp >> 0) & 0xFF] << 0) | 1739e33e175SWeiwei Li ((uint64_t)AES_isbox[(temp >> 8) & 0xFF] << 8) | 1749e33e175SWeiwei Li ((uint64_t)AES_isbox[(temp >> 16) & 0xFF] << 16) | 1759e33e175SWeiwei Li ((uint64_t)AES_isbox[(temp >> 24) & 0xFF] << 24) | 1769e33e175SWeiwei Li ((uint64_t)AES_isbox[(temp >> 32) & 0xFF] << 32) | 1779e33e175SWeiwei Li ((uint64_t)AES_isbox[(temp >> 40) & 0xFF] << 40) | 1789e33e175SWeiwei Li ((uint64_t)AES_isbox[(temp >> 48) & 0xFF] << 48) | 1799e33e175SWeiwei Li ((uint64_t)AES_isbox[(temp >> 56) & 0xFF] << 56)); 1809e33e175SWeiwei Li if (mix) { 1819e33e175SWeiwei Li col_0 = temp & 0xFFFFFFFF; 1829e33e175SWeiwei Li col_1 = temp >> 32; 1839e33e175SWeiwei Li 1849e33e175SWeiwei Li col_0 = AES_INVMIXCOLUMN(col_0); 1859e33e175SWeiwei Li col_1 = AES_INVMIXCOLUMN(col_1); 1869e33e175SWeiwei Li 1879e33e175SWeiwei Li result = ((uint64_t)col_1 << 32) | col_0; 1889e33e175SWeiwei Li } else { 1899e33e175SWeiwei Li result = temp; 1909e33e175SWeiwei Li } 1919e33e175SWeiwei Li } 1929e33e175SWeiwei Li 1939e33e175SWeiwei Li return result; 1949e33e175SWeiwei Li } 1959e33e175SWeiwei Li 1969e33e175SWeiwei Li target_ulong HELPER(aes64esm)(target_ulong rs1, target_ulong rs2) 1979e33e175SWeiwei Li { 1989e33e175SWeiwei Li return aes64_operation(rs1, rs2, true, true); 1999e33e175SWeiwei Li } 2009e33e175SWeiwei Li 2019e33e175SWeiwei Li target_ulong HELPER(aes64es)(target_ulong rs1, target_ulong rs2) 2029e33e175SWeiwei Li { 2039e33e175SWeiwei Li return aes64_operation(rs1, rs2, true, false); 2049e33e175SWeiwei Li } 2059e33e175SWeiwei Li 2069e33e175SWeiwei Li target_ulong HELPER(aes64ds)(target_ulong rs1, target_ulong rs2) 2079e33e175SWeiwei Li { 2089e33e175SWeiwei Li return aes64_operation(rs1, rs2, false, false); 2099e33e175SWeiwei Li } 2109e33e175SWeiwei Li 2119e33e175SWeiwei Li target_ulong HELPER(aes64dsm)(target_ulong rs1, target_ulong rs2) 2129e33e175SWeiwei Li { 2139e33e175SWeiwei Li return aes64_operation(rs1, rs2, false, true); 2149e33e175SWeiwei Li } 2159e33e175SWeiwei Li 2169e33e175SWeiwei Li target_ulong HELPER(aes64ks2)(target_ulong rs1, target_ulong rs2) 2179e33e175SWeiwei Li { 2189e33e175SWeiwei Li uint64_t RS1 = rs1; 2199e33e175SWeiwei Li uint64_t RS2 = rs2; 2209e33e175SWeiwei Li uint32_t rs1_hi = RS1 >> 32; 2219e33e175SWeiwei Li uint32_t rs2_lo = RS2; 2229e33e175SWeiwei Li uint32_t rs2_hi = RS2 >> 32; 2239e33e175SWeiwei Li 2249e33e175SWeiwei Li uint32_t r_lo = (rs1_hi ^ rs2_lo); 2259e33e175SWeiwei Li uint32_t r_hi = (rs1_hi ^ rs2_lo ^ rs2_hi); 2269e33e175SWeiwei Li target_ulong result = ((uint64_t)r_hi << 32) | r_lo; 2279e33e175SWeiwei Li 2289e33e175SWeiwei Li return result; 2299e33e175SWeiwei Li } 2309e33e175SWeiwei Li 2319e33e175SWeiwei Li target_ulong HELPER(aes64ks1i)(target_ulong rs1, target_ulong rnum) 2329e33e175SWeiwei Li { 2339e33e175SWeiwei Li uint64_t RS1 = rs1; 2349e33e175SWeiwei Li static const uint8_t round_consts[10] = { 2359e33e175SWeiwei Li 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36 2369e33e175SWeiwei Li }; 2379e33e175SWeiwei Li 2389e33e175SWeiwei Li uint8_t enc_rnum = rnum; 2399e33e175SWeiwei Li uint32_t temp = (RS1 >> 32) & 0xFFFFFFFF; 2409e33e175SWeiwei Li uint8_t rcon_ = 0; 2419e33e175SWeiwei Li target_ulong result; 2429e33e175SWeiwei Li 2439e33e175SWeiwei Li if (enc_rnum != 0xA) { 2449e33e175SWeiwei Li temp = ror32(temp, 8); /* Rotate right by 8 */ 2459e33e175SWeiwei Li rcon_ = round_consts[enc_rnum]; 2469e33e175SWeiwei Li } 2479e33e175SWeiwei Li 2489e33e175SWeiwei Li temp = ((uint32_t)AES_sbox[(temp >> 24) & 0xFF] << 24) | 2499e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 16) & 0xFF] << 16) | 2509e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 8) & 0xFF] << 8) | 2519e33e175SWeiwei Li ((uint32_t)AES_sbox[(temp >> 0) & 0xFF] << 0); 2529e33e175SWeiwei Li 2539e33e175SWeiwei Li temp ^= rcon_; 2549e33e175SWeiwei Li 2559e33e175SWeiwei Li result = ((uint64_t)temp << 32) | temp; 2569e33e175SWeiwei Li 2579e33e175SWeiwei Li return result; 2589e33e175SWeiwei Li } 2599e33e175SWeiwei Li 2609e33e175SWeiwei Li target_ulong HELPER(aes64im)(target_ulong rs1) 2619e33e175SWeiwei Li { 2629e33e175SWeiwei Li uint64_t RS1 = rs1; 2639e33e175SWeiwei Li uint32_t col_0 = RS1 & 0xFFFFFFFF; 2649e33e175SWeiwei Li uint32_t col_1 = RS1 >> 32; 2659e33e175SWeiwei Li target_ulong result; 2669e33e175SWeiwei Li 2679e33e175SWeiwei Li col_0 = AES_INVMIXCOLUMN(col_0); 2689e33e175SWeiwei Li col_1 = AES_INVMIXCOLUMN(col_1); 2699e33e175SWeiwei Li 2709e33e175SWeiwei Li result = ((uint64_t)col_1 << 32) | col_0; 2719e33e175SWeiwei Li 2729e33e175SWeiwei Li return result; 2739e33e175SWeiwei Li } 274*0976083dSWeiwei Li 275*0976083dSWeiwei Li target_ulong HELPER(sm4ed)(target_ulong rs1, target_ulong rs2, 276*0976083dSWeiwei Li target_ulong shamt) 277*0976083dSWeiwei Li { 278*0976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt); 279*0976083dSWeiwei Li uint32_t sb_out = (uint32_t)sm4_sbox[sb_in]; 280*0976083dSWeiwei Li 281*0976083dSWeiwei Li uint32_t x = sb_out ^ (sb_out << 8) ^ (sb_out << 2) ^ (sb_out << 18) ^ 282*0976083dSWeiwei Li ((sb_out & 0x3f) << 26) ^ ((sb_out & 0xC0) << 10); 283*0976083dSWeiwei Li 284*0976083dSWeiwei Li uint32_t rotl = rol32(x, shamt); 285*0976083dSWeiwei Li 286*0976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1); 287*0976083dSWeiwei Li } 288*0976083dSWeiwei Li 289*0976083dSWeiwei Li target_ulong HELPER(sm4ks)(target_ulong rs1, target_ulong rs2, 290*0976083dSWeiwei Li target_ulong shamt) 291*0976083dSWeiwei Li { 292*0976083dSWeiwei Li uint32_t sb_in = (uint8_t)(rs2 >> shamt); 293*0976083dSWeiwei Li uint32_t sb_out = sm4_sbox[sb_in]; 294*0976083dSWeiwei Li 295*0976083dSWeiwei Li uint32_t x = sb_out ^ ((sb_out & 0x07) << 29) ^ ((sb_out & 0xFE) << 7) ^ 296*0976083dSWeiwei Li ((sb_out & 0x01) << 23) ^ ((sb_out & 0xF8) << 13); 297*0976083dSWeiwei Li 298*0976083dSWeiwei Li uint32_t rotl = rol32(x, shamt); 299*0976083dSWeiwei Li 300*0976083dSWeiwei Li return sext32_xlen(rotl ^ (uint32_t)rs1); 301*0976083dSWeiwei Li } 30268d19b58SWeiwei Li #undef sext32_xlen 303