1e67cd1caSRichard Henderson /* 2e67cd1caSRichard Henderson * AArch64 SME translation 3e67cd1caSRichard Henderson * 4e67cd1caSRichard Henderson * Copyright (c) 2022 Linaro, Ltd 5e67cd1caSRichard Henderson * 6e67cd1caSRichard Henderson * This library is free software; you can redistribute it and/or 7e67cd1caSRichard Henderson * modify it under the terms of the GNU Lesser General Public 8e67cd1caSRichard Henderson * License as published by the Free Software Foundation; either 9e67cd1caSRichard Henderson * version 2.1 of the License, or (at your option) any later version. 10e67cd1caSRichard Henderson * 11e67cd1caSRichard Henderson * This library is distributed in the hope that it will be useful, 12e67cd1caSRichard Henderson * but WITHOUT ANY WARRANTY; without even the implied warranty of 13e67cd1caSRichard Henderson * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14e67cd1caSRichard Henderson * Lesser General Public License for more details. 15e67cd1caSRichard Henderson * 16e67cd1caSRichard Henderson * You should have received a copy of the GNU Lesser General Public 17e67cd1caSRichard Henderson * License along with this library; if not, see <http://www.gnu.org/licenses/>. 18e67cd1caSRichard Henderson */ 19e67cd1caSRichard Henderson 20e67cd1caSRichard Henderson #include "qemu/osdep.h" 21e67cd1caSRichard Henderson #include "translate.h" 22e67cd1caSRichard Henderson #include "translate-a64.h" 23e67cd1caSRichard Henderson 24e67cd1caSRichard Henderson /* 25e67cd1caSRichard Henderson * Include the generated decoder. 26e67cd1caSRichard Henderson */ 27e67cd1caSRichard Henderson 28e67cd1caSRichard Henderson #include "decode-sme.c.inc" 29ad939afbSRichard Henderson 30ad939afbSRichard Henderson 31e9ad3ef1SRichard Henderson /* 32e9ad3ef1SRichard Henderson * Resolve tile.size[index] to a host pointer, where tile and index 33e9ad3ef1SRichard Henderson * are always decoded together, dependent on the element size. 34e9ad3ef1SRichard Henderson */ 35e9ad3ef1SRichard Henderson static TCGv_ptr get_tile_rowcol(DisasContext *s, int esz, int rs, 36e9ad3ef1SRichard Henderson int tile_index, bool vertical) 37e9ad3ef1SRichard Henderson { 38e9ad3ef1SRichard Henderson int tile = tile_index >> (4 - esz); 39e9ad3ef1SRichard Henderson int index = esz == MO_128 ? 0 : extract32(tile_index, 0, 4 - esz); 40e9ad3ef1SRichard Henderson int pos, len, offset; 41e9ad3ef1SRichard Henderson TCGv_i32 tmp; 42e9ad3ef1SRichard Henderson TCGv_ptr addr; 43e9ad3ef1SRichard Henderson 44e9ad3ef1SRichard Henderson /* Compute the final index, which is Rs+imm. */ 45e9ad3ef1SRichard Henderson tmp = tcg_temp_new_i32(); 46e9ad3ef1SRichard Henderson tcg_gen_trunc_tl_i32(tmp, cpu_reg(s, rs)); 47e9ad3ef1SRichard Henderson tcg_gen_addi_i32(tmp, tmp, index); 48e9ad3ef1SRichard Henderson 49e9ad3ef1SRichard Henderson /* Prepare a power-of-two modulo via extraction of @len bits. */ 50e9ad3ef1SRichard Henderson len = ctz32(streaming_vec_reg_size(s)) - esz; 51e9ad3ef1SRichard Henderson 52e9ad3ef1SRichard Henderson if (vertical) { 53e9ad3ef1SRichard Henderson /* 54e9ad3ef1SRichard Henderson * Compute the byte offset of the index within the tile: 55e9ad3ef1SRichard Henderson * (index % (svl / size)) * size 56e9ad3ef1SRichard Henderson * = (index % (svl >> esz)) << esz 57e9ad3ef1SRichard Henderson * Perform the power-of-two modulo via extraction of the low @len bits. 58e9ad3ef1SRichard Henderson * Perform the multiply by shifting left by @pos bits. 59e9ad3ef1SRichard Henderson * Perform these operations simultaneously via deposit into zero. 60e9ad3ef1SRichard Henderson */ 61e9ad3ef1SRichard Henderson pos = esz; 62e9ad3ef1SRichard Henderson tcg_gen_deposit_z_i32(tmp, tmp, pos, len); 63e9ad3ef1SRichard Henderson 64e9ad3ef1SRichard Henderson /* 65e9ad3ef1SRichard Henderson * For big-endian, adjust the indexed column byte offset within 66e9ad3ef1SRichard Henderson * the uint64_t host words that make up env->zarray[]. 67e9ad3ef1SRichard Henderson */ 68e9ad3ef1SRichard Henderson if (HOST_BIG_ENDIAN && esz < MO_64) { 69e9ad3ef1SRichard Henderson tcg_gen_xori_i32(tmp, tmp, 8 - (1 << esz)); 70e9ad3ef1SRichard Henderson } 71e9ad3ef1SRichard Henderson } else { 72e9ad3ef1SRichard Henderson /* 73e9ad3ef1SRichard Henderson * Compute the byte offset of the index within the tile: 74e9ad3ef1SRichard Henderson * (index % (svl / size)) * (size * sizeof(row)) 75e9ad3ef1SRichard Henderson * = (index % (svl >> esz)) << (esz + log2(sizeof(row))) 76e9ad3ef1SRichard Henderson */ 77e9ad3ef1SRichard Henderson pos = esz + ctz32(sizeof(ARMVectorReg)); 78e9ad3ef1SRichard Henderson tcg_gen_deposit_z_i32(tmp, tmp, pos, len); 79e9ad3ef1SRichard Henderson 80e9ad3ef1SRichard Henderson /* Row slices are always aligned and need no endian adjustment. */ 81e9ad3ef1SRichard Henderson } 82e9ad3ef1SRichard Henderson 83e9ad3ef1SRichard Henderson /* The tile byte offset within env->zarray is the row. */ 84e9ad3ef1SRichard Henderson offset = tile * sizeof(ARMVectorReg); 85e9ad3ef1SRichard Henderson 86e9ad3ef1SRichard Henderson /* Include the byte offset of zarray to make this relative to env. */ 87e9ad3ef1SRichard Henderson offset += offsetof(CPUARMState, zarray); 88e9ad3ef1SRichard Henderson tcg_gen_addi_i32(tmp, tmp, offset); 89e9ad3ef1SRichard Henderson 90e9ad3ef1SRichard Henderson /* Add the byte offset to env to produce the final pointer. */ 91e9ad3ef1SRichard Henderson addr = tcg_temp_new_ptr(); 92e9ad3ef1SRichard Henderson tcg_gen_ext_i32_ptr(addr, tmp); 93e9ad3ef1SRichard Henderson tcg_gen_add_ptr(addr, addr, cpu_env); 94e9ad3ef1SRichard Henderson 95e9ad3ef1SRichard Henderson return addr; 96e9ad3ef1SRichard Henderson } 97e9ad3ef1SRichard Henderson 98*1f51573fSRichard Henderson /* 99*1f51573fSRichard Henderson * Resolve tile.size[0] to a host pointer. 100*1f51573fSRichard Henderson * Used by e.g. outer product insns where we require the entire tile. 101*1f51573fSRichard Henderson */ 102*1f51573fSRichard Henderson static TCGv_ptr get_tile(DisasContext *s, int esz, int tile) 103*1f51573fSRichard Henderson { 104*1f51573fSRichard Henderson TCGv_ptr addr = tcg_temp_new_ptr(); 105*1f51573fSRichard Henderson int offset; 106*1f51573fSRichard Henderson 107*1f51573fSRichard Henderson offset = tile * sizeof(ARMVectorReg) + offsetof(CPUARMState, zarray); 108*1f51573fSRichard Henderson 109*1f51573fSRichard Henderson tcg_gen_addi_ptr(addr, cpu_env, offset); 110*1f51573fSRichard Henderson return addr; 111*1f51573fSRichard Henderson } 112*1f51573fSRichard Henderson 113ad939afbSRichard Henderson static bool trans_ZERO(DisasContext *s, arg_ZERO *a) 114ad939afbSRichard Henderson { 115ad939afbSRichard Henderson if (!dc_isar_feature(aa64_sme, s)) { 116ad939afbSRichard Henderson return false; 117ad939afbSRichard Henderson } 118ad939afbSRichard Henderson if (sme_za_enabled_check(s)) { 119ad939afbSRichard Henderson gen_helper_sme_zero(cpu_env, tcg_constant_i32(a->imm), 120ad939afbSRichard Henderson tcg_constant_i32(streaming_vec_reg_size(s))); 121ad939afbSRichard Henderson } 122ad939afbSRichard Henderson return true; 123ad939afbSRichard Henderson } 124e9ad3ef1SRichard Henderson 125e9ad3ef1SRichard Henderson static bool trans_MOVA(DisasContext *s, arg_MOVA *a) 126e9ad3ef1SRichard Henderson { 127e9ad3ef1SRichard Henderson static gen_helper_gvec_4 * const h_fns[5] = { 128e9ad3ef1SRichard Henderson gen_helper_sve_sel_zpzz_b, gen_helper_sve_sel_zpzz_h, 129e9ad3ef1SRichard Henderson gen_helper_sve_sel_zpzz_s, gen_helper_sve_sel_zpzz_d, 130e9ad3ef1SRichard Henderson gen_helper_sve_sel_zpzz_q 131e9ad3ef1SRichard Henderson }; 132e9ad3ef1SRichard Henderson static gen_helper_gvec_3 * const cz_fns[5] = { 133e9ad3ef1SRichard Henderson gen_helper_sme_mova_cz_b, gen_helper_sme_mova_cz_h, 134e9ad3ef1SRichard Henderson gen_helper_sme_mova_cz_s, gen_helper_sme_mova_cz_d, 135e9ad3ef1SRichard Henderson gen_helper_sme_mova_cz_q, 136e9ad3ef1SRichard Henderson }; 137e9ad3ef1SRichard Henderson static gen_helper_gvec_3 * const zc_fns[5] = { 138e9ad3ef1SRichard Henderson gen_helper_sme_mova_zc_b, gen_helper_sme_mova_zc_h, 139e9ad3ef1SRichard Henderson gen_helper_sme_mova_zc_s, gen_helper_sme_mova_zc_d, 140e9ad3ef1SRichard Henderson gen_helper_sme_mova_zc_q, 141e9ad3ef1SRichard Henderson }; 142e9ad3ef1SRichard Henderson 143e9ad3ef1SRichard Henderson TCGv_ptr t_za, t_zr, t_pg; 144e9ad3ef1SRichard Henderson TCGv_i32 t_desc; 145e9ad3ef1SRichard Henderson int svl; 146e9ad3ef1SRichard Henderson 147e9ad3ef1SRichard Henderson if (!dc_isar_feature(aa64_sme, s)) { 148e9ad3ef1SRichard Henderson return false; 149e9ad3ef1SRichard Henderson } 150e9ad3ef1SRichard Henderson if (!sme_smza_enabled_check(s)) { 151e9ad3ef1SRichard Henderson return true; 152e9ad3ef1SRichard Henderson } 153e9ad3ef1SRichard Henderson 154e9ad3ef1SRichard Henderson t_za = get_tile_rowcol(s, a->esz, a->rs, a->za_imm, a->v); 155e9ad3ef1SRichard Henderson t_zr = vec_full_reg_ptr(s, a->zr); 156e9ad3ef1SRichard Henderson t_pg = pred_full_reg_ptr(s, a->pg); 157e9ad3ef1SRichard Henderson 158e9ad3ef1SRichard Henderson svl = streaming_vec_reg_size(s); 159e9ad3ef1SRichard Henderson t_desc = tcg_constant_i32(simd_desc(svl, svl, 0)); 160e9ad3ef1SRichard Henderson 161e9ad3ef1SRichard Henderson if (a->v) { 162e9ad3ef1SRichard Henderson /* Vertical slice -- use sme mova helpers. */ 163e9ad3ef1SRichard Henderson if (a->to_vec) { 164e9ad3ef1SRichard Henderson zc_fns[a->esz](t_zr, t_za, t_pg, t_desc); 165e9ad3ef1SRichard Henderson } else { 166e9ad3ef1SRichard Henderson cz_fns[a->esz](t_za, t_zr, t_pg, t_desc); 167e9ad3ef1SRichard Henderson } 168e9ad3ef1SRichard Henderson } else { 169e9ad3ef1SRichard Henderson /* Horizontal slice -- reuse sve sel helpers. */ 170e9ad3ef1SRichard Henderson if (a->to_vec) { 171e9ad3ef1SRichard Henderson h_fns[a->esz](t_zr, t_za, t_zr, t_pg, t_desc); 172e9ad3ef1SRichard Henderson } else { 173e9ad3ef1SRichard Henderson h_fns[a->esz](t_za, t_zr, t_za, t_pg, t_desc); 174e9ad3ef1SRichard Henderson } 175e9ad3ef1SRichard Henderson } 176e9ad3ef1SRichard Henderson return true; 177e9ad3ef1SRichard Henderson } 1787390e0e9SRichard Henderson 1797390e0e9SRichard Henderson static bool trans_LDST1(DisasContext *s, arg_LDST1 *a) 1807390e0e9SRichard Henderson { 1817390e0e9SRichard Henderson typedef void GenLdSt1(TCGv_env, TCGv_ptr, TCGv_ptr, TCGv, TCGv_i32); 1827390e0e9SRichard Henderson 1837390e0e9SRichard Henderson /* 1847390e0e9SRichard Henderson * Indexed by [esz][be][v][mte][st], which is (except for load/store) 1857390e0e9SRichard Henderson * also the order in which the elements appear in the function names, 1867390e0e9SRichard Henderson * and so how we must concatenate the pieces. 1877390e0e9SRichard Henderson */ 1887390e0e9SRichard Henderson 1897390e0e9SRichard Henderson #define FN_LS(F) { gen_helper_sme_ld1##F, gen_helper_sme_st1##F } 1907390e0e9SRichard Henderson #define FN_MTE(F) { FN_LS(F), FN_LS(F##_mte) } 1917390e0e9SRichard Henderson #define FN_HV(F) { FN_MTE(F##_h), FN_MTE(F##_v) } 1927390e0e9SRichard Henderson #define FN_END(L, B) { FN_HV(L), FN_HV(B) } 1937390e0e9SRichard Henderson 1947390e0e9SRichard Henderson static GenLdSt1 * const fns[5][2][2][2][2] = { 1957390e0e9SRichard Henderson FN_END(b, b), 1967390e0e9SRichard Henderson FN_END(h_le, h_be), 1977390e0e9SRichard Henderson FN_END(s_le, s_be), 1987390e0e9SRichard Henderson FN_END(d_le, d_be), 1997390e0e9SRichard Henderson FN_END(q_le, q_be), 2007390e0e9SRichard Henderson }; 2017390e0e9SRichard Henderson 2027390e0e9SRichard Henderson #undef FN_LS 2037390e0e9SRichard Henderson #undef FN_MTE 2047390e0e9SRichard Henderson #undef FN_HV 2057390e0e9SRichard Henderson #undef FN_END 2067390e0e9SRichard Henderson 2077390e0e9SRichard Henderson TCGv_ptr t_za, t_pg; 2087390e0e9SRichard Henderson TCGv_i64 addr; 2097390e0e9SRichard Henderson int svl, desc = 0; 2107390e0e9SRichard Henderson bool be = s->be_data == MO_BE; 2117390e0e9SRichard Henderson bool mte = s->mte_active[0]; 2127390e0e9SRichard Henderson 2137390e0e9SRichard Henderson if (!dc_isar_feature(aa64_sme, s)) { 2147390e0e9SRichard Henderson return false; 2157390e0e9SRichard Henderson } 2167390e0e9SRichard Henderson if (!sme_smza_enabled_check(s)) { 2177390e0e9SRichard Henderson return true; 2187390e0e9SRichard Henderson } 2197390e0e9SRichard Henderson 2207390e0e9SRichard Henderson t_za = get_tile_rowcol(s, a->esz, a->rs, a->za_imm, a->v); 2217390e0e9SRichard Henderson t_pg = pred_full_reg_ptr(s, a->pg); 2227390e0e9SRichard Henderson addr = tcg_temp_new_i64(); 2237390e0e9SRichard Henderson 2247390e0e9SRichard Henderson tcg_gen_shli_i64(addr, cpu_reg(s, a->rm), a->esz); 2257390e0e9SRichard Henderson tcg_gen_add_i64(addr, addr, cpu_reg_sp(s, a->rn)); 2267390e0e9SRichard Henderson 2277390e0e9SRichard Henderson if (mte) { 2287390e0e9SRichard Henderson desc = FIELD_DP32(desc, MTEDESC, MIDX, get_mem_index(s)); 2297390e0e9SRichard Henderson desc = FIELD_DP32(desc, MTEDESC, TBI, s->tbid); 2307390e0e9SRichard Henderson desc = FIELD_DP32(desc, MTEDESC, TCMA, s->tcma); 2317390e0e9SRichard Henderson desc = FIELD_DP32(desc, MTEDESC, WRITE, a->st); 2327390e0e9SRichard Henderson desc = FIELD_DP32(desc, MTEDESC, SIZEM1, (1 << a->esz) - 1); 2337390e0e9SRichard Henderson desc <<= SVE_MTEDESC_SHIFT; 2347390e0e9SRichard Henderson } else { 2357390e0e9SRichard Henderson addr = clean_data_tbi(s, addr); 2367390e0e9SRichard Henderson } 2377390e0e9SRichard Henderson svl = streaming_vec_reg_size(s); 2387390e0e9SRichard Henderson desc = simd_desc(svl, svl, desc); 2397390e0e9SRichard Henderson 2407390e0e9SRichard Henderson fns[a->esz][be][a->v][mte][a->st](cpu_env, t_za, t_pg, addr, 2417390e0e9SRichard Henderson tcg_constant_i32(desc)); 2427390e0e9SRichard Henderson return true; 2437390e0e9SRichard Henderson } 2444c46a5f1SRichard Henderson 2454c46a5f1SRichard Henderson typedef void GenLdStR(DisasContext *, TCGv_ptr, int, int, int, int); 2464c46a5f1SRichard Henderson 2474c46a5f1SRichard Henderson static bool do_ldst_r(DisasContext *s, arg_ldstr *a, GenLdStR *fn) 2484c46a5f1SRichard Henderson { 2494c46a5f1SRichard Henderson int svl = streaming_vec_reg_size(s); 2504c46a5f1SRichard Henderson int imm = a->imm; 2514c46a5f1SRichard Henderson TCGv_ptr base; 2524c46a5f1SRichard Henderson 2534c46a5f1SRichard Henderson if (!sme_za_enabled_check(s)) { 2544c46a5f1SRichard Henderson return true; 2554c46a5f1SRichard Henderson } 2564c46a5f1SRichard Henderson 2574c46a5f1SRichard Henderson /* ZA[n] equates to ZA0H.B[n]. */ 2584c46a5f1SRichard Henderson base = get_tile_rowcol(s, MO_8, a->rv, imm, false); 2594c46a5f1SRichard Henderson 2604c46a5f1SRichard Henderson fn(s, base, 0, svl, a->rn, imm * svl); 2614c46a5f1SRichard Henderson return true; 2624c46a5f1SRichard Henderson } 2634c46a5f1SRichard Henderson 2644c46a5f1SRichard Henderson TRANS_FEAT(LDR, aa64_sme, do_ldst_r, a, gen_sve_ldr) 2654c46a5f1SRichard Henderson TRANS_FEAT(STR, aa64_sme, do_ldst_r, a, gen_sve_str) 266bc4420d9SRichard Henderson 267bc4420d9SRichard Henderson static bool do_adda(DisasContext *s, arg_adda *a, MemOp esz, 268bc4420d9SRichard Henderson gen_helper_gvec_4 *fn) 269bc4420d9SRichard Henderson { 270bc4420d9SRichard Henderson int svl = streaming_vec_reg_size(s); 271bc4420d9SRichard Henderson uint32_t desc = simd_desc(svl, svl, 0); 272bc4420d9SRichard Henderson TCGv_ptr za, zn, pn, pm; 273bc4420d9SRichard Henderson 274bc4420d9SRichard Henderson if (!sme_smza_enabled_check(s)) { 275bc4420d9SRichard Henderson return true; 276bc4420d9SRichard Henderson } 277bc4420d9SRichard Henderson 278*1f51573fSRichard Henderson za = get_tile(s, esz, a->zad); 279bc4420d9SRichard Henderson zn = vec_full_reg_ptr(s, a->zn); 280bc4420d9SRichard Henderson pn = pred_full_reg_ptr(s, a->pn); 281bc4420d9SRichard Henderson pm = pred_full_reg_ptr(s, a->pm); 282bc4420d9SRichard Henderson 283bc4420d9SRichard Henderson fn(za, zn, pn, pm, tcg_constant_i32(desc)); 284bc4420d9SRichard Henderson return true; 285bc4420d9SRichard Henderson } 286bc4420d9SRichard Henderson 287bc4420d9SRichard Henderson TRANS_FEAT(ADDHA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addha_s) 288bc4420d9SRichard Henderson TRANS_FEAT(ADDVA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addva_s) 289bc4420d9SRichard Henderson TRANS_FEAT(ADDHA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addha_d) 290bc4420d9SRichard Henderson TRANS_FEAT(ADDVA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addva_d) 291558e956cSRichard Henderson 292920f640dSRichard Henderson static bool do_outprod(DisasContext *s, arg_op *a, MemOp esz, 293920f640dSRichard Henderson gen_helper_gvec_5 *fn) 294920f640dSRichard Henderson { 295920f640dSRichard Henderson int svl = streaming_vec_reg_size(s); 296920f640dSRichard Henderson uint32_t desc = simd_desc(svl, svl, a->sub); 297920f640dSRichard Henderson TCGv_ptr za, zn, zm, pn, pm; 298920f640dSRichard Henderson 299920f640dSRichard Henderson if (!sme_smza_enabled_check(s)) { 300920f640dSRichard Henderson return true; 301920f640dSRichard Henderson } 302920f640dSRichard Henderson 303*1f51573fSRichard Henderson za = get_tile(s, esz, a->zad); 304920f640dSRichard Henderson zn = vec_full_reg_ptr(s, a->zn); 305920f640dSRichard Henderson zm = vec_full_reg_ptr(s, a->zm); 306920f640dSRichard Henderson pn = pred_full_reg_ptr(s, a->pn); 307920f640dSRichard Henderson pm = pred_full_reg_ptr(s, a->pm); 308920f640dSRichard Henderson 309920f640dSRichard Henderson fn(za, zn, zm, pn, pm, tcg_constant_i32(desc)); 310920f640dSRichard Henderson return true; 311920f640dSRichard Henderson } 312920f640dSRichard Henderson 313558e956cSRichard Henderson static bool do_outprod_fpst(DisasContext *s, arg_op *a, MemOp esz, 314558e956cSRichard Henderson gen_helper_gvec_5_ptr *fn) 315558e956cSRichard Henderson { 316558e956cSRichard Henderson int svl = streaming_vec_reg_size(s); 317558e956cSRichard Henderson uint32_t desc = simd_desc(svl, svl, a->sub); 318558e956cSRichard Henderson TCGv_ptr za, zn, zm, pn, pm, fpst; 319558e956cSRichard Henderson 320558e956cSRichard Henderson if (!sme_smza_enabled_check(s)) { 321558e956cSRichard Henderson return true; 322558e956cSRichard Henderson } 323558e956cSRichard Henderson 324*1f51573fSRichard Henderson za = get_tile(s, esz, a->zad); 325558e956cSRichard Henderson zn = vec_full_reg_ptr(s, a->zn); 326558e956cSRichard Henderson zm = vec_full_reg_ptr(s, a->zm); 327558e956cSRichard Henderson pn = pred_full_reg_ptr(s, a->pn); 328558e956cSRichard Henderson pm = pred_full_reg_ptr(s, a->pm); 329558e956cSRichard Henderson fpst = fpstatus_ptr(FPST_FPCR); 330558e956cSRichard Henderson 331558e956cSRichard Henderson fn(za, zn, zm, pn, pm, fpst, tcg_constant_i32(desc)); 332558e956cSRichard Henderson return true; 333558e956cSRichard Henderson } 334558e956cSRichard Henderson 3353916841aSRichard Henderson TRANS_FEAT(FMOPA_h, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_h) 336558e956cSRichard Henderson TRANS_FEAT(FMOPA_s, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_s) 337558e956cSRichard Henderson TRANS_FEAT(FMOPA_d, aa64_sme_f64f64, do_outprod_fpst, a, MO_64, gen_helper_sme_fmopa_d) 338920f640dSRichard Henderson 339920f640dSRichard Henderson /* TODO: FEAT_EBF16 */ 340920f640dSRichard Henderson TRANS_FEAT(BFMOPA, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_bfmopa) 34123a5e385SRichard Henderson 34223a5e385SRichard Henderson TRANS_FEAT(SMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_smopa_s) 34323a5e385SRichard Henderson TRANS_FEAT(UMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_umopa_s) 34423a5e385SRichard Henderson TRANS_FEAT(SUMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_sumopa_s) 34523a5e385SRichard Henderson TRANS_FEAT(USMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_usmopa_s) 34623a5e385SRichard Henderson 34723a5e385SRichard Henderson TRANS_FEAT(SMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_smopa_d) 34823a5e385SRichard Henderson TRANS_FEAT(UMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_umopa_d) 34923a5e385SRichard Henderson TRANS_FEAT(SUMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_sumopa_d) 35023a5e385SRichard Henderson TRANS_FEAT(USMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_usmopa_d) 351