xref: /qemu/target/arm/tcg/translate-sme.c (revision 1f51573f7925b80e79a29f87c7d9d6ead60960c0)
/*
 * AArch64 SME translation
 *
 * Copyright (c) 2022 Linaro, Ltd
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
19e67cd1caSRichard Henderson 
20e67cd1caSRichard Henderson #include "qemu/osdep.h"
21e67cd1caSRichard Henderson #include "translate.h"
22e67cd1caSRichard Henderson #include "translate-a64.h"
23e67cd1caSRichard Henderson 
/*
 * Include the generated decoder.
 */
27e67cd1caSRichard Henderson 
28e67cd1caSRichard Henderson #include "decode-sme.c.inc"
29ad939afbSRichard Henderson 
30ad939afbSRichard Henderson 
31e9ad3ef1SRichard Henderson /*
32e9ad3ef1SRichard Henderson  * Resolve tile.size[index] to a host pointer, where tile and index
33e9ad3ef1SRichard Henderson  * are always decoded together, dependent on the element size.
34e9ad3ef1SRichard Henderson  */
35e9ad3ef1SRichard Henderson static TCGv_ptr get_tile_rowcol(DisasContext *s, int esz, int rs,
36e9ad3ef1SRichard Henderson                                 int tile_index, bool vertical)
37e9ad3ef1SRichard Henderson {
38e9ad3ef1SRichard Henderson     int tile = tile_index >> (4 - esz);
39e9ad3ef1SRichard Henderson     int index = esz == MO_128 ? 0 : extract32(tile_index, 0, 4 - esz);
40e9ad3ef1SRichard Henderson     int pos, len, offset;
41e9ad3ef1SRichard Henderson     TCGv_i32 tmp;
42e9ad3ef1SRichard Henderson     TCGv_ptr addr;
43e9ad3ef1SRichard Henderson 
44e9ad3ef1SRichard Henderson     /* Compute the final index, which is Rs+imm. */
45e9ad3ef1SRichard Henderson     tmp = tcg_temp_new_i32();
46e9ad3ef1SRichard Henderson     tcg_gen_trunc_tl_i32(tmp, cpu_reg(s, rs));
47e9ad3ef1SRichard Henderson     tcg_gen_addi_i32(tmp, tmp, index);
48e9ad3ef1SRichard Henderson 
49e9ad3ef1SRichard Henderson     /* Prepare a power-of-two modulo via extraction of @len bits. */
50e9ad3ef1SRichard Henderson     len = ctz32(streaming_vec_reg_size(s)) - esz;
51e9ad3ef1SRichard Henderson 
52e9ad3ef1SRichard Henderson     if (vertical) {
53e9ad3ef1SRichard Henderson         /*
54e9ad3ef1SRichard Henderson          * Compute the byte offset of the index within the tile:
55e9ad3ef1SRichard Henderson          *     (index % (svl / size)) * size
56e9ad3ef1SRichard Henderson          *   = (index % (svl >> esz)) << esz
57e9ad3ef1SRichard Henderson          * Perform the power-of-two modulo via extraction of the low @len bits.
58e9ad3ef1SRichard Henderson          * Perform the multiply by shifting left by @pos bits.
59e9ad3ef1SRichard Henderson          * Perform these operations simultaneously via deposit into zero.
60e9ad3ef1SRichard Henderson          */
61e9ad3ef1SRichard Henderson         pos = esz;
62e9ad3ef1SRichard Henderson         tcg_gen_deposit_z_i32(tmp, tmp, pos, len);
63e9ad3ef1SRichard Henderson 
64e9ad3ef1SRichard Henderson         /*
65e9ad3ef1SRichard Henderson          * For big-endian, adjust the indexed column byte offset within
66e9ad3ef1SRichard Henderson          * the uint64_t host words that make up env->zarray[].
67e9ad3ef1SRichard Henderson          */
68e9ad3ef1SRichard Henderson         if (HOST_BIG_ENDIAN && esz < MO_64) {
69e9ad3ef1SRichard Henderson             tcg_gen_xori_i32(tmp, tmp, 8 - (1 << esz));
70e9ad3ef1SRichard Henderson         }
71e9ad3ef1SRichard Henderson     } else {
72e9ad3ef1SRichard Henderson         /*
73e9ad3ef1SRichard Henderson          * Compute the byte offset of the index within the tile:
74e9ad3ef1SRichard Henderson          *     (index % (svl / size)) * (size * sizeof(row))
75e9ad3ef1SRichard Henderson          *   = (index % (svl >> esz)) << (esz + log2(sizeof(row)))
76e9ad3ef1SRichard Henderson          */
77e9ad3ef1SRichard Henderson         pos = esz + ctz32(sizeof(ARMVectorReg));
78e9ad3ef1SRichard Henderson         tcg_gen_deposit_z_i32(tmp, tmp, pos, len);
79e9ad3ef1SRichard Henderson 
80e9ad3ef1SRichard Henderson         /* Row slices are always aligned and need no endian adjustment. */
81e9ad3ef1SRichard Henderson     }
82e9ad3ef1SRichard Henderson 
83e9ad3ef1SRichard Henderson     /* The tile byte offset within env->zarray is the row. */
84e9ad3ef1SRichard Henderson     offset = tile * sizeof(ARMVectorReg);
85e9ad3ef1SRichard Henderson 
86e9ad3ef1SRichard Henderson     /* Include the byte offset of zarray to make this relative to env. */
87e9ad3ef1SRichard Henderson     offset += offsetof(CPUARMState, zarray);
88e9ad3ef1SRichard Henderson     tcg_gen_addi_i32(tmp, tmp, offset);
89e9ad3ef1SRichard Henderson 
90e9ad3ef1SRichard Henderson     /* Add the byte offset to env to produce the final pointer. */
91e9ad3ef1SRichard Henderson     addr = tcg_temp_new_ptr();
92e9ad3ef1SRichard Henderson     tcg_gen_ext_i32_ptr(addr, tmp);
93e9ad3ef1SRichard Henderson     tcg_gen_add_ptr(addr, addr, cpu_env);
94e9ad3ef1SRichard Henderson 
95e9ad3ef1SRichard Henderson     return addr;
96e9ad3ef1SRichard Henderson }
97e9ad3ef1SRichard Henderson 
98*1f51573fSRichard Henderson /*
99*1f51573fSRichard Henderson  * Resolve tile.size[0] to a host pointer.
100*1f51573fSRichard Henderson  * Used by e.g. outer product insns where we require the entire tile.
101*1f51573fSRichard Henderson  */
102*1f51573fSRichard Henderson static TCGv_ptr get_tile(DisasContext *s, int esz, int tile)
103*1f51573fSRichard Henderson {
104*1f51573fSRichard Henderson     TCGv_ptr addr = tcg_temp_new_ptr();
105*1f51573fSRichard Henderson     int offset;
106*1f51573fSRichard Henderson 
107*1f51573fSRichard Henderson     offset = tile * sizeof(ARMVectorReg) + offsetof(CPUARMState, zarray);
108*1f51573fSRichard Henderson 
109*1f51573fSRichard Henderson     tcg_gen_addi_ptr(addr, cpu_env, offset);
110*1f51573fSRichard Henderson     return addr;
111*1f51573fSRichard Henderson }
112*1f51573fSRichard Henderson 
113ad939afbSRichard Henderson static bool trans_ZERO(DisasContext *s, arg_ZERO *a)
114ad939afbSRichard Henderson {
115ad939afbSRichard Henderson     if (!dc_isar_feature(aa64_sme, s)) {
116ad939afbSRichard Henderson         return false;
117ad939afbSRichard Henderson     }
118ad939afbSRichard Henderson     if (sme_za_enabled_check(s)) {
119ad939afbSRichard Henderson         gen_helper_sme_zero(cpu_env, tcg_constant_i32(a->imm),
120ad939afbSRichard Henderson                             tcg_constant_i32(streaming_vec_reg_size(s)));
121ad939afbSRichard Henderson     }
122ad939afbSRichard Henderson     return true;
123ad939afbSRichard Henderson }
124e9ad3ef1SRichard Henderson 
125e9ad3ef1SRichard Henderson static bool trans_MOVA(DisasContext *s, arg_MOVA *a)
126e9ad3ef1SRichard Henderson {
127e9ad3ef1SRichard Henderson     static gen_helper_gvec_4 * const h_fns[5] = {
128e9ad3ef1SRichard Henderson         gen_helper_sve_sel_zpzz_b, gen_helper_sve_sel_zpzz_h,
129e9ad3ef1SRichard Henderson         gen_helper_sve_sel_zpzz_s, gen_helper_sve_sel_zpzz_d,
130e9ad3ef1SRichard Henderson         gen_helper_sve_sel_zpzz_q
131e9ad3ef1SRichard Henderson     };
132e9ad3ef1SRichard Henderson     static gen_helper_gvec_3 * const cz_fns[5] = {
133e9ad3ef1SRichard Henderson         gen_helper_sme_mova_cz_b, gen_helper_sme_mova_cz_h,
134e9ad3ef1SRichard Henderson         gen_helper_sme_mova_cz_s, gen_helper_sme_mova_cz_d,
135e9ad3ef1SRichard Henderson         gen_helper_sme_mova_cz_q,
136e9ad3ef1SRichard Henderson     };
137e9ad3ef1SRichard Henderson     static gen_helper_gvec_3 * const zc_fns[5] = {
138e9ad3ef1SRichard Henderson         gen_helper_sme_mova_zc_b, gen_helper_sme_mova_zc_h,
139e9ad3ef1SRichard Henderson         gen_helper_sme_mova_zc_s, gen_helper_sme_mova_zc_d,
140e9ad3ef1SRichard Henderson         gen_helper_sme_mova_zc_q,
141e9ad3ef1SRichard Henderson     };
142e9ad3ef1SRichard Henderson 
143e9ad3ef1SRichard Henderson     TCGv_ptr t_za, t_zr, t_pg;
144e9ad3ef1SRichard Henderson     TCGv_i32 t_desc;
145e9ad3ef1SRichard Henderson     int svl;
146e9ad3ef1SRichard Henderson 
147e9ad3ef1SRichard Henderson     if (!dc_isar_feature(aa64_sme, s)) {
148e9ad3ef1SRichard Henderson         return false;
149e9ad3ef1SRichard Henderson     }
150e9ad3ef1SRichard Henderson     if (!sme_smza_enabled_check(s)) {
151e9ad3ef1SRichard Henderson         return true;
152e9ad3ef1SRichard Henderson     }
153e9ad3ef1SRichard Henderson 
154e9ad3ef1SRichard Henderson     t_za = get_tile_rowcol(s, a->esz, a->rs, a->za_imm, a->v);
155e9ad3ef1SRichard Henderson     t_zr = vec_full_reg_ptr(s, a->zr);
156e9ad3ef1SRichard Henderson     t_pg = pred_full_reg_ptr(s, a->pg);
157e9ad3ef1SRichard Henderson 
158e9ad3ef1SRichard Henderson     svl = streaming_vec_reg_size(s);
159e9ad3ef1SRichard Henderson     t_desc = tcg_constant_i32(simd_desc(svl, svl, 0));
160e9ad3ef1SRichard Henderson 
161e9ad3ef1SRichard Henderson     if (a->v) {
162e9ad3ef1SRichard Henderson         /* Vertical slice -- use sme mova helpers. */
163e9ad3ef1SRichard Henderson         if (a->to_vec) {
164e9ad3ef1SRichard Henderson             zc_fns[a->esz](t_zr, t_za, t_pg, t_desc);
165e9ad3ef1SRichard Henderson         } else {
166e9ad3ef1SRichard Henderson             cz_fns[a->esz](t_za, t_zr, t_pg, t_desc);
167e9ad3ef1SRichard Henderson         }
168e9ad3ef1SRichard Henderson     } else {
169e9ad3ef1SRichard Henderson         /* Horizontal slice -- reuse sve sel helpers. */
170e9ad3ef1SRichard Henderson         if (a->to_vec) {
171e9ad3ef1SRichard Henderson             h_fns[a->esz](t_zr, t_za, t_zr, t_pg, t_desc);
172e9ad3ef1SRichard Henderson         } else {
173e9ad3ef1SRichard Henderson             h_fns[a->esz](t_za, t_zr, t_za, t_pg, t_desc);
174e9ad3ef1SRichard Henderson         }
175e9ad3ef1SRichard Henderson     }
176e9ad3ef1SRichard Henderson     return true;
177e9ad3ef1SRichard Henderson }
1787390e0e9SRichard Henderson 
1797390e0e9SRichard Henderson static bool trans_LDST1(DisasContext *s, arg_LDST1 *a)
1807390e0e9SRichard Henderson {
1817390e0e9SRichard Henderson     typedef void GenLdSt1(TCGv_env, TCGv_ptr, TCGv_ptr, TCGv, TCGv_i32);
1827390e0e9SRichard Henderson 
1837390e0e9SRichard Henderson     /*
1847390e0e9SRichard Henderson      * Indexed by [esz][be][v][mte][st], which is (except for load/store)
1857390e0e9SRichard Henderson      * also the order in which the elements appear in the function names,
1867390e0e9SRichard Henderson      * and so how we must concatenate the pieces.
1877390e0e9SRichard Henderson      */
1887390e0e9SRichard Henderson 
1897390e0e9SRichard Henderson #define FN_LS(F)     { gen_helper_sme_ld1##F, gen_helper_sme_st1##F }
1907390e0e9SRichard Henderson #define FN_MTE(F)    { FN_LS(F), FN_LS(F##_mte) }
1917390e0e9SRichard Henderson #define FN_HV(F)     { FN_MTE(F##_h), FN_MTE(F##_v) }
1927390e0e9SRichard Henderson #define FN_END(L, B) { FN_HV(L), FN_HV(B) }
1937390e0e9SRichard Henderson 
1947390e0e9SRichard Henderson     static GenLdSt1 * const fns[5][2][2][2][2] = {
1957390e0e9SRichard Henderson         FN_END(b, b),
1967390e0e9SRichard Henderson         FN_END(h_le, h_be),
1977390e0e9SRichard Henderson         FN_END(s_le, s_be),
1987390e0e9SRichard Henderson         FN_END(d_le, d_be),
1997390e0e9SRichard Henderson         FN_END(q_le, q_be),
2007390e0e9SRichard Henderson     };
2017390e0e9SRichard Henderson 
2027390e0e9SRichard Henderson #undef FN_LS
2037390e0e9SRichard Henderson #undef FN_MTE
2047390e0e9SRichard Henderson #undef FN_HV
2057390e0e9SRichard Henderson #undef FN_END
2067390e0e9SRichard Henderson 
2077390e0e9SRichard Henderson     TCGv_ptr t_za, t_pg;
2087390e0e9SRichard Henderson     TCGv_i64 addr;
2097390e0e9SRichard Henderson     int svl, desc = 0;
2107390e0e9SRichard Henderson     bool be = s->be_data == MO_BE;
2117390e0e9SRichard Henderson     bool mte = s->mte_active[0];
2127390e0e9SRichard Henderson 
2137390e0e9SRichard Henderson     if (!dc_isar_feature(aa64_sme, s)) {
2147390e0e9SRichard Henderson         return false;
2157390e0e9SRichard Henderson     }
2167390e0e9SRichard Henderson     if (!sme_smza_enabled_check(s)) {
2177390e0e9SRichard Henderson         return true;
2187390e0e9SRichard Henderson     }
2197390e0e9SRichard Henderson 
2207390e0e9SRichard Henderson     t_za = get_tile_rowcol(s, a->esz, a->rs, a->za_imm, a->v);
2217390e0e9SRichard Henderson     t_pg = pred_full_reg_ptr(s, a->pg);
2227390e0e9SRichard Henderson     addr = tcg_temp_new_i64();
2237390e0e9SRichard Henderson 
2247390e0e9SRichard Henderson     tcg_gen_shli_i64(addr, cpu_reg(s, a->rm), a->esz);
2257390e0e9SRichard Henderson     tcg_gen_add_i64(addr, addr, cpu_reg_sp(s, a->rn));
2267390e0e9SRichard Henderson 
2277390e0e9SRichard Henderson     if (mte) {
2287390e0e9SRichard Henderson         desc = FIELD_DP32(desc, MTEDESC, MIDX, get_mem_index(s));
2297390e0e9SRichard Henderson         desc = FIELD_DP32(desc, MTEDESC, TBI, s->tbid);
2307390e0e9SRichard Henderson         desc = FIELD_DP32(desc, MTEDESC, TCMA, s->tcma);
2317390e0e9SRichard Henderson         desc = FIELD_DP32(desc, MTEDESC, WRITE, a->st);
2327390e0e9SRichard Henderson         desc = FIELD_DP32(desc, MTEDESC, SIZEM1, (1 << a->esz) - 1);
2337390e0e9SRichard Henderson         desc <<= SVE_MTEDESC_SHIFT;
2347390e0e9SRichard Henderson     } else {
2357390e0e9SRichard Henderson         addr = clean_data_tbi(s, addr);
2367390e0e9SRichard Henderson     }
2377390e0e9SRichard Henderson     svl = streaming_vec_reg_size(s);
2387390e0e9SRichard Henderson     desc = simd_desc(svl, svl, desc);
2397390e0e9SRichard Henderson 
2407390e0e9SRichard Henderson     fns[a->esz][be][a->v][mte][a->st](cpu_env, t_za, t_pg, addr,
2417390e0e9SRichard Henderson                                       tcg_constant_i32(desc));
2427390e0e9SRichard Henderson     return true;
2437390e0e9SRichard Henderson }
2444c46a5f1SRichard Henderson 
2454c46a5f1SRichard Henderson typedef void GenLdStR(DisasContext *, TCGv_ptr, int, int, int, int);
2464c46a5f1SRichard Henderson 
2474c46a5f1SRichard Henderson static bool do_ldst_r(DisasContext *s, arg_ldstr *a, GenLdStR *fn)
2484c46a5f1SRichard Henderson {
2494c46a5f1SRichard Henderson     int svl = streaming_vec_reg_size(s);
2504c46a5f1SRichard Henderson     int imm = a->imm;
2514c46a5f1SRichard Henderson     TCGv_ptr base;
2524c46a5f1SRichard Henderson 
2534c46a5f1SRichard Henderson     if (!sme_za_enabled_check(s)) {
2544c46a5f1SRichard Henderson         return true;
2554c46a5f1SRichard Henderson     }
2564c46a5f1SRichard Henderson 
2574c46a5f1SRichard Henderson     /* ZA[n] equates to ZA0H.B[n]. */
2584c46a5f1SRichard Henderson     base = get_tile_rowcol(s, MO_8, a->rv, imm, false);
2594c46a5f1SRichard Henderson 
2604c46a5f1SRichard Henderson     fn(s, base, 0, svl, a->rn, imm * svl);
2614c46a5f1SRichard Henderson     return true;
2624c46a5f1SRichard Henderson }
2634c46a5f1SRichard Henderson 
2644c46a5f1SRichard Henderson TRANS_FEAT(LDR, aa64_sme, do_ldst_r, a, gen_sve_ldr)
2654c46a5f1SRichard Henderson TRANS_FEAT(STR, aa64_sme, do_ldst_r, a, gen_sve_str)
266bc4420d9SRichard Henderson 
267bc4420d9SRichard Henderson static bool do_adda(DisasContext *s, arg_adda *a, MemOp esz,
268bc4420d9SRichard Henderson                     gen_helper_gvec_4 *fn)
269bc4420d9SRichard Henderson {
270bc4420d9SRichard Henderson     int svl = streaming_vec_reg_size(s);
271bc4420d9SRichard Henderson     uint32_t desc = simd_desc(svl, svl, 0);
272bc4420d9SRichard Henderson     TCGv_ptr za, zn, pn, pm;
273bc4420d9SRichard Henderson 
274bc4420d9SRichard Henderson     if (!sme_smza_enabled_check(s)) {
275bc4420d9SRichard Henderson         return true;
276bc4420d9SRichard Henderson     }
277bc4420d9SRichard Henderson 
278*1f51573fSRichard Henderson     za = get_tile(s, esz, a->zad);
279bc4420d9SRichard Henderson     zn = vec_full_reg_ptr(s, a->zn);
280bc4420d9SRichard Henderson     pn = pred_full_reg_ptr(s, a->pn);
281bc4420d9SRichard Henderson     pm = pred_full_reg_ptr(s, a->pm);
282bc4420d9SRichard Henderson 
283bc4420d9SRichard Henderson     fn(za, zn, pn, pm, tcg_constant_i32(desc));
284bc4420d9SRichard Henderson     return true;
285bc4420d9SRichard Henderson }
286bc4420d9SRichard Henderson 
287bc4420d9SRichard Henderson TRANS_FEAT(ADDHA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addha_s)
288bc4420d9SRichard Henderson TRANS_FEAT(ADDVA_s, aa64_sme, do_adda, a, MO_32, gen_helper_sme_addva_s)
289bc4420d9SRichard Henderson TRANS_FEAT(ADDHA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addha_d)
290bc4420d9SRichard Henderson TRANS_FEAT(ADDVA_d, aa64_sme_i16i64, do_adda, a, MO_64, gen_helper_sme_addva_d)
291558e956cSRichard Henderson 
292920f640dSRichard Henderson static bool do_outprod(DisasContext *s, arg_op *a, MemOp esz,
293920f640dSRichard Henderson                        gen_helper_gvec_5 *fn)
294920f640dSRichard Henderson {
295920f640dSRichard Henderson     int svl = streaming_vec_reg_size(s);
296920f640dSRichard Henderson     uint32_t desc = simd_desc(svl, svl, a->sub);
297920f640dSRichard Henderson     TCGv_ptr za, zn, zm, pn, pm;
298920f640dSRichard Henderson 
299920f640dSRichard Henderson     if (!sme_smza_enabled_check(s)) {
300920f640dSRichard Henderson         return true;
301920f640dSRichard Henderson     }
302920f640dSRichard Henderson 
303*1f51573fSRichard Henderson     za = get_tile(s, esz, a->zad);
304920f640dSRichard Henderson     zn = vec_full_reg_ptr(s, a->zn);
305920f640dSRichard Henderson     zm = vec_full_reg_ptr(s, a->zm);
306920f640dSRichard Henderson     pn = pred_full_reg_ptr(s, a->pn);
307920f640dSRichard Henderson     pm = pred_full_reg_ptr(s, a->pm);
308920f640dSRichard Henderson 
309920f640dSRichard Henderson     fn(za, zn, zm, pn, pm, tcg_constant_i32(desc));
310920f640dSRichard Henderson     return true;
311920f640dSRichard Henderson }
312920f640dSRichard Henderson 
313558e956cSRichard Henderson static bool do_outprod_fpst(DisasContext *s, arg_op *a, MemOp esz,
314558e956cSRichard Henderson                             gen_helper_gvec_5_ptr *fn)
315558e956cSRichard Henderson {
316558e956cSRichard Henderson     int svl = streaming_vec_reg_size(s);
317558e956cSRichard Henderson     uint32_t desc = simd_desc(svl, svl, a->sub);
318558e956cSRichard Henderson     TCGv_ptr za, zn, zm, pn, pm, fpst;
319558e956cSRichard Henderson 
320558e956cSRichard Henderson     if (!sme_smza_enabled_check(s)) {
321558e956cSRichard Henderson         return true;
322558e956cSRichard Henderson     }
323558e956cSRichard Henderson 
324*1f51573fSRichard Henderson     za = get_tile(s, esz, a->zad);
325558e956cSRichard Henderson     zn = vec_full_reg_ptr(s, a->zn);
326558e956cSRichard Henderson     zm = vec_full_reg_ptr(s, a->zm);
327558e956cSRichard Henderson     pn = pred_full_reg_ptr(s, a->pn);
328558e956cSRichard Henderson     pm = pred_full_reg_ptr(s, a->pm);
329558e956cSRichard Henderson     fpst = fpstatus_ptr(FPST_FPCR);
330558e956cSRichard Henderson 
331558e956cSRichard Henderson     fn(za, zn, zm, pn, pm, fpst, tcg_constant_i32(desc));
332558e956cSRichard Henderson     return true;
333558e956cSRichard Henderson }
334558e956cSRichard Henderson 
3353916841aSRichard Henderson TRANS_FEAT(FMOPA_h, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_h)
336558e956cSRichard Henderson TRANS_FEAT(FMOPA_s, aa64_sme, do_outprod_fpst, a, MO_32, gen_helper_sme_fmopa_s)
337558e956cSRichard Henderson TRANS_FEAT(FMOPA_d, aa64_sme_f64f64, do_outprod_fpst, a, MO_64, gen_helper_sme_fmopa_d)
338920f640dSRichard Henderson 
339920f640dSRichard Henderson /* TODO: FEAT_EBF16 */
340920f640dSRichard Henderson TRANS_FEAT(BFMOPA, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_bfmopa)
34123a5e385SRichard Henderson 
34223a5e385SRichard Henderson TRANS_FEAT(SMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_smopa_s)
34323a5e385SRichard Henderson TRANS_FEAT(UMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_umopa_s)
34423a5e385SRichard Henderson TRANS_FEAT(SUMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_sumopa_s)
34523a5e385SRichard Henderson TRANS_FEAT(USMOPA_s, aa64_sme, do_outprod, a, MO_32, gen_helper_sme_usmopa_s)
34623a5e385SRichard Henderson 
34723a5e385SRichard Henderson TRANS_FEAT(SMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_smopa_d)
34823a5e385SRichard Henderson TRANS_FEAT(UMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_umopa_d)
34923a5e385SRichard Henderson TRANS_FEAT(SUMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_sumopa_d)
35023a5e385SRichard Henderson TRANS_FEAT(USMOPA_d, aa64_sme_i16i64, do_outprod, a, MO_64, gen_helper_sme_usmopa_d)
351