1c896fe29Sbellard /* 2c896fe29Sbellard * Tiny Code Generator for QEMU 3c896fe29Sbellard * 4c896fe29Sbellard * Copyright (c) 2008 Fabrice Bellard 5c896fe29Sbellard * 6c896fe29Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7c896fe29Sbellard * of this software and associated documentation files (the "Software"), to deal 8c896fe29Sbellard * in the Software without restriction, including without limitation the rights 9c896fe29Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10c896fe29Sbellard * copies of the Software, and to permit persons to whom the Software is 11c896fe29Sbellard * furnished to do so, subject to the following conditions: 12c896fe29Sbellard * 13c896fe29Sbellard * The above copyright notice and this permission notice shall be included in 14c896fe29Sbellard * all copies or substantial portions of the Software. 15c896fe29Sbellard * 16c896fe29Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17c896fe29Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18c896fe29Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19c896fe29Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20c896fe29Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21c896fe29Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22c896fe29Sbellard * THE SOFTWARE. 23c896fe29Sbellard */ 24c896fe29Sbellard 25c896fe29Sbellard /* define it to use liveness analysis (better code) */ 268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS 27c896fe29Sbellard 28757e725bSPeter Maydell #include "qemu/osdep.h" 29cca82982Saurel32 30813da627SRichard Henderson /* Define to jump the ELF file used to communicate with GDB. */ 31813da627SRichard Henderson #undef DEBUG_JIT 32813da627SRichard Henderson 3372fd2efbSEmilio G. Cota #include "qemu/error-report.h" 34f348b6d1SVeronia Bahaa #include "qemu/cutils.h" 351de7afc9SPaolo Bonzini #include "qemu/host-utils.h" 36d4c51a0aSMarkus Armbruster #include "qemu/qemu-print.h" 371de7afc9SPaolo Bonzini #include "qemu/timer.h" 38084cfca1SRichard Henderson #include "qemu/cacheflush.h" 39c896fe29Sbellard 40c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU 41c896fe29Sbellard CPU definitions. Currently they are used for qemu_ld/st 42c896fe29Sbellard instructions */ 43c896fe29Sbellard #define NO_CPU_IO_DEFS 44c896fe29Sbellard 4563c91552SPaolo Bonzini #include "exec/exec-all.h" 46dcb32f1dSPhilippe Mathieu-Daudé #include "tcg/tcg-op.h" 47813da627SRichard Henderson 48edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX 49813da627SRichard Henderson # define ELF_CLASS ELFCLASS32 50edee2579SRichard Henderson #else 51edee2579SRichard Henderson # define ELF_CLASS ELFCLASS64 52813da627SRichard Henderson #endif 53813da627SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 54813da627SRichard Henderson # define ELF_DATA ELFDATA2MSB 55813da627SRichard Henderson #else 56813da627SRichard Henderson # define ELF_DATA ELFDATA2LSB 57813da627SRichard Henderson #endif 58813da627SRichard Henderson 59c896fe29Sbellard #include "elf.h" 60508127e2SPaolo Bonzini #include "exec/log.h" 615ff7258cSRichard Henderson #include "tcg-internal.h" 62c896fe29Sbellard 63139c1837SPaolo Bonzini /* Forward declarations for functions declared in tcg-target.c.inc and 64ce151109SPeter Maydell used here. */ 65e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s); 66e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s); 676ac17786SRichard Henderson static bool patch_reloc(tcg_insn_unit *code_ptr, int type, 682ba7fae2SRichard Henderson intptr_t value, intptr_t addend); 69c896fe29Sbellard 70497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts. */ 71497a22ebSRichard Henderson typedef struct { 72497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 73497a22ebSRichard Henderson uint32_t id; 74497a22ebSRichard Henderson uint8_t version; 75497a22ebSRichard Henderson char augmentation[1]; 76497a22ebSRichard Henderson uint8_t code_align; 77497a22ebSRichard Henderson uint8_t data_align; 78497a22ebSRichard Henderson uint8_t return_column; 79497a22ebSRichard Henderson } DebugFrameCIE; 80497a22ebSRichard Henderson 81497a22ebSRichard Henderson typedef struct QEMU_PACKED { 82497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 83497a22ebSRichard Henderson uint32_t cie_offset; 84edee2579SRichard Henderson uintptr_t func_start; 85edee2579SRichard Henderson uintptr_t func_len; 86497a22ebSRichard Henderson } DebugFrameFDEHeader; 87497a22ebSRichard Henderson 882c90784aSRichard Henderson typedef struct QEMU_PACKED { 892c90784aSRichard Henderson DebugFrameCIE cie; 902c90784aSRichard Henderson DebugFrameFDEHeader fde; 912c90784aSRichard Henderson } DebugFrameHeader; 922c90784aSRichard Henderson 93755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf, size_t size, 942c90784aSRichard Henderson const void *debug_frame, 952c90784aSRichard Henderson size_t debug_frame_size) 96813da627SRichard Henderson __attribute__((unused)); 97813da627SRichard Henderson 98139c1837SPaolo Bonzini /* Forward declarations for functions declared and used in tcg-target.c.inc. */ 992a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1, 100a05b5b9bSRichard Henderson intptr_t arg2); 10178113e83SRichard Henderson static bool tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg); 102c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type, 1032a534affSRichard Henderson TCGReg ret, tcg_target_long arg); 1045e8892dbSMiroslav Rezanina static void tcg_out_op(TCGContext *s, TCGOpcode opc, 1055e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1065e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]); 107d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec 108e7632cfaSRichard Henderson static bool tcg_out_dup_vec(TCGContext *s, TCGType type, unsigned vece, 109e7632cfaSRichard Henderson TCGReg dst, TCGReg src); 110d6ecb4a9SRichard Henderson static bool tcg_out_dupm_vec(TCGContext *s, TCGType type, unsigned vece, 111d6ecb4a9SRichard Henderson TCGReg dst, TCGReg base, intptr_t offset); 1124e186175SRichard Henderson static void tcg_out_dupi_vec(TCGContext *s, TCGType type, unsigned vece, 1134e186175SRichard Henderson TCGReg dst, int64_t arg); 1145e8892dbSMiroslav Rezanina static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, 1155e8892dbSMiroslav Rezanina unsigned vecl, unsigned vece, 1165e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1175e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]); 118d2fd745fSRichard Henderson #else 119e7632cfaSRichard Henderson static inline bool tcg_out_dup_vec(TCGContext *s, TCGType type, unsigned vece, 120e7632cfaSRichard Henderson TCGReg dst, TCGReg src) 121e7632cfaSRichard Henderson { 122e7632cfaSRichard Henderson g_assert_not_reached(); 123e7632cfaSRichard Henderson } 124d6ecb4a9SRichard Henderson static inline bool tcg_out_dupm_vec(TCGContext *s, TCGType type, unsigned vece, 125d6ecb4a9SRichard Henderson TCGReg dst, TCGReg base, intptr_t offset) 126d6ecb4a9SRichard Henderson { 127d6ecb4a9SRichard Henderson g_assert_not_reached(); 128d6ecb4a9SRichard Henderson } 1294e186175SRichard Henderson static inline void tcg_out_dupi_vec(TCGContext *s, TCGType type, unsigned vece, 1304e186175SRichard Henderson TCGReg dst, int64_t arg) 131e7632cfaSRichard Henderson { 132e7632cfaSRichard Henderson g_assert_not_reached(); 133e7632cfaSRichard Henderson } 1345e8892dbSMiroslav Rezanina static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, 1355e8892dbSMiroslav Rezanina unsigned vecl, unsigned vece, 1365e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1375e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]) 138d2fd745fSRichard Henderson { 139d2fd745fSRichard Henderson g_assert_not_reached(); 140d2fd745fSRichard Henderson } 141d2fd745fSRichard Henderson #endif 1422a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, 143a05b5b9bSRichard Henderson intptr_t arg2); 14459d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val, 14559d7c14eSRichard Henderson TCGReg base, intptr_t ofs); 1462be7d76bSRichard Henderson static void tcg_out_call(TCGContext *s, const tcg_insn_unit *target); 147a4fbbd77SRichard Henderson static bool tcg_target_const_match(int64_t val, TCGType type, int ct); 148659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 149aeee05f5SRichard Henderson static int tcg_out_ldst_finalize(TCGContext *s); 150659ef5cbSRichard Henderson #endif 151c896fe29Sbellard 15242eb6dfcSRichard Henderson TCGContext tcg_init_ctx; 15342eb6dfcSRichard Henderson __thread TCGContext *tcg_ctx; 15442eb6dfcSRichard Henderson 1555ff7258cSRichard Henderson TCGContext **tcg_ctxs; 1560e2d61cfSRichard Henderson unsigned int tcg_cur_ctxs; 1570e2d61cfSRichard Henderson unsigned int tcg_max_ctxs; 1581c2adb95SRichard Henderson TCGv_env cpu_env = 0; 159c8bc1168SRichard Henderson const void *tcg_code_gen_epilogue; 160db0c51a3SRichard Henderson uintptr_t tcg_splitwx_diff; 161df2cce29SEmilio G. Cota 162b91ccb31SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 163b91ccb31SRichard Henderson tcg_prologue_fn *tcg_qemu_tb_exec; 164b91ccb31SRichard Henderson #endif 165b91ccb31SRichard Henderson 166d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT]; 167b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 168c896fe29Sbellard 1691813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1704196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 171c896fe29Sbellard { 172c896fe29Sbellard *s->code_ptr++ = v; 173c896fe29Sbellard } 174c896fe29Sbellard 1754196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1764196dca6SPeter Maydell uint8_t v) 1775c53bb81SPeter Maydell { 1781813e175SRichard Henderson *p = v; 1795c53bb81SPeter Maydell } 1801813e175SRichard Henderson #endif 1815c53bb81SPeter Maydell 1821813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1834196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 184c896fe29Sbellard { 1851813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1861813e175SRichard Henderson *s->code_ptr++ = v; 1871813e175SRichard Henderson } else { 1881813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1894387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1901813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 1911813e175SRichard Henderson } 192c896fe29Sbellard } 193c896fe29Sbellard 1944196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 1954196dca6SPeter Maydell uint16_t v) 1965c53bb81SPeter Maydell { 1971813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1981813e175SRichard Henderson *p = v; 1991813e175SRichard Henderson } else { 2005c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2015c53bb81SPeter Maydell } 2021813e175SRichard Henderson } 2031813e175SRichard Henderson #endif 2045c53bb81SPeter Maydell 2051813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 2064196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 207c896fe29Sbellard { 2081813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2091813e175SRichard Henderson *s->code_ptr++ = v; 2101813e175SRichard Henderson } else { 2111813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2124387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2131813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 2141813e175SRichard Henderson } 215c896fe29Sbellard } 216c896fe29Sbellard 2174196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 2184196dca6SPeter Maydell uint32_t v) 2195c53bb81SPeter Maydell { 2201813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2211813e175SRichard Henderson *p = v; 2221813e175SRichard Henderson } else { 2235c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2245c53bb81SPeter Maydell } 2251813e175SRichard Henderson } 2261813e175SRichard Henderson #endif 2275c53bb81SPeter Maydell 2281813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 2294196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 230ac26eb69SRichard Henderson { 2311813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2321813e175SRichard Henderson *s->code_ptr++ = v; 2331813e175SRichard Henderson } else { 2341813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2354387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2361813e175SRichard Henderson s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE); 2371813e175SRichard Henderson } 238ac26eb69SRichard Henderson } 239ac26eb69SRichard Henderson 2404196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 2414196dca6SPeter Maydell uint64_t v) 2425c53bb81SPeter Maydell { 2431813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2441813e175SRichard Henderson *p = v; 2451813e175SRichard Henderson } else { 2465c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2475c53bb81SPeter Maydell } 2481813e175SRichard Henderson } 2491813e175SRichard Henderson #endif 2505c53bb81SPeter Maydell 251c896fe29Sbellard /* label relocation processing */ 252c896fe29Sbellard 2531813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 254bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 255c896fe29Sbellard { 2567ecd02a0SRichard Henderson TCGRelocation *r = tcg_malloc(sizeof(TCGRelocation)); 257c896fe29Sbellard 258c896fe29Sbellard r->type = type; 259c896fe29Sbellard r->ptr = code_ptr; 260c896fe29Sbellard r->addend = addend; 2617ecd02a0SRichard Henderson QSIMPLEQ_INSERT_TAIL(&l->relocs, r, next); 262c896fe29Sbellard } 263c896fe29Sbellard 26492ab8e7dSRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l) 265c896fe29Sbellard { 266eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 267c896fe29Sbellard l->has_value = 1; 26892ab8e7dSRichard Henderson l->u.value_ptr = tcg_splitwx_to_rx(s->code_ptr); 269c896fe29Sbellard } 270c896fe29Sbellard 27142a268c2SRichard Henderson TCGLabel *gen_new_label(void) 272c896fe29Sbellard { 273b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 27451e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 275c896fe29Sbellard 2767ecd02a0SRichard Henderson memset(l, 0, sizeof(TCGLabel)); 2777ecd02a0SRichard Henderson l->id = s->nb_labels++; 2787ecd02a0SRichard Henderson QSIMPLEQ_INIT(&l->relocs); 2797ecd02a0SRichard Henderson 280bef16ab4SRichard Henderson QSIMPLEQ_INSERT_TAIL(&s->labels, l, next); 28142a268c2SRichard Henderson 28242a268c2SRichard Henderson return l; 283c896fe29Sbellard } 284c896fe29Sbellard 2857ecd02a0SRichard Henderson static bool tcg_resolve_relocs(TCGContext *s) 2867ecd02a0SRichard Henderson { 2877ecd02a0SRichard Henderson TCGLabel *l; 2887ecd02a0SRichard Henderson 2897ecd02a0SRichard Henderson QSIMPLEQ_FOREACH(l, &s->labels, next) { 2907ecd02a0SRichard Henderson TCGRelocation *r; 2917ecd02a0SRichard Henderson uintptr_t value = l->u.value; 2927ecd02a0SRichard Henderson 2937ecd02a0SRichard Henderson QSIMPLEQ_FOREACH(r, &l->relocs, next) { 2947ecd02a0SRichard Henderson if (!patch_reloc(r->ptr, r->type, value, r->addend)) { 2957ecd02a0SRichard Henderson return false; 2967ecd02a0SRichard Henderson } 2977ecd02a0SRichard Henderson } 2987ecd02a0SRichard Henderson } 2997ecd02a0SRichard Henderson return true; 3007ecd02a0SRichard Henderson } 3017ecd02a0SRichard Henderson 3029f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which) 3039f754620SRichard Henderson { 304f14bed3fSRichard Henderson /* 305f14bed3fSRichard Henderson * We will check for overflow at the end of the opcode loop in 306f14bed3fSRichard Henderson * tcg_gen_code, where we bound tcg_current_code_size to UINT16_MAX. 307f14bed3fSRichard Henderson */ 308f14bed3fSRichard Henderson s->tb_jmp_reset_offset[which] = tcg_current_code_size(s); 3099f754620SRichard Henderson } 3109f754620SRichard Henderson 311db6b7d0cSRichard Henderson /* Signal overflow, starting over with fewer guest insns. */ 312db6b7d0cSRichard Henderson static void QEMU_NORETURN tcg_raise_tb_overflow(TCGContext *s) 313db6b7d0cSRichard Henderson { 314db6b7d0cSRichard Henderson siglongjmp(s->jmp_trans, -2); 315db6b7d0cSRichard Henderson } 316db6b7d0cSRichard Henderson 3174c22e840SRichard Henderson #define C_PFX1(P, A) P##A 3184c22e840SRichard Henderson #define C_PFX2(P, A, B) P##A##_##B 3194c22e840SRichard Henderson #define C_PFX3(P, A, B, C) P##A##_##B##_##C 3204c22e840SRichard Henderson #define C_PFX4(P, A, B, C, D) P##A##_##B##_##C##_##D 3214c22e840SRichard Henderson #define C_PFX5(P, A, B, C, D, E) P##A##_##B##_##C##_##D##_##E 3224c22e840SRichard Henderson #define C_PFX6(P, A, B, C, D, E, F) P##A##_##B##_##C##_##D##_##E##_##F 3234c22e840SRichard Henderson 3244c22e840SRichard Henderson /* Define an enumeration for the various combinations. */ 3254c22e840SRichard Henderson 3264c22e840SRichard Henderson #define C_O0_I1(I1) C_PFX1(c_o0_i1_, I1), 3274c22e840SRichard Henderson #define C_O0_I2(I1, I2) C_PFX2(c_o0_i2_, I1, I2), 3284c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) C_PFX3(c_o0_i3_, I1, I2, I3), 3294c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) C_PFX4(c_o0_i4_, I1, I2, I3, I4), 3304c22e840SRichard Henderson 3314c22e840SRichard Henderson #define C_O1_I1(O1, I1) C_PFX2(c_o1_i1_, O1, I1), 3324c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) C_PFX3(c_o1_i2_, O1, I1, I2), 3334c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) C_PFX4(c_o1_i3_, O1, I1, I2, I3), 3344c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) C_PFX5(c_o1_i4_, O1, I1, I2, I3, I4), 3354c22e840SRichard Henderson 3364c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) C_PFX3(c_n1_i2_, O1, I1, I2), 3374c22e840SRichard Henderson 3384c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) C_PFX3(c_o2_i1_, O1, O2, I1), 3394c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) C_PFX4(c_o2_i2_, O1, O2, I1, I2), 3404c22e840SRichard Henderson #define C_O2_I3(O1, O2, I1, I2, I3) C_PFX5(c_o2_i3_, O1, O2, I1, I2, I3), 3414c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) C_PFX6(c_o2_i4_, O1, O2, I1, I2, I3, I4), 3424c22e840SRichard Henderson 3434c22e840SRichard Henderson typedef enum { 3444c22e840SRichard Henderson #include "tcg-target-con-set.h" 3454c22e840SRichard Henderson } TCGConstraintSetIndex; 3464c22e840SRichard Henderson 3474c22e840SRichard Henderson static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode); 3484c22e840SRichard Henderson 3494c22e840SRichard Henderson #undef C_O0_I1 3504c22e840SRichard Henderson #undef C_O0_I2 3514c22e840SRichard Henderson #undef C_O0_I3 3524c22e840SRichard Henderson #undef C_O0_I4 3534c22e840SRichard Henderson #undef C_O1_I1 3544c22e840SRichard Henderson #undef C_O1_I2 3554c22e840SRichard Henderson #undef C_O1_I3 3564c22e840SRichard Henderson #undef C_O1_I4 3574c22e840SRichard Henderson #undef C_N1_I2 3584c22e840SRichard Henderson #undef C_O2_I1 3594c22e840SRichard Henderson #undef C_O2_I2 3604c22e840SRichard Henderson #undef C_O2_I3 3614c22e840SRichard Henderson #undef C_O2_I4 3624c22e840SRichard Henderson 3634c22e840SRichard Henderson /* Put all of the constraint sets into an array, indexed by the enum. */ 3644c22e840SRichard Henderson 3654c22e840SRichard Henderson #define C_O0_I1(I1) { .args_ct_str = { #I1 } }, 3664c22e840SRichard Henderson #define C_O0_I2(I1, I2) { .args_ct_str = { #I1, #I2 } }, 3674c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) { .args_ct_str = { #I1, #I2, #I3 } }, 3684c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) { .args_ct_str = { #I1, #I2, #I3, #I4 } }, 3694c22e840SRichard Henderson 3704c22e840SRichard Henderson #define C_O1_I1(O1, I1) { .args_ct_str = { #O1, #I1 } }, 3714c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) { .args_ct_str = { #O1, #I1, #I2 } }, 3724c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) { .args_ct_str = { #O1, #I1, #I2, #I3 } }, 3734c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) { .args_ct_str = { #O1, #I1, #I2, #I3, #I4 } }, 3744c22e840SRichard Henderson 3754c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) { .args_ct_str = { "&" #O1, #I1, #I2 } }, 3764c22e840SRichard Henderson 3774c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) { .args_ct_str = { #O1, #O2, #I1 } }, 3784c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) { .args_ct_str = { #O1, #O2, #I1, #I2 } }, 3794c22e840SRichard Henderson #define C_O2_I3(O1, O2, I1, I2, I3) { .args_ct_str = { #O1, #O2, #I1, #I2, #I3 } }, 3804c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) { .args_ct_str = { #O1, #O2, #I1, #I2, #I3, #I4 } }, 3814c22e840SRichard Henderson 3824c22e840SRichard Henderson static const TCGTargetOpDef constraint_sets[] = { 3834c22e840SRichard Henderson #include "tcg-target-con-set.h" 3844c22e840SRichard Henderson }; 3854c22e840SRichard Henderson 3864c22e840SRichard Henderson 3874c22e840SRichard Henderson #undef C_O0_I1 3884c22e840SRichard Henderson #undef C_O0_I2 3894c22e840SRichard Henderson #undef C_O0_I3 3904c22e840SRichard Henderson #undef C_O0_I4 3914c22e840SRichard Henderson #undef C_O1_I1 3924c22e840SRichard Henderson #undef C_O1_I2 3934c22e840SRichard Henderson #undef C_O1_I3 3944c22e840SRichard Henderson #undef C_O1_I4 3954c22e840SRichard Henderson #undef C_N1_I2 3964c22e840SRichard Henderson #undef C_O2_I1 3974c22e840SRichard Henderson #undef C_O2_I2 3984c22e840SRichard Henderson #undef C_O2_I3 3994c22e840SRichard Henderson #undef C_O2_I4 4004c22e840SRichard Henderson 4014c22e840SRichard Henderson /* Expand the enumerator to be returned from tcg_target_op_def(). */ 4024c22e840SRichard Henderson 4034c22e840SRichard Henderson #define C_O0_I1(I1) C_PFX1(c_o0_i1_, I1) 4044c22e840SRichard Henderson #define C_O0_I2(I1, I2) C_PFX2(c_o0_i2_, I1, I2) 4054c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) C_PFX3(c_o0_i3_, I1, I2, I3) 4064c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) C_PFX4(c_o0_i4_, I1, I2, I3, I4) 4074c22e840SRichard Henderson 4084c22e840SRichard Henderson #define C_O1_I1(O1, I1) C_PFX2(c_o1_i1_, O1, I1) 4094c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) C_PFX3(c_o1_i2_, O1, I1, I2) 4104c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) C_PFX4(c_o1_i3_, O1, I1, I2, I3) 4114c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) C_PFX5(c_o1_i4_, O1, I1, I2, I3, I4) 4124c22e840SRichard Henderson 4134c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) C_PFX3(c_n1_i2_, O1, I1, I2) 4144c22e840SRichard Henderson 4154c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) C_PFX3(c_o2_i1_, O1, O2, I1) 4164c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) C_PFX4(c_o2_i2_, O1, O2, I1, I2) 4174c22e840SRichard Henderson #define C_O2_I3(O1, O2, I1, I2, I3) C_PFX5(c_o2_i3_, O1, O2, I1, I2, I3) 4184c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) C_PFX6(c_o2_i4_, O1, O2, I1, I2, I3, I4) 4194c22e840SRichard Henderson 420139c1837SPaolo Bonzini #include "tcg-target.c.inc" 421c896fe29Sbellard 42238b47b19SEmilio G. Cota static void alloc_tcg_plugin_context(TCGContext *s) 42338b47b19SEmilio G. Cota { 42438b47b19SEmilio G. Cota #ifdef CONFIG_PLUGIN 42538b47b19SEmilio G. Cota s->plugin_tb = g_new0(struct qemu_plugin_tb, 1); 42638b47b19SEmilio G. Cota s->plugin_tb->insns = 42738b47b19SEmilio G. Cota g_ptr_array_new_with_free_func(qemu_plugin_insn_cleanup_fn); 42838b47b19SEmilio G. Cota #endif 42938b47b19SEmilio G. Cota } 43038b47b19SEmilio G. Cota 431e8feb96fSEmilio G. Cota /* 4323468b59eSEmilio G. Cota * All TCG threads except the parent (i.e. the one that called tcg_context_init 4333468b59eSEmilio G. Cota * and registered the target's TCG globals) must register with this function 4343468b59eSEmilio G. Cota * before initiating translation. 4353468b59eSEmilio G. Cota * 4363468b59eSEmilio G. Cota * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation 4373468b59eSEmilio G. Cota * of tcg_region_init() for the reasoning behind this. 4383468b59eSEmilio G. Cota * 4393468b59eSEmilio G. Cota * In softmmu each caller registers its context in tcg_ctxs[]. Note that in 4403468b59eSEmilio G. Cota * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context 4413468b59eSEmilio G. Cota * is not used anymore for translation once this function is called. 4423468b59eSEmilio G. Cota * 4433468b59eSEmilio G. Cota * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates 4443468b59eSEmilio G. Cota * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode. 4453468b59eSEmilio G. Cota */ 4463468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 4473468b59eSEmilio G. Cota void tcg_register_thread(void) 4483468b59eSEmilio G. Cota { 4493468b59eSEmilio G. Cota tcg_ctx = &tcg_init_ctx; 4503468b59eSEmilio G. Cota } 4513468b59eSEmilio G. Cota #else 4523468b59eSEmilio G. Cota void tcg_register_thread(void) 4533468b59eSEmilio G. Cota { 4543468b59eSEmilio G. Cota TCGContext *s = g_malloc(sizeof(*s)); 4553468b59eSEmilio G. Cota unsigned int i, n; 4563468b59eSEmilio G. Cota 4573468b59eSEmilio G. Cota *s = tcg_init_ctx; 4583468b59eSEmilio G. Cota 4593468b59eSEmilio G. Cota /* Relink mem_base. */ 4603468b59eSEmilio G. Cota for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) { 4613468b59eSEmilio G. Cota if (tcg_init_ctx.temps[i].mem_base) { 4623468b59eSEmilio G. Cota ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps; 4633468b59eSEmilio G. Cota tcg_debug_assert(b >= 0 && b < n); 4643468b59eSEmilio G. Cota s->temps[i].mem_base = &s->temps[b]; 4653468b59eSEmilio G. Cota } 4663468b59eSEmilio G. Cota } 4673468b59eSEmilio G. Cota 4683468b59eSEmilio G. Cota /* Claim an entry in tcg_ctxs */ 4690e2d61cfSRichard Henderson n = qatomic_fetch_inc(&tcg_cur_ctxs); 4700e2d61cfSRichard Henderson g_assert(n < tcg_max_ctxs); 471d73415a3SStefan Hajnoczi qatomic_set(&tcg_ctxs[n], s); 4723468b59eSEmilio G. Cota 47338b47b19SEmilio G. Cota if (n > 0) { 47438b47b19SEmilio G. Cota alloc_tcg_plugin_context(s); 475bf042e8eSRichard Henderson tcg_region_initial_alloc(s); 47638b47b19SEmilio G. Cota } 47738b47b19SEmilio G. Cota 4783468b59eSEmilio G. Cota tcg_ctx = s; 4793468b59eSEmilio G. Cota } 4803468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */ 4813468b59eSEmilio G. Cota 482c896fe29Sbellard /* pool based memory allocation */ 483c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 484c896fe29Sbellard { 485c896fe29Sbellard TCGPool *p; 486c896fe29Sbellard int pool_size; 487c896fe29Sbellard 488c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 489c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 4907267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 491c896fe29Sbellard p->size = size; 4924055299eSKirill Batuzov p->next = s->pool_first_large; 4934055299eSKirill Batuzov s->pool_first_large = p; 4944055299eSKirill Batuzov return p->data; 495c896fe29Sbellard } else { 496c896fe29Sbellard p = s->pool_current; 497c896fe29Sbellard if (!p) { 498c896fe29Sbellard p = s->pool_first; 499c896fe29Sbellard if (!p) 500c896fe29Sbellard goto new_pool; 501c896fe29Sbellard } else { 502c896fe29Sbellard if (!p->next) { 503c896fe29Sbellard new_pool: 504c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 5057267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 506c896fe29Sbellard p->size = pool_size; 507c896fe29Sbellard p->next = NULL; 508c896fe29Sbellard if (s->pool_current) 509c896fe29Sbellard s->pool_current->next = p; 510c896fe29Sbellard else 511c896fe29Sbellard s->pool_first = p; 512c896fe29Sbellard } else { 513c896fe29Sbellard p = p->next; 514c896fe29Sbellard } 515c896fe29Sbellard } 516c896fe29Sbellard } 517c896fe29Sbellard s->pool_current = p; 518c896fe29Sbellard s->pool_cur = p->data + size; 519c896fe29Sbellard s->pool_end = p->data + p->size; 520c896fe29Sbellard return p->data; 521c896fe29Sbellard } 522c896fe29Sbellard 523c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 524c896fe29Sbellard { 5254055299eSKirill Batuzov TCGPool *p, *t; 5264055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 5274055299eSKirill Batuzov t = p->next; 5284055299eSKirill Batuzov g_free(p); 5294055299eSKirill Batuzov } 5304055299eSKirill Batuzov s->pool_first_large = NULL; 531c896fe29Sbellard s->pool_cur = s->pool_end = NULL; 532c896fe29Sbellard s->pool_current = NULL; 533c896fe29Sbellard } 534c896fe29Sbellard 5352ef6175aSRichard Henderson #include "exec/helper-proto.h" 5362ef6175aSRichard Henderson 537100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 5382ef6175aSRichard Henderson #include "exec/helper-tcg.h" 539100b5e01SRichard Henderson }; 540619205fdSEmilio G. Cota static GHashTable *helper_table; 541100b5e01SRichard Henderson 54291478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 543f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 5441c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 5451c2adb95SRichard Henderson TCGReg reg, const char *name); 54691478cefSRichard Henderson 54743b972b7SRichard Henderson static void tcg_context_init(unsigned max_cpus) 548c896fe29Sbellard { 549a76aabd3SRichard Henderson TCGContext *s = &tcg_init_ctx; 550100b5e01SRichard Henderson int op, total_args, n, i; 551c896fe29Sbellard TCGOpDef *def; 552c896fe29Sbellard TCGArgConstraint *args_ct; 5531c2adb95SRichard Henderson TCGTemp *ts; 554c896fe29Sbellard 555c896fe29Sbellard memset(s, 0, sizeof(*s)); 556c896fe29Sbellard s->nb_globals = 0; 557c896fe29Sbellard 558c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 559c896fe29Sbellard space */ 560c896fe29Sbellard total_args = 0; 561c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 562c896fe29Sbellard def = &tcg_op_defs[op]; 563c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 564c896fe29Sbellard total_args += n; 565c896fe29Sbellard } 566c896fe29Sbellard 567bc2b17e6SRichard Henderson args_ct = g_new0(TCGArgConstraint, total_args); 568c896fe29Sbellard 569c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 570c896fe29Sbellard def = &tcg_op_defs[op]; 571c896fe29Sbellard def->args_ct = args_ct; 572c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 573c896fe29Sbellard args_ct += n; 574c896fe29Sbellard } 575c896fe29Sbellard 5765cd8f621SRichard Henderson /* Register helpers. */ 57784fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 578619205fdSEmilio G. Cota helper_table = g_hash_table_new(NULL, NULL); 57984fd9dd3SRichard Henderson 580100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 58184fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 58272866e82SRichard Henderson (gpointer)&all_helpers[i]); 583100b5e01SRichard Henderson } 5845cd8f621SRichard Henderson 585c896fe29Sbellard tcg_target_init(s); 586f69d277eSRichard Henderson process_op_defs(s); 58791478cefSRichard Henderson 58891478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 58991478cefSRichard Henderson the start of tcg_target_reg_alloc_order. */ 59091478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 59191478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 59291478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 59391478cefSRichard Henderson break; 59491478cefSRichard Henderson } 59591478cefSRichard Henderson } 59691478cefSRichard Henderson for (i = 0; i < n; ++i) { 59791478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 59891478cefSRichard Henderson } 59991478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 60091478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 60191478cefSRichard Henderson } 602b1311c4aSEmilio G. Cota 60338b47b19SEmilio G. Cota alloc_tcg_plugin_context(s); 60438b47b19SEmilio G. Cota 605b1311c4aSEmilio G. Cota tcg_ctx = s; 6063468b59eSEmilio G. Cota /* 6073468b59eSEmilio G. Cota * In user-mode we simply share the init context among threads, since we 6083468b59eSEmilio G. Cota * use a single region. See the documentation tcg_region_init() for the 6093468b59eSEmilio G. Cota * reasoning behind this. 6103468b59eSEmilio G. Cota * In softmmu we will have at most max_cpus TCG threads. 6113468b59eSEmilio G. Cota */ 6123468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 613df2cce29SEmilio G. Cota tcg_ctxs = &tcg_ctx; 6140e2d61cfSRichard Henderson tcg_cur_ctxs = 1; 6150e2d61cfSRichard Henderson tcg_max_ctxs = 1; 6163468b59eSEmilio G. Cota #else 6170e2d61cfSRichard Henderson tcg_max_ctxs = max_cpus; 6180e2d61cfSRichard Henderson tcg_ctxs = g_new0(TCGContext *, max_cpus); 6193468b59eSEmilio G. Cota #endif 6201c2adb95SRichard Henderson 6211c2adb95SRichard Henderson tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0)); 6221c2adb95SRichard Henderson ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env"); 6231c2adb95SRichard Henderson cpu_env = temp_tcgv_ptr(ts); 6249002ec79SRichard Henderson } 625b03cce8eSbellard 62643b972b7SRichard Henderson void tcg_init(size_t tb_size, int splitwx, unsigned max_cpus) 627a76aabd3SRichard Henderson { 62843b972b7SRichard Henderson tcg_context_init(max_cpus); 62943b972b7SRichard Henderson tcg_region_init(tb_size, splitwx, max_cpus); 630a76aabd3SRichard Henderson } 631a76aabd3SRichard Henderson 6326e3b2bfdSEmilio G. Cota /* 6336e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 6346e3b2bfdSEmilio G. Cota * sure that TBs and code are on different cache lines. 6356e3b2bfdSEmilio G. Cota */ 6366e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 6376e3b2bfdSEmilio G. Cota { 6386e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 6396e3b2bfdSEmilio G. Cota TranslationBlock *tb; 6406e3b2bfdSEmilio G. Cota void *next; 6416e3b2bfdSEmilio G. Cota 642e8feb96fSEmilio G. Cota retry: 6436e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 6446e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 6456e3b2bfdSEmilio G. Cota 6466e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 647e8feb96fSEmilio G. Cota if (tcg_region_alloc(s)) { 6486e3b2bfdSEmilio G. Cota return NULL; 6496e3b2bfdSEmilio G. Cota } 650e8feb96fSEmilio G. Cota goto retry; 651e8feb96fSEmilio G. Cota } 652d73415a3SStefan Hajnoczi qatomic_set(&s->code_gen_ptr, next); 65357a26946SRichard Henderson s->data_gen_ptr = NULL; 6546e3b2bfdSEmilio G. Cota return tb; 6556e3b2bfdSEmilio G. Cota } 6566e3b2bfdSEmilio G. Cota 6579002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 6589002ec79SRichard Henderson { 659b0a0794aSRichard Henderson size_t prologue_size; 6608163b749SRichard Henderson 661b0a0794aSRichard Henderson s->code_ptr = s->code_gen_ptr; 662b0a0794aSRichard Henderson s->code_buf = s->code_gen_ptr; 6635b38ee31SRichard Henderson s->data_gen_ptr = NULL; 664b91ccb31SRichard Henderson 665b91ccb31SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 666b0a0794aSRichard Henderson tcg_qemu_tb_exec = (tcg_prologue_fn *)tcg_splitwx_to_rx(s->code_ptr); 667b91ccb31SRichard Henderson #endif 6688163b749SRichard Henderson 6695b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 6705b38ee31SRichard Henderson s->pool_labels = NULL; 6715b38ee31SRichard Henderson #endif 6725b38ee31SRichard Henderson 673653b87ebSRoman Bolshakov qemu_thread_jit_write(); 6748163b749SRichard Henderson /* Generate the prologue. */ 675b03cce8eSbellard tcg_target_qemu_prologue(s); 6765b38ee31SRichard Henderson 6775b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 6785b38ee31SRichard Henderson /* Allow the prologue to put e.g. guest_base into a pool entry. */ 6795b38ee31SRichard Henderson { 6801768987bSRichard Henderson int result = tcg_out_pool_finalize(s); 6811768987bSRichard Henderson tcg_debug_assert(result == 0); 6825b38ee31SRichard Henderson } 6835b38ee31SRichard Henderson #endif 6845b38ee31SRichard Henderson 685b0a0794aSRichard Henderson prologue_size = tcg_current_code_size(s); 686b0a0794aSRichard Henderson 687df5d2b16SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 688b0a0794aSRichard Henderson flush_idcache_range((uintptr_t)tcg_splitwx_to_rx(s->code_buf), 689b0a0794aSRichard Henderson (uintptr_t)s->code_buf, prologue_size); 690df5d2b16SRichard Henderson #endif 6918163b749SRichard Henderson 692bf042e8eSRichard Henderson tcg_region_prologue_set(s); 693d6b64b2bSRichard Henderson 694d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 695d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 696fc59d2d8SRobert Foley FILE *logfile = qemu_log_lock(); 6978163b749SRichard Henderson qemu_log("PROLOGUE: [size=%zu]\n", prologue_size); 6985b38ee31SRichard Henderson if (s->data_gen_ptr) { 699b0a0794aSRichard Henderson size_t code_size = s->data_gen_ptr - s->code_gen_ptr; 7005b38ee31SRichard Henderson size_t data_size = prologue_size - code_size; 7015b38ee31SRichard Henderson size_t i; 7025b38ee31SRichard Henderson 703b0a0794aSRichard Henderson log_disas(s->code_gen_ptr, code_size); 7045b38ee31SRichard Henderson 7055b38ee31SRichard Henderson for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) { 7065b38ee31SRichard Henderson if (sizeof(tcg_target_ulong) == 8) { 7075b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .quad 0x%016" PRIx64 "\n", 7085b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 7095b38ee31SRichard Henderson *(uint64_t *)(s->data_gen_ptr + i)); 7105b38ee31SRichard Henderson } else { 7115b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .long 0x%08x\n", 7125b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 7135b38ee31SRichard Henderson *(uint32_t *)(s->data_gen_ptr + i)); 7145b38ee31SRichard Henderson } 7155b38ee31SRichard Henderson } 7165b38ee31SRichard Henderson } else { 717b0a0794aSRichard Henderson log_disas(s->code_gen_ptr, prologue_size); 7185b38ee31SRichard Henderson } 719d6b64b2bSRichard Henderson qemu_log("\n"); 720d6b64b2bSRichard Henderson qemu_log_flush(); 721fc59d2d8SRobert Foley qemu_log_unlock(logfile); 722d6b64b2bSRichard Henderson } 723d6b64b2bSRichard Henderson #endif 724cedbcb01SEmilio G. Cota 725cedbcb01SEmilio G. Cota /* Assert that goto_ptr is implemented completely. */ 726cedbcb01SEmilio G. Cota if (TCG_TARGET_HAS_goto_ptr) { 7278b5c2b62SRichard Henderson tcg_debug_assert(tcg_code_gen_epilogue != NULL); 728cedbcb01SEmilio G. Cota } 729c896fe29Sbellard } 730c896fe29Sbellard 731c896fe29Sbellard void tcg_func_start(TCGContext *s) 732c896fe29Sbellard { 733c896fe29Sbellard tcg_pool_reset(s); 734c896fe29Sbellard s->nb_temps = s->nb_globals; 7350ec9eabcSRichard Henderson 7360ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. */ 7370ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 7380ec9eabcSRichard Henderson 739c0522136SRichard Henderson /* No constant temps have been previously allocated. */ 740c0522136SRichard Henderson for (int i = 0; i < TCG_TYPE_COUNT; ++i) { 741c0522136SRichard Henderson if (s->const_table[i]) { 742c0522136SRichard Henderson g_hash_table_remove_all(s->const_table[i]); 743c0522136SRichard Henderson } 744c0522136SRichard Henderson } 745c0522136SRichard Henderson 746abebf925SRichard Henderson s->nb_ops = 0; 747c896fe29Sbellard s->nb_labels = 0; 748c896fe29Sbellard s->current_frame_offset = s->frame_start; 749c896fe29Sbellard 7500a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 7510a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 7520a209d4bSRichard Henderson #endif 7530a209d4bSRichard Henderson 75415fa08f8SRichard Henderson QTAILQ_INIT(&s->ops); 75515fa08f8SRichard Henderson QTAILQ_INIT(&s->free_ops); 756bef16ab4SRichard Henderson QSIMPLEQ_INIT(&s->labels); 757c896fe29Sbellard } 758c896fe29Sbellard 759ae30e866SRichard Henderson static TCGTemp *tcg_temp_alloc(TCGContext *s) 7607ca4b752SRichard Henderson { 7617ca4b752SRichard Henderson int n = s->nb_temps++; 762ae30e866SRichard Henderson 763ae30e866SRichard Henderson if (n >= TCG_MAX_TEMPS) { 764db6b7d0cSRichard Henderson tcg_raise_tb_overflow(s); 765ae30e866SRichard Henderson } 7667ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 7677ca4b752SRichard Henderson } 7687ca4b752SRichard Henderson 769ae30e866SRichard Henderson static TCGTemp *tcg_global_alloc(TCGContext *s) 7707ca4b752SRichard Henderson { 771fa477d25SRichard Henderson TCGTemp *ts; 772fa477d25SRichard Henderson 7737ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 774ae30e866SRichard Henderson tcg_debug_assert(s->nb_globals < TCG_MAX_TEMPS); 7757ca4b752SRichard Henderson s->nb_globals++; 776fa477d25SRichard Henderson ts = tcg_temp_alloc(s); 777ee17db83SRichard Henderson ts->kind = TEMP_GLOBAL; 778fa477d25SRichard Henderson 779fa477d25SRichard Henderson return ts; 780c896fe29Sbellard } 781c896fe29Sbellard 782085272b3SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 783b6638662SRichard Henderson TCGReg reg, const char *name) 784c896fe29Sbellard { 785c896fe29Sbellard TCGTemp *ts; 786c896fe29Sbellard 787b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 788c896fe29Sbellard tcg_abort(); 789b3a62939SRichard Henderson } 7907ca4b752SRichard Henderson 7917ca4b752SRichard Henderson ts = tcg_global_alloc(s); 792c896fe29Sbellard ts->base_type = type; 793c896fe29Sbellard ts->type = type; 794ee17db83SRichard Henderson ts->kind = TEMP_FIXED; 795c896fe29Sbellard ts->reg = reg; 796c896fe29Sbellard ts->name = name; 797c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 7987ca4b752SRichard Henderson 799085272b3SRichard Henderson return ts; 800a7812ae4Spbrook } 801a7812ae4Spbrook 802b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 803a7812ae4Spbrook { 804b3a62939SRichard Henderson s->frame_start = start; 805b3a62939SRichard Henderson s->frame_end = start + size; 806085272b3SRichard Henderson s->frame_temp 807085272b3SRichard Henderson = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 808b3a62939SRichard Henderson } 809a7812ae4Spbrook 810085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 811e1ccc054SRichard Henderson intptr_t offset, const char *name) 812c896fe29Sbellard { 813b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 814dc41aa7dSRichard Henderson TCGTemp *base_ts = tcgv_ptr_temp(base); 8157ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 816b3915dbbSRichard Henderson int indirect_reg = 0, bigendian = 0; 8177ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 8187ca4b752SRichard Henderson bigendian = 1; 8197ca4b752SRichard Henderson #endif 820c896fe29Sbellard 821c0522136SRichard Henderson switch (base_ts->kind) { 822c0522136SRichard Henderson case TEMP_FIXED: 823c0522136SRichard Henderson break; 824c0522136SRichard Henderson case TEMP_GLOBAL: 8255a18407fSRichard Henderson /* We do not support double-indirect registers. */ 8265a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 827b3915dbbSRichard Henderson base_ts->indirect_base = 1; 8285a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 8295a18407fSRichard Henderson ? 2 : 1); 8305a18407fSRichard Henderson indirect_reg = 1; 831c0522136SRichard Henderson break; 832c0522136SRichard Henderson default: 833c0522136SRichard Henderson g_assert_not_reached(); 834b3915dbbSRichard Henderson } 835b3915dbbSRichard Henderson 8367ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 8377ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 838c896fe29Sbellard char buf[64]; 8397ca4b752SRichard Henderson 8407ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 841c896fe29Sbellard ts->type = TCG_TYPE_I32; 842b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 843c896fe29Sbellard ts->mem_allocated = 1; 844b3a62939SRichard Henderson ts->mem_base = base_ts; 8457ca4b752SRichard Henderson ts->mem_offset = offset + bigendian * 4; 846c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 847c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 848c896fe29Sbellard ts->name = strdup(buf); 849c896fe29Sbellard 8507ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 8517ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 8527ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 853b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 8547ca4b752SRichard Henderson ts2->mem_allocated = 1; 8557ca4b752SRichard Henderson ts2->mem_base = base_ts; 8567ca4b752SRichard Henderson ts2->mem_offset = offset + (1 - bigendian) * 4; 857c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 858c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 859120c1084SRichard Henderson ts2->name = strdup(buf); 8607ca4b752SRichard Henderson } else { 861c896fe29Sbellard ts->base_type = type; 862c896fe29Sbellard ts->type = type; 863b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 864c896fe29Sbellard ts->mem_allocated = 1; 865b3a62939SRichard Henderson ts->mem_base = base_ts; 866c896fe29Sbellard ts->mem_offset = offset; 867c896fe29Sbellard ts->name = name; 868c896fe29Sbellard } 869085272b3SRichard Henderson return ts; 870c896fe29Sbellard } 871c896fe29Sbellard 8725bfa8034SRichard Henderson TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local) 873c896fe29Sbellard { 874b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 875ee17db83SRichard Henderson TCGTempKind kind = temp_local ? TEMP_LOCAL : TEMP_NORMAL; 876c896fe29Sbellard TCGTemp *ts; 877641d5fbeSbellard int idx, k; 878c896fe29Sbellard 8790ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 8800ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 8810ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 8820ec9eabcSRichard Henderson /* There is already an available temp with the right type. */ 8830ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 8840ec9eabcSRichard Henderson 885e8996ee0Sbellard ts = &s->temps[idx]; 886e8996ee0Sbellard ts->temp_allocated = 1; 8877ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 888ee17db83SRichard Henderson tcg_debug_assert(ts->kind == kind); 889e8996ee0Sbellard } else { 8907ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 8917ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 8927ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 8937ca4b752SRichard Henderson 894c896fe29Sbellard ts->base_type = type; 895c896fe29Sbellard ts->type = TCG_TYPE_I32; 896e8996ee0Sbellard ts->temp_allocated = 1; 897ee17db83SRichard Henderson ts->kind = kind; 8987ca4b752SRichard Henderson 8997ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 9007ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 9017ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 9027ca4b752SRichard Henderson ts2->temp_allocated = 1; 903ee17db83SRichard Henderson ts2->kind = kind; 9047ca4b752SRichard Henderson } else { 905c896fe29Sbellard ts->base_type = type; 906c896fe29Sbellard ts->type = type; 907e8996ee0Sbellard ts->temp_allocated = 1; 908ee17db83SRichard Henderson ts->kind = kind; 909c896fe29Sbellard } 910e8996ee0Sbellard } 91127bfd83cSPeter Maydell 91227bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 91327bfd83cSPeter Maydell s->temps_in_use++; 91427bfd83cSPeter Maydell #endif 915085272b3SRichard Henderson return ts; 916c896fe29Sbellard } 917c896fe29Sbellard 918d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type) 919d2fd745fSRichard Henderson { 920d2fd745fSRichard Henderson TCGTemp *t; 921d2fd745fSRichard Henderson 922d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG 923d2fd745fSRichard Henderson switch (type) { 924d2fd745fSRichard Henderson case TCG_TYPE_V64: 925d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v64); 926d2fd745fSRichard Henderson break; 927d2fd745fSRichard Henderson case TCG_TYPE_V128: 928d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v128); 929d2fd745fSRichard Henderson break; 930d2fd745fSRichard Henderson case TCG_TYPE_V256: 931d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v256); 932d2fd745fSRichard Henderson break; 933d2fd745fSRichard Henderson default: 934d2fd745fSRichard Henderson g_assert_not_reached(); 935d2fd745fSRichard Henderson } 936d2fd745fSRichard Henderson #endif 937d2fd745fSRichard Henderson 938d2fd745fSRichard Henderson t = tcg_temp_new_internal(type, 0); 939d2fd745fSRichard Henderson return temp_tcgv_vec(t); 940d2fd745fSRichard Henderson } 941d2fd745fSRichard Henderson 942d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp. */ 943d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match) 944d2fd745fSRichard Henderson { 945d2fd745fSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 946d2fd745fSRichard Henderson 947d2fd745fSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 948d2fd745fSRichard Henderson 949d2fd745fSRichard Henderson t = tcg_temp_new_internal(t->base_type, 0); 950d2fd745fSRichard Henderson return temp_tcgv_vec(t); 951d2fd745fSRichard Henderson } 952d2fd745fSRichard Henderson 9535bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts) 954c896fe29Sbellard { 955b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 956085272b3SRichard Henderson int k, idx; 957c896fe29Sbellard 958c0522136SRichard Henderson /* In order to simplify users of tcg_constant_*, silently ignore free. */ 959c0522136SRichard Henderson if (ts->kind == TEMP_CONST) { 960c0522136SRichard Henderson return; 961c0522136SRichard Henderson } 962c0522136SRichard Henderson 96327bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 96427bfd83cSPeter Maydell s->temps_in_use--; 96527bfd83cSPeter Maydell if (s->temps_in_use < 0) { 96627bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 96727bfd83cSPeter Maydell } 96827bfd83cSPeter Maydell #endif 96927bfd83cSPeter Maydell 970ee17db83SRichard Henderson tcg_debug_assert(ts->kind < TEMP_GLOBAL); 971eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 972e8996ee0Sbellard ts->temp_allocated = 0; 9730ec9eabcSRichard Henderson 974085272b3SRichard Henderson idx = temp_idx(ts); 975ee17db83SRichard Henderson k = ts->base_type + (ts->kind == TEMP_NORMAL ? 0 : TCG_TYPE_COUNT); 9760ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 977e8996ee0Sbellard } 978e8996ee0Sbellard 979c0522136SRichard Henderson TCGTemp *tcg_constant_internal(TCGType type, int64_t val) 980c0522136SRichard Henderson { 981c0522136SRichard Henderson TCGContext *s = tcg_ctx; 982c0522136SRichard Henderson GHashTable *h = s->const_table[type]; 983c0522136SRichard Henderson TCGTemp *ts; 984c0522136SRichard Henderson 985c0522136SRichard Henderson if (h == NULL) { 986c0522136SRichard Henderson h = g_hash_table_new(g_int64_hash, g_int64_equal); 987c0522136SRichard Henderson s->const_table[type] = h; 988c0522136SRichard Henderson } 989c0522136SRichard Henderson 990c0522136SRichard Henderson ts = g_hash_table_lookup(h, &val); 991c0522136SRichard Henderson if (ts == NULL) { 992c0522136SRichard Henderson ts = tcg_temp_alloc(s); 993c0522136SRichard Henderson 994c0522136SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 995c0522136SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 996c0522136SRichard Henderson 997c0522136SRichard Henderson ts->base_type = TCG_TYPE_I64; 998c0522136SRichard Henderson ts->type = TCG_TYPE_I32; 999c0522136SRichard Henderson ts->kind = TEMP_CONST; 1000c0522136SRichard Henderson ts->temp_allocated = 1; 1001c0522136SRichard Henderson /* 1002c0522136SRichard Henderson * Retain the full value of the 64-bit constant in the low 1003c0522136SRichard Henderson * part, so that the hash table works. Actual uses will 1004c0522136SRichard Henderson * truncate the value to the low part. 1005c0522136SRichard Henderson */ 1006c0522136SRichard Henderson ts->val = val; 1007c0522136SRichard Henderson 1008c0522136SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 1009c0522136SRichard Henderson ts2->base_type = TCG_TYPE_I64; 1010c0522136SRichard Henderson ts2->type = TCG_TYPE_I32; 1011c0522136SRichard Henderson ts2->kind = TEMP_CONST; 1012c0522136SRichard Henderson ts2->temp_allocated = 1; 1013c0522136SRichard Henderson ts2->val = val >> 32; 1014c0522136SRichard Henderson } else { 1015c0522136SRichard Henderson ts->base_type = type; 1016c0522136SRichard Henderson ts->type = type; 1017c0522136SRichard Henderson ts->kind = TEMP_CONST; 1018c0522136SRichard Henderson ts->temp_allocated = 1; 1019c0522136SRichard Henderson ts->val = val; 1020c0522136SRichard Henderson } 1021c0522136SRichard Henderson g_hash_table_insert(h, &ts->val, ts); 1022c0522136SRichard Henderson } 1023c0522136SRichard Henderson 1024c0522136SRichard Henderson return ts; 1025c0522136SRichard Henderson } 1026c0522136SRichard Henderson 1027c0522136SRichard Henderson TCGv_vec tcg_constant_vec(TCGType type, unsigned vece, int64_t val) 1028c0522136SRichard Henderson { 1029c0522136SRichard Henderson val = dup_const(vece, val); 1030c0522136SRichard Henderson return temp_tcgv_vec(tcg_constant_internal(type, val)); 1031c0522136SRichard Henderson } 1032c0522136SRichard Henderson 103388d4005bSRichard Henderson TCGv_vec tcg_constant_vec_matching(TCGv_vec match, unsigned vece, int64_t val) 103488d4005bSRichard Henderson { 103588d4005bSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 103688d4005bSRichard Henderson 103788d4005bSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 103888d4005bSRichard Henderson return tcg_constant_vec(t->base_type, vece, val); 103988d4005bSRichard Henderson } 104088d4005bSRichard Henderson 1041a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 1042a7812ae4Spbrook { 1043a7812ae4Spbrook TCGv_i32 t0; 1044a7812ae4Spbrook t0 = tcg_temp_new_i32(); 1045e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 1046e8996ee0Sbellard return t0; 1047c896fe29Sbellard } 1048c896fe29Sbellard 1049a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 1050c896fe29Sbellard { 1051a7812ae4Spbrook TCGv_i64 t0; 1052a7812ae4Spbrook t0 = tcg_temp_new_i64(); 1053e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 1054e8996ee0Sbellard return t0; 1055c896fe29Sbellard } 1056c896fe29Sbellard 1057a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 1058bdffd4a9Saurel32 { 1059a7812ae4Spbrook TCGv_i32 t0; 1060a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 1061bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 1062bdffd4a9Saurel32 return t0; 1063bdffd4a9Saurel32 } 1064bdffd4a9Saurel32 1065a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 1066bdffd4a9Saurel32 { 1067a7812ae4Spbrook TCGv_i64 t0; 1068a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 1069bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 1070bdffd4a9Saurel32 return t0; 1071bdffd4a9Saurel32 } 1072bdffd4a9Saurel32 107327bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 107427bfd83cSPeter Maydell void tcg_clear_temp_count(void) 107527bfd83cSPeter Maydell { 1076b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 107727bfd83cSPeter Maydell s->temps_in_use = 0; 107827bfd83cSPeter Maydell } 107927bfd83cSPeter Maydell 108027bfd83cSPeter Maydell int tcg_check_temp_count(void) 108127bfd83cSPeter Maydell { 1082b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 108327bfd83cSPeter Maydell if (s->temps_in_use) { 108427bfd83cSPeter Maydell /* Clear the count so that we don't give another 108527bfd83cSPeter Maydell * warning immediately next time around. 108627bfd83cSPeter Maydell */ 108727bfd83cSPeter Maydell s->temps_in_use = 0; 108827bfd83cSPeter Maydell return 1; 108927bfd83cSPeter Maydell } 109027bfd83cSPeter Maydell return 0; 109127bfd83cSPeter Maydell } 109227bfd83cSPeter Maydell #endif 109327bfd83cSPeter Maydell 1094be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream. 1095be0f34b5SRichard Henderson Test the runtime variable that controls each opcode. */ 1096be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 1097be0f34b5SRichard Henderson { 1098d2fd745fSRichard Henderson const bool have_vec 1099d2fd745fSRichard Henderson = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256; 1100d2fd745fSRichard Henderson 1101be0f34b5SRichard Henderson switch (op) { 1102be0f34b5SRichard Henderson case INDEX_op_discard: 1103be0f34b5SRichard Henderson case INDEX_op_set_label: 1104be0f34b5SRichard Henderson case INDEX_op_call: 1105be0f34b5SRichard Henderson case INDEX_op_br: 1106be0f34b5SRichard Henderson case INDEX_op_mb: 1107be0f34b5SRichard Henderson case INDEX_op_insn_start: 1108be0f34b5SRichard Henderson case INDEX_op_exit_tb: 1109be0f34b5SRichard Henderson case INDEX_op_goto_tb: 1110be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 1111be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 1112be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 1113be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 1114be0f34b5SRichard Henderson return true; 1115be0f34b5SRichard Henderson 111607ce0b05SRichard Henderson case INDEX_op_qemu_st8_i32: 111707ce0b05SRichard Henderson return TCG_TARGET_HAS_qemu_st8_i32; 111807ce0b05SRichard Henderson 1119be0f34b5SRichard Henderson case INDEX_op_goto_ptr: 1120be0f34b5SRichard Henderson return TCG_TARGET_HAS_goto_ptr; 1121be0f34b5SRichard Henderson 1122be0f34b5SRichard Henderson case INDEX_op_mov_i32: 1123be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 1124be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 1125be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 1126be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 1127be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 1128be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 1129be0f34b5SRichard Henderson case INDEX_op_ld_i32: 1130be0f34b5SRichard Henderson case INDEX_op_st8_i32: 1131be0f34b5SRichard Henderson case INDEX_op_st16_i32: 1132be0f34b5SRichard Henderson case INDEX_op_st_i32: 1133be0f34b5SRichard Henderson case INDEX_op_add_i32: 1134be0f34b5SRichard Henderson case INDEX_op_sub_i32: 1135be0f34b5SRichard Henderson case INDEX_op_mul_i32: 1136be0f34b5SRichard Henderson case INDEX_op_and_i32: 1137be0f34b5SRichard Henderson case INDEX_op_or_i32: 1138be0f34b5SRichard Henderson case INDEX_op_xor_i32: 1139be0f34b5SRichard Henderson case INDEX_op_shl_i32: 1140be0f34b5SRichard Henderson case INDEX_op_shr_i32: 1141be0f34b5SRichard Henderson case INDEX_op_sar_i32: 1142be0f34b5SRichard Henderson return true; 1143be0f34b5SRichard Henderson 1144be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 1145be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 1146be0f34b5SRichard Henderson case INDEX_op_div_i32: 1147be0f34b5SRichard Henderson case INDEX_op_divu_i32: 1148be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 1149be0f34b5SRichard Henderson case INDEX_op_rem_i32: 1150be0f34b5SRichard Henderson case INDEX_op_remu_i32: 1151be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 1152be0f34b5SRichard Henderson case INDEX_op_div2_i32: 1153be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 1154be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 1155be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 1156be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 1157be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 1158be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 1159be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 1160be0f34b5SRichard Henderson case INDEX_op_extract_i32: 1161be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 1162be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 1163be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 1164fce1296fSRichard Henderson case INDEX_op_extract2_i32: 1165fce1296fSRichard Henderson return TCG_TARGET_HAS_extract2_i32; 1166be0f34b5SRichard Henderson case INDEX_op_add2_i32: 1167be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 1168be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 1169be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 1170be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 1171be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 1172be0f34b5SRichard Henderson case INDEX_op_muls2_i32: 1173be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 1174be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 1175be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 1176be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 1177be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 1178be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 1179be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 1180be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 1181be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 1182be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 1183be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 1184be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 1185be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 1186be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 1187be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 1188be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 1189be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 1190be0f34b5SRichard Henderson case INDEX_op_not_i32: 1191be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 1192be0f34b5SRichard Henderson case INDEX_op_neg_i32: 1193be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 1194be0f34b5SRichard Henderson case INDEX_op_andc_i32: 1195be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 1196be0f34b5SRichard Henderson case INDEX_op_orc_i32: 1197be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 1198be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 1199be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 1200be0f34b5SRichard Henderson case INDEX_op_nand_i32: 1201be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 1202be0f34b5SRichard Henderson case INDEX_op_nor_i32: 1203be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 1204be0f34b5SRichard Henderson case INDEX_op_clz_i32: 1205be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i32; 1206be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 1207be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 1208be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 1209be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 1210be0f34b5SRichard Henderson 1211be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 1212be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 1213be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 1214be0f34b5SRichard Henderson 1215be0f34b5SRichard Henderson case INDEX_op_mov_i64: 1216be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 1217be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 1218be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 1219be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 1220be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 1221be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 1222be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 1223be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 1224be0f34b5SRichard Henderson case INDEX_op_ld_i64: 1225be0f34b5SRichard Henderson case INDEX_op_st8_i64: 1226be0f34b5SRichard Henderson case INDEX_op_st16_i64: 1227be0f34b5SRichard Henderson case INDEX_op_st32_i64: 1228be0f34b5SRichard Henderson case INDEX_op_st_i64: 1229be0f34b5SRichard Henderson case INDEX_op_add_i64: 1230be0f34b5SRichard Henderson case INDEX_op_sub_i64: 1231be0f34b5SRichard Henderson case INDEX_op_mul_i64: 1232be0f34b5SRichard Henderson case INDEX_op_and_i64: 1233be0f34b5SRichard Henderson case INDEX_op_or_i64: 1234be0f34b5SRichard Henderson case INDEX_op_xor_i64: 1235be0f34b5SRichard Henderson case INDEX_op_shl_i64: 1236be0f34b5SRichard Henderson case INDEX_op_shr_i64: 1237be0f34b5SRichard Henderson case INDEX_op_sar_i64: 1238be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 1239be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 1240be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 1241be0f34b5SRichard Henderson 1242be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 1243be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 1244be0f34b5SRichard Henderson case INDEX_op_div_i64: 1245be0f34b5SRichard Henderson case INDEX_op_divu_i64: 1246be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 1247be0f34b5SRichard Henderson case INDEX_op_rem_i64: 1248be0f34b5SRichard Henderson case INDEX_op_remu_i64: 1249be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 1250be0f34b5SRichard Henderson case INDEX_op_div2_i64: 1251be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 1252be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 1253be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 1254be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 1255be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 1256be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 1257be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 1258be0f34b5SRichard Henderson case INDEX_op_extract_i64: 1259be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 1260be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 1261be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 1262fce1296fSRichard Henderson case INDEX_op_extract2_i64: 1263fce1296fSRichard Henderson return TCG_TARGET_HAS_extract2_i64; 1264be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 1265be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 1266be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 1267be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 1268be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 1269be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 1270be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 1271be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i64; 1272be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 1273be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 1274be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 1275be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 1276be0f34b5SRichard Henderson case INDEX_op_ext16u_i64: 1277be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 1278be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 1279be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 1280be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 1281be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 1282be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 1283be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 1284be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 1285be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 1286be0f34b5SRichard Henderson case INDEX_op_not_i64: 1287be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 1288be0f34b5SRichard Henderson case INDEX_op_neg_i64: 1289be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 1290be0f34b5SRichard Henderson case INDEX_op_andc_i64: 1291be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 1292be0f34b5SRichard Henderson case INDEX_op_orc_i64: 1293be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 1294be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 1295be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 1296be0f34b5SRichard Henderson case INDEX_op_nand_i64: 1297be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 1298be0f34b5SRichard Henderson case INDEX_op_nor_i64: 1299be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 1300be0f34b5SRichard Henderson case INDEX_op_clz_i64: 1301be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 1302be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 1303be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 1304be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 1305be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 1306be0f34b5SRichard Henderson case INDEX_op_add2_i64: 1307be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 1308be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 1309be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 1310be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 1311be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 1312be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 1313be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 1314be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 1315be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 1316be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 1317be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 1318be0f34b5SRichard Henderson 1319d2fd745fSRichard Henderson case INDEX_op_mov_vec: 1320d2fd745fSRichard Henderson case INDEX_op_dup_vec: 132137ee55a0SRichard Henderson case INDEX_op_dupm_vec: 1322d2fd745fSRichard Henderson case INDEX_op_ld_vec: 1323d2fd745fSRichard Henderson case INDEX_op_st_vec: 1324d2fd745fSRichard Henderson case INDEX_op_add_vec: 1325d2fd745fSRichard Henderson case INDEX_op_sub_vec: 1326d2fd745fSRichard Henderson case INDEX_op_and_vec: 1327d2fd745fSRichard Henderson case INDEX_op_or_vec: 1328d2fd745fSRichard Henderson case INDEX_op_xor_vec: 1329212be173SRichard Henderson case INDEX_op_cmp_vec: 1330d2fd745fSRichard Henderson return have_vec; 1331d2fd745fSRichard Henderson case INDEX_op_dup2_vec: 1332d2fd745fSRichard Henderson return have_vec && TCG_TARGET_REG_BITS == 32; 1333d2fd745fSRichard Henderson case INDEX_op_not_vec: 1334d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_not_vec; 1335d2fd745fSRichard Henderson case INDEX_op_neg_vec: 1336d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_neg_vec; 1337bcefc902SRichard Henderson case INDEX_op_abs_vec: 1338bcefc902SRichard Henderson return have_vec && TCG_TARGET_HAS_abs_vec; 1339d2fd745fSRichard Henderson case INDEX_op_andc_vec: 1340d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_andc_vec; 1341d2fd745fSRichard Henderson case INDEX_op_orc_vec: 1342d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_orc_vec; 13433774030aSRichard Henderson case INDEX_op_mul_vec: 13443774030aSRichard Henderson return have_vec && TCG_TARGET_HAS_mul_vec; 1345d0ec9796SRichard Henderson case INDEX_op_shli_vec: 1346d0ec9796SRichard Henderson case INDEX_op_shri_vec: 1347d0ec9796SRichard Henderson case INDEX_op_sari_vec: 1348d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shi_vec; 1349d0ec9796SRichard Henderson case INDEX_op_shls_vec: 1350d0ec9796SRichard Henderson case INDEX_op_shrs_vec: 1351d0ec9796SRichard Henderson case INDEX_op_sars_vec: 1352d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shs_vec; 1353d0ec9796SRichard Henderson case INDEX_op_shlv_vec: 1354d0ec9796SRichard Henderson case INDEX_op_shrv_vec: 1355d0ec9796SRichard Henderson case INDEX_op_sarv_vec: 1356d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shv_vec; 1357b0f7e744SRichard Henderson case INDEX_op_rotli_vec: 1358b0f7e744SRichard Henderson return have_vec && TCG_TARGET_HAS_roti_vec; 135923850a74SRichard Henderson case INDEX_op_rotls_vec: 136023850a74SRichard Henderson return have_vec && TCG_TARGET_HAS_rots_vec; 13615d0ceda9SRichard Henderson case INDEX_op_rotlv_vec: 13625d0ceda9SRichard Henderson case INDEX_op_rotrv_vec: 13635d0ceda9SRichard Henderson return have_vec && TCG_TARGET_HAS_rotv_vec; 13648afaf050SRichard Henderson case INDEX_op_ssadd_vec: 13658afaf050SRichard Henderson case INDEX_op_usadd_vec: 13668afaf050SRichard Henderson case INDEX_op_sssub_vec: 13678afaf050SRichard Henderson case INDEX_op_ussub_vec: 13688afaf050SRichard Henderson return have_vec && TCG_TARGET_HAS_sat_vec; 1369dd0a0fcdSRichard Henderson case INDEX_op_smin_vec: 1370dd0a0fcdSRichard Henderson case INDEX_op_umin_vec: 1371dd0a0fcdSRichard Henderson case INDEX_op_smax_vec: 1372dd0a0fcdSRichard Henderson case INDEX_op_umax_vec: 1373dd0a0fcdSRichard Henderson return have_vec && TCG_TARGET_HAS_minmax_vec; 137438dc1294SRichard Henderson case INDEX_op_bitsel_vec: 137538dc1294SRichard Henderson return have_vec && TCG_TARGET_HAS_bitsel_vec; 1376f75da298SRichard Henderson case INDEX_op_cmpsel_vec: 1377f75da298SRichard Henderson return have_vec && TCG_TARGET_HAS_cmpsel_vec; 1378d2fd745fSRichard Henderson 1379db432672SRichard Henderson default: 1380db432672SRichard Henderson tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS); 1381db432672SRichard Henderson return true; 1382be0f34b5SRichard Henderson } 1383be0f34b5SRichard Henderson } 1384be0f34b5SRichard Henderson 138539cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 138639cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 138739cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 1388ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args) 1389c896fe29Sbellard { 139075e8b9b7SRichard Henderson int i, real_args, nb_rets, pi; 13913e92aa34SRichard Henderson unsigned typemask; 13923e92aa34SRichard Henderson const TCGHelperInfo *info; 139375e8b9b7SRichard Henderson TCGOp *op; 1394afb49896SRichard Henderson 1395619205fdSEmilio G. Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 13967319d83aSRichard Henderson typemask = info->typemask; 13972bece2c8SRichard Henderson 139838b47b19SEmilio G. Cota #ifdef CONFIG_PLUGIN 139938b47b19SEmilio G. Cota /* detect non-plugin helpers */ 140038b47b19SEmilio G. Cota if (tcg_ctx->plugin_insn && unlikely(strncmp(info->name, "plugin_", 7))) { 140138b47b19SEmilio G. Cota tcg_ctx->plugin_insn->calls_helpers = true; 140238b47b19SEmilio G. Cota } 140338b47b19SEmilio G. Cota #endif 140438b47b19SEmilio G. Cota 140534b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 140634b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 140734b1a49cSRichard Henderson /* We have 64-bit values in one register, but need to pass as two 140834b1a49cSRichard Henderson separate parameters. Split them. */ 14097319d83aSRichard Henderson int orig_typemask = typemask; 141034b1a49cSRichard Henderson int orig_nargs = nargs; 141134b1a49cSRichard Henderson TCGv_i64 retl, reth; 1412ae8b75dcSRichard Henderson TCGTemp *split_args[MAX_OPC_PARAM]; 141334b1a49cSRichard Henderson 1414f764718dSRichard Henderson retl = NULL; 1415f764718dSRichard Henderson reth = NULL; 14167319d83aSRichard Henderson typemask = 0; 141734b1a49cSRichard Henderson for (i = real_args = 0; i < nargs; ++i) { 14187319d83aSRichard Henderson int argtype = extract32(orig_typemask, (i + 1) * 3, 3); 14197319d83aSRichard Henderson bool is_64bit = (argtype & ~1) == dh_typecode_i64; 14207319d83aSRichard Henderson 142134b1a49cSRichard Henderson if (is_64bit) { 1422085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 142334b1a49cSRichard Henderson TCGv_i32 h = tcg_temp_new_i32(); 142434b1a49cSRichard Henderson TCGv_i32 l = tcg_temp_new_i32(); 142534b1a49cSRichard Henderson tcg_gen_extr_i64_i32(l, h, orig); 1426ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(h); 14277319d83aSRichard Henderson typemask |= dh_typecode_i32 << (real_args * 3); 1428ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(l); 14297319d83aSRichard Henderson typemask |= dh_typecode_i32 << (real_args * 3); 143034b1a49cSRichard Henderson } else { 143134b1a49cSRichard Henderson split_args[real_args++] = args[i]; 14327319d83aSRichard Henderson typemask |= argtype << (real_args * 3); 143334b1a49cSRichard Henderson } 143434b1a49cSRichard Henderson } 143534b1a49cSRichard Henderson nargs = real_args; 143634b1a49cSRichard Henderson args = split_args; 143734b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 14382bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 14397319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 14407319d83aSRichard Henderson bool is_32bit = (argtype & ~1) == dh_typecode_i32; 14417319d83aSRichard Henderson bool is_signed = argtype & 1; 14427319d83aSRichard Henderson 14437319d83aSRichard Henderson if (is_32bit) { 14442bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 1445085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 14462bece2c8SRichard Henderson if (is_signed) { 14472bece2c8SRichard Henderson tcg_gen_ext32s_i64(temp, orig); 14482bece2c8SRichard Henderson } else { 14492bece2c8SRichard Henderson tcg_gen_ext32u_i64(temp, orig); 14502bece2c8SRichard Henderson } 1451ae8b75dcSRichard Henderson args[i] = tcgv_i64_temp(temp); 14522bece2c8SRichard Henderson } 14532bece2c8SRichard Henderson } 14542bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 14552bece2c8SRichard Henderson 145615fa08f8SRichard Henderson op = tcg_emit_op(INDEX_op_call); 145775e8b9b7SRichard Henderson 145875e8b9b7SRichard Henderson pi = 0; 1459ae8b75dcSRichard Henderson if (ret != NULL) { 146034b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 146134b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 14627319d83aSRichard Henderson if ((typemask & 6) == dh_typecode_i64) { 146334b1a49cSRichard Henderson /* The 32-bit ABI is going to return the 64-bit value in 146434b1a49cSRichard Henderson the %o0/%o1 register pair. Prepare for this by using 146534b1a49cSRichard Henderson two return temporaries, and reassemble below. */ 146634b1a49cSRichard Henderson retl = tcg_temp_new_i64(); 146734b1a49cSRichard Henderson reth = tcg_temp_new_i64(); 1468ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(reth); 1469ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(retl); 147034b1a49cSRichard Henderson nb_rets = 2; 147134b1a49cSRichard Henderson } else { 1472ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 147334b1a49cSRichard Henderson nb_rets = 1; 147434b1a49cSRichard Henderson } 147534b1a49cSRichard Henderson #else 14767319d83aSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (typemask & 6) == dh_typecode_i64) { 147702eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 1478ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1479ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1480a7812ae4Spbrook #else 1481ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1482ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1483a7812ae4Spbrook #endif 1484a7812ae4Spbrook nb_rets = 2; 148534b1a49cSRichard Henderson } else { 1486ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1487a7812ae4Spbrook nb_rets = 1; 1488a7812ae4Spbrook } 148934b1a49cSRichard Henderson #endif 1490a7812ae4Spbrook } else { 1491a7812ae4Spbrook nb_rets = 0; 1492a7812ae4Spbrook } 1493cd9090aaSRichard Henderson TCGOP_CALLO(op) = nb_rets; 149475e8b9b7SRichard Henderson 1495a7812ae4Spbrook real_args = 0; 1496a7812ae4Spbrook for (i = 0; i < nargs; i++) { 14977319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 14987319d83aSRichard Henderson bool is_64bit = (argtype & ~1) == dh_typecode_i64; 14997319d83aSRichard Henderson 1500bbb8a1b4SRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 150139cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS 150239cf05d3Sbellard /* some targets want aligned 64 bit args */ 1503ebd486d5Smalc if (real_args & 1) { 150475e8b9b7SRichard Henderson op->args[pi++] = TCG_CALL_DUMMY_ARG; 1505ebd486d5Smalc real_args++; 150639cf05d3Sbellard } 150739cf05d3Sbellard #endif 15083f90f252SRichard Henderson /* If stack grows up, then we will be placing successive 15093f90f252SRichard Henderson arguments at lower addresses, which means we need to 15103f90f252SRichard Henderson reverse the order compared to how we would normally 15113f90f252SRichard Henderson treat either big or little-endian. For those arguments 15123f90f252SRichard Henderson that will wind up in registers, this still works for 15133f90f252SRichard Henderson HPPA (the only current STACK_GROWSUP target) since the 15143f90f252SRichard Henderson argument registers are *also* allocated in decreasing 15153f90f252SRichard Henderson order. If another such target is added, this logic may 15163f90f252SRichard Henderson have to get more complicated to differentiate between 15173f90f252SRichard Henderson stack arguments and register arguments. */ 151802eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP) 1519ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1520ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1521c896fe29Sbellard #else 1522ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1523ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1524c896fe29Sbellard #endif 1525a7812ae4Spbrook real_args += 2; 15262bece2c8SRichard Henderson continue; 15272bece2c8SRichard Henderson } 15282bece2c8SRichard Henderson 1529ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1530a7812ae4Spbrook real_args++; 1531c896fe29Sbellard } 153275e8b9b7SRichard Henderson op->args[pi++] = (uintptr_t)func; 15333e92aa34SRichard Henderson op->args[pi++] = (uintptr_t)info; 1534cd9090aaSRichard Henderson TCGOP_CALLI(op) = real_args; 1535a7812ae4Spbrook 153675e8b9b7SRichard Henderson /* Make sure the fields didn't overflow. */ 1537cd9090aaSRichard Henderson tcg_debug_assert(TCGOP_CALLI(op) == real_args); 153875e8b9b7SRichard Henderson tcg_debug_assert(pi <= ARRAY_SIZE(op->args)); 15392bece2c8SRichard Henderson 154034b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 154134b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 154234b1a49cSRichard Henderson /* Free all of the parts we allocated above. */ 154334b1a49cSRichard Henderson for (i = real_args = 0; i < orig_nargs; ++i) { 15447319d83aSRichard Henderson int argtype = extract32(orig_typemask, (i + 1) * 3, 3); 15457319d83aSRichard Henderson bool is_64bit = (argtype & ~1) == dh_typecode_i64; 15467319d83aSRichard Henderson 154734b1a49cSRichard Henderson if (is_64bit) { 1548085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 1549085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 155034b1a49cSRichard Henderson } else { 155134b1a49cSRichard Henderson real_args++; 155234b1a49cSRichard Henderson } 155334b1a49cSRichard Henderson } 15547319d83aSRichard Henderson if ((orig_typemask & 6) == dh_typecode_i64) { 155534b1a49cSRichard Henderson /* The 32-bit ABI returned two 32-bit pieces. Re-assemble them. 155634b1a49cSRichard Henderson Note that describing these as TCGv_i64 eliminates an unnecessary 155734b1a49cSRichard Henderson zero-extension that tcg_gen_concat_i32_i64 would create. */ 1558085272b3SRichard Henderson tcg_gen_concat32_i64(temp_tcgv_i64(ret), retl, reth); 155934b1a49cSRichard Henderson tcg_temp_free_i64(retl); 156034b1a49cSRichard Henderson tcg_temp_free_i64(reth); 156134b1a49cSRichard Henderson } 156234b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 15632bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 15647319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 15657319d83aSRichard Henderson bool is_32bit = (argtype & ~1) == dh_typecode_i32; 15667319d83aSRichard Henderson 15677319d83aSRichard Henderson if (is_32bit) { 1568085272b3SRichard Henderson tcg_temp_free_internal(args[i]); 15692bece2c8SRichard Henderson } 15702bece2c8SRichard Henderson } 15712bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1572a7812ae4Spbrook } 1573c896fe29Sbellard 15748fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1575c896fe29Sbellard { 1576ac3b8891SRichard Henderson int i, n; 1577ac3b8891SRichard Henderson 1578ee17db83SRichard Henderson for (i = 0, n = s->nb_temps; i < n; i++) { 1579ee17db83SRichard Henderson TCGTemp *ts = &s->temps[i]; 1580ee17db83SRichard Henderson TCGTempVal val = TEMP_VAL_MEM; 1581ee17db83SRichard Henderson 1582ee17db83SRichard Henderson switch (ts->kind) { 1583c0522136SRichard Henderson case TEMP_CONST: 1584c0522136SRichard Henderson val = TEMP_VAL_CONST; 1585c0522136SRichard Henderson break; 1586ee17db83SRichard Henderson case TEMP_FIXED: 1587ee17db83SRichard Henderson val = TEMP_VAL_REG; 1588ee17db83SRichard Henderson break; 1589ee17db83SRichard Henderson case TEMP_GLOBAL: 1590ee17db83SRichard Henderson break; 1591ee17db83SRichard Henderson case TEMP_NORMAL: 1592ee17db83SRichard Henderson val = TEMP_VAL_DEAD; 1593ee17db83SRichard Henderson /* fall through */ 1594ee17db83SRichard Henderson case TEMP_LOCAL: 1595e8996ee0Sbellard ts->mem_allocated = 0; 1596ee17db83SRichard Henderson break; 1597ee17db83SRichard Henderson default: 1598ee17db83SRichard Henderson g_assert_not_reached(); 1599ee17db83SRichard Henderson } 1600ee17db83SRichard Henderson ts->val_type = val; 1601e8996ee0Sbellard } 1602f8b2f202SRichard Henderson 1603f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1604c896fe29Sbellard } 1605c896fe29Sbellard 1606f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1607f8b2f202SRichard Henderson TCGTemp *ts) 1608c896fe29Sbellard { 16091807f4c4SRichard Henderson int idx = temp_idx(ts); 1610ac56dd48Spbrook 1611ee17db83SRichard Henderson switch (ts->kind) { 1612ee17db83SRichard Henderson case TEMP_FIXED: 1613ee17db83SRichard Henderson case TEMP_GLOBAL: 1614ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1615ee17db83SRichard Henderson break; 1616ee17db83SRichard Henderson case TEMP_LOCAL: 1617641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1618ee17db83SRichard Henderson break; 1619ee17db83SRichard Henderson case TEMP_NORMAL: 1620ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1621ee17db83SRichard Henderson break; 1622c0522136SRichard Henderson case TEMP_CONST: 1623c0522136SRichard Henderson switch (ts->type) { 1624c0522136SRichard Henderson case TCG_TYPE_I32: 1625c0522136SRichard Henderson snprintf(buf, buf_size, "$0x%x", (int32_t)ts->val); 1626c0522136SRichard Henderson break; 1627c0522136SRichard Henderson #if TCG_TARGET_REG_BITS > 32 1628c0522136SRichard Henderson case TCG_TYPE_I64: 1629c0522136SRichard Henderson snprintf(buf, buf_size, "$0x%" PRIx64, ts->val); 1630c0522136SRichard Henderson break; 1631c0522136SRichard Henderson #endif 1632c0522136SRichard Henderson case TCG_TYPE_V64: 1633c0522136SRichard Henderson case TCG_TYPE_V128: 1634c0522136SRichard Henderson case TCG_TYPE_V256: 1635c0522136SRichard Henderson snprintf(buf, buf_size, "v%d$0x%" PRIx64, 1636c0522136SRichard Henderson 64 << (ts->type - TCG_TYPE_V64), ts->val); 1637c0522136SRichard Henderson break; 1638c0522136SRichard Henderson default: 1639c0522136SRichard Henderson g_assert_not_reached(); 1640c0522136SRichard Henderson } 1641c0522136SRichard Henderson break; 1642c896fe29Sbellard } 1643c896fe29Sbellard return buf; 1644c896fe29Sbellard } 1645c896fe29Sbellard 164643439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf, 164743439139SRichard Henderson int buf_size, TCGArg arg) 1648f8b2f202SRichard Henderson { 164943439139SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg)); 1650f8b2f202SRichard Henderson } 1651f8b2f202SRichard Henderson 1652f48f3edeSblueswir1 static const char * const cond_name[] = 1653f48f3edeSblueswir1 { 16540aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 16550aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1656f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1657f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1658f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1659f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1660f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1661f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1662f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1663f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1664f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1665f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1666f48f3edeSblueswir1 }; 1667f48f3edeSblueswir1 1668f713d6adSRichard Henderson static const char * const ldst_name[] = 1669f713d6adSRichard Henderson { 1670f713d6adSRichard Henderson [MO_UB] = "ub", 1671f713d6adSRichard Henderson [MO_SB] = "sb", 1672f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1673f713d6adSRichard Henderson [MO_LESW] = "lesw", 1674f713d6adSRichard Henderson [MO_LEUL] = "leul", 1675f713d6adSRichard Henderson [MO_LESL] = "lesl", 1676f713d6adSRichard Henderson [MO_LEQ] = "leq", 1677f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1678f713d6adSRichard Henderson [MO_BESW] = "besw", 1679f713d6adSRichard Henderson [MO_BEUL] = "beul", 1680f713d6adSRichard Henderson [MO_BESL] = "besl", 1681f713d6adSRichard Henderson [MO_BEQ] = "beq", 1682f713d6adSRichard Henderson }; 1683f713d6adSRichard Henderson 16841f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 168552bf9771Stony.nguyen@bt.com #ifdef TARGET_ALIGNED_ONLY 16861f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "un+", 16871f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 16881f00b27fSSergey Sorokin #else 16891f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 16901f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 16911f00b27fSSergey Sorokin #endif 16921f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 16931f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 16941f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 16951f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 16961f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 16971f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 16981f00b27fSSergey Sorokin }; 16991f00b27fSSergey Sorokin 1700b016486eSRichard Henderson static inline bool tcg_regset_single(TCGRegSet d) 1701b016486eSRichard Henderson { 1702b016486eSRichard Henderson return (d & (d - 1)) == 0; 1703b016486eSRichard Henderson } 1704b016486eSRichard Henderson 1705b016486eSRichard Henderson static inline TCGReg tcg_regset_first(TCGRegSet d) 1706b016486eSRichard Henderson { 1707b016486eSRichard Henderson if (TCG_TARGET_NB_REGS <= 32) { 1708b016486eSRichard Henderson return ctz32(d); 1709b016486eSRichard Henderson } else { 1710b016486eSRichard Henderson return ctz64(d); 1711b016486eSRichard Henderson } 1712b016486eSRichard Henderson } 1713b016486eSRichard Henderson 17141894f69aSRichard Henderson static void tcg_dump_ops(TCGContext *s, bool have_prefs) 1715c896fe29Sbellard { 1716c896fe29Sbellard char buf[128]; 1717c45cb8bbSRichard Henderson TCGOp *op; 1718c896fe29Sbellard 171915fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 1720c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1721c45cb8bbSRichard Henderson const TCGOpDef *def; 1722c45cb8bbSRichard Henderson TCGOpcode c; 1723bdfb460eSRichard Henderson int col = 0; 1724c45cb8bbSRichard Henderson 1725c45cb8bbSRichard Henderson c = op->opc; 1726c896fe29Sbellard def = &tcg_op_defs[c]; 1727c45cb8bbSRichard Henderson 1728765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 1729b016486eSRichard Henderson nb_oargs = 0; 173015fa08f8SRichard Henderson col += qemu_log("\n ----"); 17319aef40edSRichard Henderson 17329aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 17339aef40edSRichard Henderson target_ulong a; 17347e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 1735efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 17367e4597d7Sbellard #else 1737efee3746SRichard Henderson a = op->args[i]; 17387e4597d7Sbellard #endif 1739bdfb460eSRichard Henderson col += qemu_log(" " TARGET_FMT_lx, a); 1740eeacee4dSBlue Swirl } 17417e4597d7Sbellard } else if (c == INDEX_op_call) { 17423e92aa34SRichard Henderson const TCGHelperInfo *info = tcg_call_info(op); 1743*fa52e660SRichard Henderson void *func = tcg_call_func(op); 17443e92aa34SRichard Henderson 1745c896fe29Sbellard /* variable number of arguments */ 1746cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 1747cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 1748c896fe29Sbellard nb_cargs = def->nb_cargs; 1749b03cce8eSbellard 17503e92aa34SRichard Henderson col += qemu_log(" %s ", def->name); 17513e92aa34SRichard Henderson 17523e92aa34SRichard Henderson /* 17533e92aa34SRichard Henderson * Print the function name from TCGHelperInfo, if available. 17543e92aa34SRichard Henderson * Note that plugins have a template function for the info, 17553e92aa34SRichard Henderson * but the actual function pointer comes from the plugin. 17563e92aa34SRichard Henderson */ 17573e92aa34SRichard Henderson if (func == info->func) { 17583e92aa34SRichard Henderson col += qemu_log("%s", info->name); 17593e92aa34SRichard Henderson } else { 17603e92aa34SRichard Henderson col += qemu_log("plugin(%p)", func); 17613e92aa34SRichard Henderson } 17623e92aa34SRichard Henderson 17633e92aa34SRichard Henderson col += qemu_log("$0x%x,$%d", info->flags, nb_oargs); 1764b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 176543439139SRichard Henderson col += qemu_log(",%s", tcg_get_arg_str(s, buf, sizeof(buf), 1766efee3746SRichard Henderson op->args[i])); 1767b03cce8eSbellard } 1768cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1769efee3746SRichard Henderson TCGArg arg = op->args[nb_oargs + i]; 1770cf066674SRichard Henderson const char *t = "<dummy>"; 1771cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 177243439139SRichard Henderson t = tcg_get_arg_str(s, buf, sizeof(buf), arg); 1773b03cce8eSbellard } 1774bdfb460eSRichard Henderson col += qemu_log(",%s", t); 1775e8996ee0Sbellard } 1776b03cce8eSbellard } else { 1777bdfb460eSRichard Henderson col += qemu_log(" %s ", def->name); 1778c45cb8bbSRichard Henderson 1779c896fe29Sbellard nb_oargs = def->nb_oargs; 1780c896fe29Sbellard nb_iargs = def->nb_iargs; 1781c896fe29Sbellard nb_cargs = def->nb_cargs; 1782c896fe29Sbellard 1783d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 1784d2fd745fSRichard Henderson col += qemu_log("v%d,e%d,", 64 << TCGOP_VECL(op), 1785d2fd745fSRichard Henderson 8 << TCGOP_VECE(op)); 1786d2fd745fSRichard Henderson } 1787d2fd745fSRichard Henderson 1788c896fe29Sbellard k = 0; 1789c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1790eeacee4dSBlue Swirl if (k != 0) { 1791bdfb460eSRichard Henderson col += qemu_log(","); 1792eeacee4dSBlue Swirl } 179343439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1794efee3746SRichard Henderson op->args[k++])); 1795c896fe29Sbellard } 1796c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1797eeacee4dSBlue Swirl if (k != 0) { 1798bdfb460eSRichard Henderson col += qemu_log(","); 1799eeacee4dSBlue Swirl } 180043439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1801efee3746SRichard Henderson op->args[k++])); 1802c896fe29Sbellard } 1803be210acbSRichard Henderson switch (c) { 1804be210acbSRichard Henderson case INDEX_op_brcond_i32: 1805ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1806ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1807be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1808be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1809ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1810be210acbSRichard Henderson case INDEX_op_setcond_i64: 1811ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1812212be173SRichard Henderson case INDEX_op_cmp_vec: 1813f75da298SRichard Henderson case INDEX_op_cmpsel_vec: 1814efee3746SRichard Henderson if (op->args[k] < ARRAY_SIZE(cond_name) 1815efee3746SRichard Henderson && cond_name[op->args[k]]) { 1816efee3746SRichard Henderson col += qemu_log(",%s", cond_name[op->args[k++]]); 1817eeacee4dSBlue Swirl } else { 1818efee3746SRichard Henderson col += qemu_log(",$0x%" TCG_PRIlx, op->args[k++]); 1819eeacee4dSBlue Swirl } 1820f48f3edeSblueswir1 i = 1; 1821be210acbSRichard Henderson break; 1822f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1823f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 182407ce0b05SRichard Henderson case INDEX_op_qemu_st8_i32: 1825f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 1826f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 182759227d5dSRichard Henderson { 1828efee3746SRichard Henderson TCGMemOpIdx oi = op->args[k++]; 182914776ab5STony Nguyen MemOp op = get_memop(oi); 183059227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 183159227d5dSRichard Henderson 183259c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 1833bdfb460eSRichard Henderson col += qemu_log(",$0x%x,%u", op, ix); 183459c4b7e8SRichard Henderson } else { 18351f00b27fSSergey Sorokin const char *s_al, *s_op; 18361f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 183759c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 1838bdfb460eSRichard Henderson col += qemu_log(",%s%s,%u", s_al, s_op, ix); 1839f713d6adSRichard Henderson } 1840f713d6adSRichard Henderson i = 1; 184159227d5dSRichard Henderson } 1842f713d6adSRichard Henderson break; 1843be210acbSRichard Henderson default: 1844f48f3edeSblueswir1 i = 0; 1845be210acbSRichard Henderson break; 1846be210acbSRichard Henderson } 184751e3972cSRichard Henderson switch (c) { 184851e3972cSRichard Henderson case INDEX_op_set_label: 184951e3972cSRichard Henderson case INDEX_op_br: 185051e3972cSRichard Henderson case INDEX_op_brcond_i32: 185151e3972cSRichard Henderson case INDEX_op_brcond_i64: 185251e3972cSRichard Henderson case INDEX_op_brcond2_i32: 1853efee3746SRichard Henderson col += qemu_log("%s$L%d", k ? "," : "", 1854efee3746SRichard Henderson arg_label(op->args[k])->id); 185551e3972cSRichard Henderson i++, k++; 185651e3972cSRichard Henderson break; 185751e3972cSRichard Henderson default: 185851e3972cSRichard Henderson break; 1859eeacee4dSBlue Swirl } 186051e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 1861efee3746SRichard Henderson col += qemu_log("%s$0x%" TCG_PRIlx, k ? "," : "", op->args[k]); 1862bdfb460eSRichard Henderson } 1863bdfb460eSRichard Henderson } 1864bdfb460eSRichard Henderson 18651894f69aSRichard Henderson if (have_prefs || op->life) { 18667606488cSRobert Foley 18677606488cSRobert Foley QemuLogFile *logfile; 18687606488cSRobert Foley 18697606488cSRobert Foley rcu_read_lock(); 1870d73415a3SStefan Hajnoczi logfile = qatomic_rcu_read(&qemu_logfile); 18717606488cSRobert Foley if (logfile) { 18721894f69aSRichard Henderson for (; col < 40; ++col) { 18737606488cSRobert Foley putc(' ', logfile->fd); 1874bdfb460eSRichard Henderson } 18751894f69aSRichard Henderson } 18767606488cSRobert Foley rcu_read_unlock(); 18777606488cSRobert Foley } 18781894f69aSRichard Henderson 18791894f69aSRichard Henderson if (op->life) { 18801894f69aSRichard Henderson unsigned life = op->life; 1881bdfb460eSRichard Henderson 1882bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 1883bdfb460eSRichard Henderson qemu_log(" sync:"); 1884bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 1885bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 1886bdfb460eSRichard Henderson qemu_log(" %d", i); 1887bdfb460eSRichard Henderson } 1888bdfb460eSRichard Henderson } 1889bdfb460eSRichard Henderson } 1890bdfb460eSRichard Henderson life /= DEAD_ARG; 1891bdfb460eSRichard Henderson if (life) { 1892bdfb460eSRichard Henderson qemu_log(" dead:"); 1893bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 1894bdfb460eSRichard Henderson if (life & 1) { 1895bdfb460eSRichard Henderson qemu_log(" %d", i); 1896bdfb460eSRichard Henderson } 1897bdfb460eSRichard Henderson } 1898c896fe29Sbellard } 1899b03cce8eSbellard } 19001894f69aSRichard Henderson 19011894f69aSRichard Henderson if (have_prefs) { 19021894f69aSRichard Henderson for (i = 0; i < nb_oargs; ++i) { 19031894f69aSRichard Henderson TCGRegSet set = op->output_pref[i]; 19041894f69aSRichard Henderson 19051894f69aSRichard Henderson if (i == 0) { 19061894f69aSRichard Henderson qemu_log(" pref="); 19071894f69aSRichard Henderson } else { 19081894f69aSRichard Henderson qemu_log(","); 19091894f69aSRichard Henderson } 19101894f69aSRichard Henderson if (set == 0) { 19111894f69aSRichard Henderson qemu_log("none"); 19121894f69aSRichard Henderson } else if (set == MAKE_64BIT_MASK(0, TCG_TARGET_NB_REGS)) { 19131894f69aSRichard Henderson qemu_log("all"); 19141894f69aSRichard Henderson #ifdef CONFIG_DEBUG_TCG 19151894f69aSRichard Henderson } else if (tcg_regset_single(set)) { 19161894f69aSRichard Henderson TCGReg reg = tcg_regset_first(set); 19171894f69aSRichard Henderson qemu_log("%s", tcg_target_reg_names[reg]); 19181894f69aSRichard Henderson #endif 19191894f69aSRichard Henderson } else if (TCG_TARGET_NB_REGS <= 32) { 19201894f69aSRichard Henderson qemu_log("%#x", (uint32_t)set); 19211894f69aSRichard Henderson } else { 19221894f69aSRichard Henderson qemu_log("%#" PRIx64, (uint64_t)set); 19231894f69aSRichard Henderson } 19241894f69aSRichard Henderson } 19251894f69aSRichard Henderson } 19261894f69aSRichard Henderson 1927eeacee4dSBlue Swirl qemu_log("\n"); 1928c896fe29Sbellard } 1929c896fe29Sbellard } 1930c896fe29Sbellard 1931c896fe29Sbellard /* we give more priority to constraints with less registers */ 1932c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 1933c896fe29Sbellard { 193474a11790SRichard Henderson const TCGArgConstraint *arg_ct = &def->args_ct[k]; 193574a11790SRichard Henderson int n; 1936c896fe29Sbellard 1937bc2b17e6SRichard Henderson if (arg_ct->oalias) { 1938c896fe29Sbellard /* an alias is equivalent to a single register */ 1939c896fe29Sbellard n = 1; 1940c896fe29Sbellard } else { 194174a11790SRichard Henderson n = ctpop64(arg_ct->regs); 1942c896fe29Sbellard } 1943c896fe29Sbellard return TCG_TARGET_NB_REGS - n + 1; 1944c896fe29Sbellard } 1945c896fe29Sbellard 1946c896fe29Sbellard /* sort from highest priority to lowest */ 1947c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 1948c896fe29Sbellard { 194966792f90SRichard Henderson int i, j; 195066792f90SRichard Henderson TCGArgConstraint *a = def->args_ct; 1951c896fe29Sbellard 195266792f90SRichard Henderson for (i = 0; i < n; i++) { 195366792f90SRichard Henderson a[start + i].sort_index = start + i; 195466792f90SRichard Henderson } 195566792f90SRichard Henderson if (n <= 1) { 1956c896fe29Sbellard return; 195766792f90SRichard Henderson } 1958c896fe29Sbellard for (i = 0; i < n - 1; i++) { 1959c896fe29Sbellard for (j = i + 1; j < n; j++) { 196066792f90SRichard Henderson int p1 = get_constraint_priority(def, a[start + i].sort_index); 196166792f90SRichard Henderson int p2 = get_constraint_priority(def, a[start + j].sort_index); 1962c896fe29Sbellard if (p1 < p2) { 196366792f90SRichard Henderson int tmp = a[start + i].sort_index; 196466792f90SRichard Henderson a[start + i].sort_index = a[start + j].sort_index; 196566792f90SRichard Henderson a[start + j].sort_index = tmp; 1966c896fe29Sbellard } 1967c896fe29Sbellard } 1968c896fe29Sbellard } 1969c896fe29Sbellard } 1970c896fe29Sbellard 1971f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 1972c896fe29Sbellard { 1973a9751609SRichard Henderson TCGOpcode op; 1974c896fe29Sbellard 1975f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 1976f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 1977f69d277eSRichard Henderson const TCGTargetOpDef *tdefs; 1978069ea736SRichard Henderson int i, nb_args; 1979f69d277eSRichard Henderson 1980f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 1981f69d277eSRichard Henderson continue; 1982f69d277eSRichard Henderson } 1983f69d277eSRichard Henderson 1984c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 1985f69d277eSRichard Henderson if (nb_args == 0) { 1986f69d277eSRichard Henderson continue; 1987f69d277eSRichard Henderson } 1988f69d277eSRichard Henderson 19894c22e840SRichard Henderson /* 19904c22e840SRichard Henderson * Macro magic should make it impossible, but double-check that 19914c22e840SRichard Henderson * the array index is in range. Since the signness of an enum 19924c22e840SRichard Henderson * is implementation defined, force the result to unsigned. 19934c22e840SRichard Henderson */ 19944c22e840SRichard Henderson unsigned con_set = tcg_target_op_def(op); 19954c22e840SRichard Henderson tcg_debug_assert(con_set < ARRAY_SIZE(constraint_sets)); 19964c22e840SRichard Henderson tdefs = &constraint_sets[con_set]; 1997f69d277eSRichard Henderson 1998c896fe29Sbellard for (i = 0; i < nb_args; i++) { 1999f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 2000f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 2001eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 2002f69d277eSRichard Henderson 200317280ff4SRichard Henderson while (*ct_str != '\0') { 200417280ff4SRichard Henderson switch(*ct_str) { 200517280ff4SRichard Henderson case '0' ... '9': 200617280ff4SRichard Henderson { 200717280ff4SRichard Henderson int oarg = *ct_str - '0'; 200817280ff4SRichard Henderson tcg_debug_assert(ct_str == tdefs->args_ct_str[i]); 2009eabb7b91SAurelien Jarno tcg_debug_assert(oarg < def->nb_oargs); 201074a11790SRichard Henderson tcg_debug_assert(def->args_ct[oarg].regs != 0); 2011c896fe29Sbellard def->args_ct[i] = def->args_ct[oarg]; 2012bc2b17e6SRichard Henderson /* The output sets oalias. */ 2013bc2b17e6SRichard Henderson def->args_ct[oarg].oalias = true; 20145ff9d6a4Sbellard def->args_ct[oarg].alias_index = i; 2015bc2b17e6SRichard Henderson /* The input sets ialias. */ 2016bc2b17e6SRichard Henderson def->args_ct[i].ialias = true; 20175ff9d6a4Sbellard def->args_ct[i].alias_index = oarg; 201817280ff4SRichard Henderson } 201917280ff4SRichard Henderson ct_str++; 2020c896fe29Sbellard break; 202182790a87SRichard Henderson case '&': 2022bc2b17e6SRichard Henderson def->args_ct[i].newreg = true; 202382790a87SRichard Henderson ct_str++; 202482790a87SRichard Henderson break; 2025c896fe29Sbellard case 'i': 2026c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 2027c896fe29Sbellard ct_str++; 2028c896fe29Sbellard break; 2029358b4923SRichard Henderson 2030358b4923SRichard Henderson /* Include all of the target-specific constraints. */ 2031358b4923SRichard Henderson 2032358b4923SRichard Henderson #undef CONST 2033358b4923SRichard Henderson #define CONST(CASE, MASK) \ 2034358b4923SRichard Henderson case CASE: def->args_ct[i].ct |= MASK; ct_str++; break; 2035358b4923SRichard Henderson #define REGS(CASE, MASK) \ 2036358b4923SRichard Henderson case CASE: def->args_ct[i].regs |= MASK; ct_str++; break; 2037358b4923SRichard Henderson 2038358b4923SRichard Henderson #include "tcg-target-con-str.h" 2039358b4923SRichard Henderson 2040358b4923SRichard Henderson #undef REGS 2041358b4923SRichard Henderson #undef CONST 2042c896fe29Sbellard default: 2043358b4923SRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 2044358b4923SRichard Henderson g_assert_not_reached(); 2045358b4923SRichard Henderson } 2046c896fe29Sbellard } 2047c896fe29Sbellard } 2048c896fe29Sbellard 2049c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? */ 2050eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 2051c68aaa18SStefan Weil 2052c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 2053c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 2054c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 2055c896fe29Sbellard } 2056c896fe29Sbellard } 2057c896fe29Sbellard 20580c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 20590c627cdcSRichard Henderson { 2060d88a117eSRichard Henderson TCGLabel *label; 2061d88a117eSRichard Henderson 2062d88a117eSRichard Henderson switch (op->opc) { 2063d88a117eSRichard Henderson case INDEX_op_br: 2064d88a117eSRichard Henderson label = arg_label(op->args[0]); 2065d88a117eSRichard Henderson label->refs--; 2066d88a117eSRichard Henderson break; 2067d88a117eSRichard Henderson case INDEX_op_brcond_i32: 2068d88a117eSRichard Henderson case INDEX_op_brcond_i64: 2069d88a117eSRichard Henderson label = arg_label(op->args[3]); 2070d88a117eSRichard Henderson label->refs--; 2071d88a117eSRichard Henderson break; 2072d88a117eSRichard Henderson case INDEX_op_brcond2_i32: 2073d88a117eSRichard Henderson label = arg_label(op->args[5]); 2074d88a117eSRichard Henderson label->refs--; 2075d88a117eSRichard Henderson break; 2076d88a117eSRichard Henderson default: 2077d88a117eSRichard Henderson break; 2078d88a117eSRichard Henderson } 2079d88a117eSRichard Henderson 208015fa08f8SRichard Henderson QTAILQ_REMOVE(&s->ops, op, link); 208115fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&s->free_ops, op, link); 2082abebf925SRichard Henderson s->nb_ops--; 20830c627cdcSRichard Henderson 20840c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 2085d73415a3SStefan Hajnoczi qatomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1); 20860c627cdcSRichard Henderson #endif 20870c627cdcSRichard Henderson } 20880c627cdcSRichard Henderson 2089a80cdd31SRichard Henderson void tcg_remove_ops_after(TCGOp *op) 2090a80cdd31SRichard Henderson { 2091a80cdd31SRichard Henderson TCGContext *s = tcg_ctx; 2092a80cdd31SRichard Henderson 2093a80cdd31SRichard Henderson while (true) { 2094a80cdd31SRichard Henderson TCGOp *last = tcg_last_op(); 2095a80cdd31SRichard Henderson if (last == op) { 2096a80cdd31SRichard Henderson return; 2097a80cdd31SRichard Henderson } 2098a80cdd31SRichard Henderson tcg_op_remove(s, last); 2099a80cdd31SRichard Henderson } 2100a80cdd31SRichard Henderson } 2101a80cdd31SRichard Henderson 210215fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc) 210315fa08f8SRichard Henderson { 210415fa08f8SRichard Henderson TCGContext *s = tcg_ctx; 210515fa08f8SRichard Henderson TCGOp *op; 210615fa08f8SRichard Henderson 210715fa08f8SRichard Henderson if (likely(QTAILQ_EMPTY(&s->free_ops))) { 210815fa08f8SRichard Henderson op = tcg_malloc(sizeof(TCGOp)); 210915fa08f8SRichard Henderson } else { 211015fa08f8SRichard Henderson op = QTAILQ_FIRST(&s->free_ops); 211115fa08f8SRichard Henderson QTAILQ_REMOVE(&s->free_ops, op, link); 211215fa08f8SRichard Henderson } 211315fa08f8SRichard Henderson memset(op, 0, offsetof(TCGOp, link)); 211415fa08f8SRichard Henderson op->opc = opc; 2115abebf925SRichard Henderson s->nb_ops++; 211615fa08f8SRichard Henderson 211715fa08f8SRichard Henderson return op; 211815fa08f8SRichard Henderson } 211915fa08f8SRichard Henderson 212015fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc) 212115fa08f8SRichard Henderson { 212215fa08f8SRichard Henderson TCGOp *op = tcg_op_alloc(opc); 212315fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link); 212415fa08f8SRichard Henderson return op; 212515fa08f8SRichard Henderson } 212615fa08f8SRichard Henderson 2127ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 21285a18407fSRichard Henderson { 212915fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 213015fa08f8SRichard Henderson QTAILQ_INSERT_BEFORE(old_op, new_op, link); 21315a18407fSRichard Henderson return new_op; 21325a18407fSRichard Henderson } 21335a18407fSRichard Henderson 2134ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 21355a18407fSRichard Henderson { 213615fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 213715fa08f8SRichard Henderson QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link); 21385a18407fSRichard Henderson return new_op; 21395a18407fSRichard Henderson } 21405a18407fSRichard Henderson 2141b4fc67c7SRichard Henderson /* Reachable analysis : remove unreachable code. */ 2142b4fc67c7SRichard Henderson static void reachable_code_pass(TCGContext *s) 2143b4fc67c7SRichard Henderson { 2144b4fc67c7SRichard Henderson TCGOp *op, *op_next; 2145b4fc67c7SRichard Henderson bool dead = false; 2146b4fc67c7SRichard Henderson 2147b4fc67c7SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 2148b4fc67c7SRichard Henderson bool remove = dead; 2149b4fc67c7SRichard Henderson TCGLabel *label; 2150b4fc67c7SRichard Henderson 2151b4fc67c7SRichard Henderson switch (op->opc) { 2152b4fc67c7SRichard Henderson case INDEX_op_set_label: 2153b4fc67c7SRichard Henderson label = arg_label(op->args[0]); 2154b4fc67c7SRichard Henderson if (label->refs == 0) { 2155b4fc67c7SRichard Henderson /* 2156b4fc67c7SRichard Henderson * While there is an occasional backward branch, virtually 2157b4fc67c7SRichard Henderson * all branches generated by the translators are forward. 2158b4fc67c7SRichard Henderson * Which means that generally we will have already removed 2159b4fc67c7SRichard Henderson * all references to the label that will be, and there is 2160b4fc67c7SRichard Henderson * little to be gained by iterating. 2161b4fc67c7SRichard Henderson */ 2162b4fc67c7SRichard Henderson remove = true; 2163b4fc67c7SRichard Henderson } else { 2164b4fc67c7SRichard Henderson /* Once we see a label, insns become live again. */ 2165b4fc67c7SRichard Henderson dead = false; 2166b4fc67c7SRichard Henderson remove = false; 2167b4fc67c7SRichard Henderson 2168b4fc67c7SRichard Henderson /* 2169b4fc67c7SRichard Henderson * Optimization can fold conditional branches to unconditional. 2170b4fc67c7SRichard Henderson * If we find a label with one reference which is preceded by 2171b4fc67c7SRichard Henderson * an unconditional branch to it, remove both. This needed to 2172b4fc67c7SRichard Henderson * wait until the dead code in between them was removed. 2173b4fc67c7SRichard Henderson */ 2174b4fc67c7SRichard Henderson if (label->refs == 1) { 2175eae3eb3eSPaolo Bonzini TCGOp *op_prev = QTAILQ_PREV(op, link); 2176b4fc67c7SRichard Henderson if (op_prev->opc == INDEX_op_br && 2177b4fc67c7SRichard Henderson label == arg_label(op_prev->args[0])) { 2178b4fc67c7SRichard Henderson tcg_op_remove(s, op_prev); 2179b4fc67c7SRichard Henderson remove = true; 2180b4fc67c7SRichard Henderson } 2181b4fc67c7SRichard Henderson } 2182b4fc67c7SRichard Henderson } 2183b4fc67c7SRichard Henderson break; 2184b4fc67c7SRichard Henderson 2185b4fc67c7SRichard Henderson case INDEX_op_br: 2186b4fc67c7SRichard Henderson case INDEX_op_exit_tb: 2187b4fc67c7SRichard Henderson case INDEX_op_goto_ptr: 2188b4fc67c7SRichard Henderson /* Unconditional branches; everything following is dead. */ 2189b4fc67c7SRichard Henderson dead = true; 2190b4fc67c7SRichard Henderson break; 2191b4fc67c7SRichard Henderson 2192b4fc67c7SRichard Henderson case INDEX_op_call: 2193b4fc67c7SRichard Henderson /* Notice noreturn helper calls, raising exceptions. */ 219490163900SRichard Henderson if (tcg_call_flags(op) & TCG_CALL_NO_RETURN) { 2195b4fc67c7SRichard Henderson dead = true; 2196b4fc67c7SRichard Henderson } 2197b4fc67c7SRichard Henderson break; 2198b4fc67c7SRichard Henderson 2199b4fc67c7SRichard Henderson case INDEX_op_insn_start: 2200b4fc67c7SRichard Henderson /* Never remove -- we need to keep these for unwind. */ 2201b4fc67c7SRichard Henderson remove = false; 2202b4fc67c7SRichard Henderson break; 2203b4fc67c7SRichard Henderson 2204b4fc67c7SRichard Henderson default: 2205b4fc67c7SRichard Henderson break; 2206b4fc67c7SRichard Henderson } 2207b4fc67c7SRichard Henderson 2208b4fc67c7SRichard Henderson if (remove) { 2209b4fc67c7SRichard Henderson tcg_op_remove(s, op); 2210b4fc67c7SRichard Henderson } 2211b4fc67c7SRichard Henderson } 2212b4fc67c7SRichard Henderson } 2213b4fc67c7SRichard Henderson 2214c70fbf0aSRichard Henderson #define TS_DEAD 1 2215c70fbf0aSRichard Henderson #define TS_MEM 2 2216c70fbf0aSRichard Henderson 22175a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 22185a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 22195a18407fSRichard Henderson 222025f49c5fSRichard Henderson /* For liveness_pass_1, the register preferences for a given temp. */ 222125f49c5fSRichard Henderson static inline TCGRegSet *la_temp_pref(TCGTemp *ts) 222225f49c5fSRichard Henderson { 222325f49c5fSRichard Henderson return ts->state_ptr; 222425f49c5fSRichard Henderson } 222525f49c5fSRichard Henderson 222625f49c5fSRichard Henderson /* For liveness_pass_1, reset the preferences for a given temp to the 222725f49c5fSRichard Henderson * maximal regset for its type. 222825f49c5fSRichard Henderson */ 222925f49c5fSRichard Henderson static inline void la_reset_pref(TCGTemp *ts) 223025f49c5fSRichard Henderson { 223125f49c5fSRichard Henderson *la_temp_pref(ts) 223225f49c5fSRichard Henderson = (ts->state == TS_DEAD ? 0 : tcg_target_available_regs[ts->type]); 223325f49c5fSRichard Henderson } 223425f49c5fSRichard Henderson 22359c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 22369c43b68dSAurelien Jarno should be in memory. */ 22372616c808SRichard Henderson static void la_func_end(TCGContext *s, int ng, int nt) 2238c896fe29Sbellard { 2239b83eabeaSRichard Henderson int i; 2240b83eabeaSRichard Henderson 2241b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2242b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 224325f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 2244b83eabeaSRichard Henderson } 2245b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2246b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD; 224725f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 2248b83eabeaSRichard Henderson } 2249c896fe29Sbellard } 2250c896fe29Sbellard 22519c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 22529c43b68dSAurelien Jarno and local temps should be in memory. */ 22532616c808SRichard Henderson static void la_bb_end(TCGContext *s, int ng, int nt) 2254641d5fbeSbellard { 2255b83eabeaSRichard Henderson int i; 2256641d5fbeSbellard 2257ee17db83SRichard Henderson for (i = 0; i < nt; ++i) { 2258ee17db83SRichard Henderson TCGTemp *ts = &s->temps[i]; 2259ee17db83SRichard Henderson int state; 2260ee17db83SRichard Henderson 2261ee17db83SRichard Henderson switch (ts->kind) { 2262ee17db83SRichard Henderson case TEMP_FIXED: 2263ee17db83SRichard Henderson case TEMP_GLOBAL: 2264ee17db83SRichard Henderson case TEMP_LOCAL: 2265ee17db83SRichard Henderson state = TS_DEAD | TS_MEM; 2266ee17db83SRichard Henderson break; 2267ee17db83SRichard Henderson case TEMP_NORMAL: 2268c0522136SRichard Henderson case TEMP_CONST: 2269ee17db83SRichard Henderson state = TS_DEAD; 2270ee17db83SRichard Henderson break; 2271ee17db83SRichard Henderson default: 2272ee17db83SRichard Henderson g_assert_not_reached(); 2273c70fbf0aSRichard Henderson } 2274ee17db83SRichard Henderson ts->state = state; 2275ee17db83SRichard Henderson la_reset_pref(ts); 2276641d5fbeSbellard } 2277641d5fbeSbellard } 2278641d5fbeSbellard 2279f65a061cSRichard Henderson /* liveness analysis: sync globals back to memory. */ 2280f65a061cSRichard Henderson static void la_global_sync(TCGContext *s, int ng) 2281f65a061cSRichard Henderson { 2282f65a061cSRichard Henderson int i; 2283f65a061cSRichard Henderson 2284f65a061cSRichard Henderson for (i = 0; i < ng; ++i) { 228525f49c5fSRichard Henderson int state = s->temps[i].state; 228625f49c5fSRichard Henderson s->temps[i].state = state | TS_MEM; 228725f49c5fSRichard Henderson if (state == TS_DEAD) { 228825f49c5fSRichard Henderson /* If the global was previously dead, reset prefs. */ 228925f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 229025f49c5fSRichard Henderson } 2291f65a061cSRichard Henderson } 2292f65a061cSRichard Henderson } 2293f65a061cSRichard Henderson 2294b4cb76e6SRichard Henderson /* 2295b4cb76e6SRichard Henderson * liveness analysis: conditional branch: all temps are dead, 2296b4cb76e6SRichard Henderson * globals and local temps should be synced. 2297b4cb76e6SRichard Henderson */ 2298b4cb76e6SRichard Henderson static void la_bb_sync(TCGContext *s, int ng, int nt) 2299b4cb76e6SRichard Henderson { 2300b4cb76e6SRichard Henderson la_global_sync(s, ng); 2301b4cb76e6SRichard Henderson 2302b4cb76e6SRichard Henderson for (int i = ng; i < nt; ++i) { 2303c0522136SRichard Henderson TCGTemp *ts = &s->temps[i]; 2304c0522136SRichard Henderson int state; 2305c0522136SRichard Henderson 2306c0522136SRichard Henderson switch (ts->kind) { 2307c0522136SRichard Henderson case TEMP_LOCAL: 2308c0522136SRichard Henderson state = ts->state; 2309c0522136SRichard Henderson ts->state = state | TS_MEM; 2310b4cb76e6SRichard Henderson if (state != TS_DEAD) { 2311b4cb76e6SRichard Henderson continue; 2312b4cb76e6SRichard Henderson } 2313c0522136SRichard Henderson break; 2314c0522136SRichard Henderson case TEMP_NORMAL: 2315b4cb76e6SRichard Henderson s->temps[i].state = TS_DEAD; 2316c0522136SRichard Henderson break; 2317c0522136SRichard Henderson case TEMP_CONST: 2318c0522136SRichard Henderson continue; 2319c0522136SRichard Henderson default: 2320c0522136SRichard Henderson g_assert_not_reached(); 2321b4cb76e6SRichard Henderson } 2322b4cb76e6SRichard Henderson la_reset_pref(&s->temps[i]); 2323b4cb76e6SRichard Henderson } 2324b4cb76e6SRichard Henderson } 2325b4cb76e6SRichard Henderson 2326f65a061cSRichard Henderson /* liveness analysis: sync globals back to memory and kill. */ 2327f65a061cSRichard Henderson static void la_global_kill(TCGContext *s, int ng) 2328f65a061cSRichard Henderson { 2329f65a061cSRichard Henderson int i; 2330f65a061cSRichard Henderson 2331f65a061cSRichard Henderson for (i = 0; i < ng; i++) { 2332f65a061cSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 233325f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 233425f49c5fSRichard Henderson } 233525f49c5fSRichard Henderson } 233625f49c5fSRichard Henderson 233725f49c5fSRichard Henderson /* liveness analysis: note live globals crossing calls. */ 233825f49c5fSRichard Henderson static void la_cross_call(TCGContext *s, int nt) 233925f49c5fSRichard Henderson { 234025f49c5fSRichard Henderson TCGRegSet mask = ~tcg_target_call_clobber_regs; 234125f49c5fSRichard Henderson int i; 234225f49c5fSRichard Henderson 234325f49c5fSRichard Henderson for (i = 0; i < nt; i++) { 234425f49c5fSRichard Henderson TCGTemp *ts = &s->temps[i]; 234525f49c5fSRichard Henderson if (!(ts->state & TS_DEAD)) { 234625f49c5fSRichard Henderson TCGRegSet *pset = la_temp_pref(ts); 234725f49c5fSRichard Henderson TCGRegSet set = *pset; 234825f49c5fSRichard Henderson 234925f49c5fSRichard Henderson set &= mask; 235025f49c5fSRichard Henderson /* If the combination is not possible, restart. */ 235125f49c5fSRichard Henderson if (set == 0) { 235225f49c5fSRichard Henderson set = tcg_target_available_regs[ts->type] & mask; 235325f49c5fSRichard Henderson } 235425f49c5fSRichard Henderson *pset = set; 235525f49c5fSRichard Henderson } 2356f65a061cSRichard Henderson } 2357f65a061cSRichard Henderson } 2358f65a061cSRichard Henderson 2359a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 2360c896fe29Sbellard given input arguments is dead. Instructions updating dead 2361c896fe29Sbellard temporaries are removed. */ 2362b83eabeaSRichard Henderson static void liveness_pass_1(TCGContext *s) 2363c896fe29Sbellard { 2364c70fbf0aSRichard Henderson int nb_globals = s->nb_globals; 23652616c808SRichard Henderson int nb_temps = s->nb_temps; 236615fa08f8SRichard Henderson TCGOp *op, *op_prev; 236725f49c5fSRichard Henderson TCGRegSet *prefs; 236825f49c5fSRichard Henderson int i; 236925f49c5fSRichard Henderson 237025f49c5fSRichard Henderson prefs = tcg_malloc(sizeof(TCGRegSet) * nb_temps); 237125f49c5fSRichard Henderson for (i = 0; i < nb_temps; ++i) { 237225f49c5fSRichard Henderson s->temps[i].state_ptr = prefs + i; 237325f49c5fSRichard Henderson } 2374c896fe29Sbellard 2375ae36a246SRichard Henderson /* ??? Should be redundant with the exit_tb that ends the TB. */ 23762616c808SRichard Henderson la_func_end(s, nb_globals, nb_temps); 2377c896fe29Sbellard 2378eae3eb3eSPaolo Bonzini QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, link, op_prev) { 237925f49c5fSRichard Henderson int nb_iargs, nb_oargs; 2380c45cb8bbSRichard Henderson TCGOpcode opc_new, opc_new2; 2381c45cb8bbSRichard Henderson bool have_opc_new2; 2382a1b3c48dSRichard Henderson TCGLifeData arg_life = 0; 238325f49c5fSRichard Henderson TCGTemp *ts; 2384c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 2385c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 2386c45cb8bbSRichard Henderson 2387c45cb8bbSRichard Henderson switch (opc) { 2388c896fe29Sbellard case INDEX_op_call: 2389c6e113f5Sbellard { 2390c6e113f5Sbellard int call_flags; 239125f49c5fSRichard Henderson int nb_call_regs; 2392c6e113f5Sbellard 2393cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2394cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 239590163900SRichard Henderson call_flags = tcg_call_flags(op); 2396c6e113f5Sbellard 2397c45cb8bbSRichard Henderson /* pure functions can be removed if their result is unused */ 239878505279SAurelien Jarno if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) { 2399c6e113f5Sbellard for (i = 0; i < nb_oargs; i++) { 240025f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 240125f49c5fSRichard Henderson if (ts->state != TS_DEAD) { 2402c6e113f5Sbellard goto do_not_remove_call; 2403c6e113f5Sbellard } 24049c43b68dSAurelien Jarno } 2405c45cb8bbSRichard Henderson goto do_remove; 2406152c35aaSRichard Henderson } 2407c6e113f5Sbellard do_not_remove_call: 2408c896fe29Sbellard 240925f49c5fSRichard Henderson /* Output args are dead. */ 2410c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 241125f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 241225f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2413a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 24146b64b624SAurelien Jarno } 241525f49c5fSRichard Henderson if (ts->state & TS_MEM) { 2416a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 24179c43b68dSAurelien Jarno } 241825f49c5fSRichard Henderson ts->state = TS_DEAD; 241925f49c5fSRichard Henderson la_reset_pref(ts); 242025f49c5fSRichard Henderson 242125f49c5fSRichard Henderson /* Not used -- it will be tcg_target_call_oarg_regs[i]. */ 242225f49c5fSRichard Henderson op->output_pref[i] = 0; 2423c896fe29Sbellard } 2424c896fe29Sbellard 242578505279SAurelien Jarno if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS | 242678505279SAurelien Jarno TCG_CALL_NO_READ_GLOBALS))) { 2427f65a061cSRichard Henderson la_global_kill(s, nb_globals); 2428c70fbf0aSRichard Henderson } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) { 2429f65a061cSRichard Henderson la_global_sync(s, nb_globals); 2430b9c18f56Saurel32 } 2431c896fe29Sbellard 243225f49c5fSRichard Henderson /* Record arguments that die in this helper. */ 2433866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 243425f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 243525f49c5fSRichard Henderson if (ts && ts->state & TS_DEAD) { 2436a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2437c896fe29Sbellard } 2438c896fe29Sbellard } 243925f49c5fSRichard Henderson 244025f49c5fSRichard Henderson /* For all live registers, remove call-clobbered prefs. */ 244125f49c5fSRichard Henderson la_cross_call(s, nb_temps); 244225f49c5fSRichard Henderson 244325f49c5fSRichard Henderson nb_call_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 244425f49c5fSRichard Henderson 244525f49c5fSRichard Henderson /* Input arguments are live for preceding opcodes. */ 244625f49c5fSRichard Henderson for (i = 0; i < nb_iargs; i++) { 244725f49c5fSRichard Henderson ts = arg_temp(op->args[i + nb_oargs]); 244825f49c5fSRichard Henderson if (ts && ts->state & TS_DEAD) { 244925f49c5fSRichard Henderson /* For those arguments that die, and will be allocated 245025f49c5fSRichard Henderson * in registers, clear the register set for that arg, 245125f49c5fSRichard Henderson * to be filled in below. For args that will be on 245225f49c5fSRichard Henderson * the stack, reset to any available reg. 245325f49c5fSRichard Henderson */ 245425f49c5fSRichard Henderson *la_temp_pref(ts) 245525f49c5fSRichard Henderson = (i < nb_call_regs ? 0 : 245625f49c5fSRichard Henderson tcg_target_available_regs[ts->type]); 245725f49c5fSRichard Henderson ts->state &= ~TS_DEAD; 245825f49c5fSRichard Henderson } 245925f49c5fSRichard Henderson } 246025f49c5fSRichard Henderson 246125f49c5fSRichard Henderson /* For each input argument, add its input register to prefs. 246225f49c5fSRichard Henderson If a temp is used once, this produces a single set bit. */ 246325f49c5fSRichard Henderson for (i = 0; i < MIN(nb_call_regs, nb_iargs); i++) { 246425f49c5fSRichard Henderson ts = arg_temp(op->args[i + nb_oargs]); 246525f49c5fSRichard Henderson if (ts) { 246625f49c5fSRichard Henderson tcg_regset_set_reg(*la_temp_pref(ts), 246725f49c5fSRichard Henderson tcg_target_call_iarg_regs[i]); 2468c70fbf0aSRichard Henderson } 2469c19f47bfSAurelien Jarno } 2470c6e113f5Sbellard } 2471c896fe29Sbellard break; 2472765b842aSRichard Henderson case INDEX_op_insn_start: 2473c896fe29Sbellard break; 24745ff9d6a4Sbellard case INDEX_op_discard: 24755ff9d6a4Sbellard /* mark the temporary as dead */ 247625f49c5fSRichard Henderson ts = arg_temp(op->args[0]); 247725f49c5fSRichard Henderson ts->state = TS_DEAD; 247825f49c5fSRichard Henderson la_reset_pref(ts); 24795ff9d6a4Sbellard break; 24801305c451SRichard Henderson 24811305c451SRichard Henderson case INDEX_op_add2_i32: 2482c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i32; 2483f1fae40cSRichard Henderson goto do_addsub2; 24841305c451SRichard Henderson case INDEX_op_sub2_i32: 2485c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i32; 2486f1fae40cSRichard Henderson goto do_addsub2; 2487f1fae40cSRichard Henderson case INDEX_op_add2_i64: 2488c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i64; 2489f1fae40cSRichard Henderson goto do_addsub2; 2490f1fae40cSRichard Henderson case INDEX_op_sub2_i64: 2491c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i64; 2492f1fae40cSRichard Henderson do_addsub2: 24931305c451SRichard Henderson nb_iargs = 4; 24941305c451SRichard Henderson nb_oargs = 2; 24951305c451SRichard Henderson /* Test if the high part of the operation is dead, but not 24961305c451SRichard Henderson the low part. The result can be optimized to a simple 24971305c451SRichard Henderson add or sub. This happens often for x86_64 guest when the 24981305c451SRichard Henderson cpu mode is set to 32 bit. */ 2499b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2500b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 25011305c451SRichard Henderson goto do_remove; 25021305c451SRichard Henderson } 2503c45cb8bbSRichard Henderson /* Replace the opcode and adjust the args in place, 2504c45cb8bbSRichard Henderson leaving 3 unused args at the end. */ 2505c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2506efee3746SRichard Henderson op->args[1] = op->args[2]; 2507efee3746SRichard Henderson op->args[2] = op->args[4]; 25081305c451SRichard Henderson /* Fall through and mark the single-word operation live. */ 25091305c451SRichard Henderson nb_iargs = 2; 25101305c451SRichard Henderson nb_oargs = 1; 25111305c451SRichard Henderson } 25121305c451SRichard Henderson goto do_not_remove; 25131305c451SRichard Henderson 25141414968aSRichard Henderson case INDEX_op_mulu2_i32: 2515c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2516c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i32; 2517c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i32; 251803271524SRichard Henderson goto do_mul2; 2519f1fae40cSRichard Henderson case INDEX_op_muls2_i32: 2520c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2521c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i32; 2522c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i32; 2523f1fae40cSRichard Henderson goto do_mul2; 2524f1fae40cSRichard Henderson case INDEX_op_mulu2_i64: 2525c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2526c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i64; 2527c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i64; 252803271524SRichard Henderson goto do_mul2; 2529f1fae40cSRichard Henderson case INDEX_op_muls2_i64: 2530c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2531c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i64; 2532c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i64; 253303271524SRichard Henderson goto do_mul2; 2534f1fae40cSRichard Henderson do_mul2: 25351414968aSRichard Henderson nb_iargs = 2; 25361414968aSRichard Henderson nb_oargs = 2; 2537b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2538b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 253903271524SRichard Henderson /* Both parts of the operation are dead. */ 25401414968aSRichard Henderson goto do_remove; 25411414968aSRichard Henderson } 254203271524SRichard Henderson /* The high part of the operation is dead; generate the low. */ 2543c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2544efee3746SRichard Henderson op->args[1] = op->args[2]; 2545efee3746SRichard Henderson op->args[2] = op->args[3]; 2546b83eabeaSRichard Henderson } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) { 254703271524SRichard Henderson /* The low part of the operation is dead; generate the high. */ 2548c45cb8bbSRichard Henderson op->opc = opc = opc_new2; 2549efee3746SRichard Henderson op->args[0] = op->args[1]; 2550efee3746SRichard Henderson op->args[1] = op->args[2]; 2551efee3746SRichard Henderson op->args[2] = op->args[3]; 255203271524SRichard Henderson } else { 255303271524SRichard Henderson goto do_not_remove; 255403271524SRichard Henderson } 255503271524SRichard Henderson /* Mark the single-word operation live. */ 25561414968aSRichard Henderson nb_oargs = 1; 25571414968aSRichard Henderson goto do_not_remove; 25581414968aSRichard Henderson 2559c896fe29Sbellard default: 25601305c451SRichard Henderson /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */ 2561c896fe29Sbellard nb_iargs = def->nb_iargs; 2562c896fe29Sbellard nb_oargs = def->nb_oargs; 2563c896fe29Sbellard 2564c896fe29Sbellard /* Test if the operation can be removed because all 25655ff9d6a4Sbellard its outputs are dead. We assume that nb_oargs == 0 25665ff9d6a4Sbellard implies side effects */ 25675ff9d6a4Sbellard if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) { 2568c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2569b83eabeaSRichard Henderson if (arg_temp(op->args[i])->state != TS_DEAD) { 2570c896fe29Sbellard goto do_not_remove; 2571c896fe29Sbellard } 25729c43b68dSAurelien Jarno } 2573152c35aaSRichard Henderson goto do_remove; 2574152c35aaSRichard Henderson } 2575152c35aaSRichard Henderson goto do_not_remove; 2576152c35aaSRichard Henderson 25771305c451SRichard Henderson do_remove: 25780c627cdcSRichard Henderson tcg_op_remove(s, op); 2579152c35aaSRichard Henderson break; 2580152c35aaSRichard Henderson 2581c896fe29Sbellard do_not_remove: 2582c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 258325f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 258425f49c5fSRichard Henderson 258525f49c5fSRichard Henderson /* Remember the preference of the uses that followed. */ 258625f49c5fSRichard Henderson op->output_pref[i] = *la_temp_pref(ts); 258725f49c5fSRichard Henderson 258825f49c5fSRichard Henderson /* Output args are dead. */ 258925f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2590a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 25916b64b624SAurelien Jarno } 259225f49c5fSRichard Henderson if (ts->state & TS_MEM) { 2593a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 25949c43b68dSAurelien Jarno } 259525f49c5fSRichard Henderson ts->state = TS_DEAD; 259625f49c5fSRichard Henderson la_reset_pref(ts); 2597c896fe29Sbellard } 2598c896fe29Sbellard 259925f49c5fSRichard Henderson /* If end of basic block, update. */ 2600ae36a246SRichard Henderson if (def->flags & TCG_OPF_BB_EXIT) { 2601ae36a246SRichard Henderson la_func_end(s, nb_globals, nb_temps); 2602b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_COND_BRANCH) { 2603b4cb76e6SRichard Henderson la_bb_sync(s, nb_globals, nb_temps); 2604ae36a246SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 26052616c808SRichard Henderson la_bb_end(s, nb_globals, nb_temps); 26063d5c5f87SAurelien Jarno } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 2607f65a061cSRichard Henderson la_global_sync(s, nb_globals); 260825f49c5fSRichard Henderson if (def->flags & TCG_OPF_CALL_CLOBBER) { 260925f49c5fSRichard Henderson la_cross_call(s, nb_temps); 261025f49c5fSRichard Henderson } 2611c896fe29Sbellard } 2612c896fe29Sbellard 261325f49c5fSRichard Henderson /* Record arguments that die in this opcode. */ 2614866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 261525f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 261625f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2617a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2618c896fe29Sbellard } 2619c19f47bfSAurelien Jarno } 262025f49c5fSRichard Henderson 262125f49c5fSRichard Henderson /* Input arguments are live for preceding opcodes. */ 2622c19f47bfSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 262325f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 262425f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 262525f49c5fSRichard Henderson /* For operands that were dead, initially allow 262625f49c5fSRichard Henderson all regs for the type. */ 262725f49c5fSRichard Henderson *la_temp_pref(ts) = tcg_target_available_regs[ts->type]; 262825f49c5fSRichard Henderson ts->state &= ~TS_DEAD; 262925f49c5fSRichard Henderson } 263025f49c5fSRichard Henderson } 263125f49c5fSRichard Henderson 263225f49c5fSRichard Henderson /* Incorporate constraints for this operand. */ 263325f49c5fSRichard Henderson switch (opc) { 263425f49c5fSRichard Henderson case INDEX_op_mov_i32: 263525f49c5fSRichard Henderson case INDEX_op_mov_i64: 263625f49c5fSRichard Henderson /* Note that these are TCG_OPF_NOT_PRESENT and do not 263725f49c5fSRichard Henderson have proper constraints. That said, special case 263825f49c5fSRichard Henderson moves to propagate preferences backward. */ 263925f49c5fSRichard Henderson if (IS_DEAD_ARG(1)) { 264025f49c5fSRichard Henderson *la_temp_pref(arg_temp(op->args[0])) 264125f49c5fSRichard Henderson = *la_temp_pref(arg_temp(op->args[1])); 264225f49c5fSRichard Henderson } 264325f49c5fSRichard Henderson break; 264425f49c5fSRichard Henderson 264525f49c5fSRichard Henderson default: 264625f49c5fSRichard Henderson for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 264725f49c5fSRichard Henderson const TCGArgConstraint *ct = &def->args_ct[i]; 264825f49c5fSRichard Henderson TCGRegSet set, *pset; 264925f49c5fSRichard Henderson 265025f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 265125f49c5fSRichard Henderson pset = la_temp_pref(ts); 265225f49c5fSRichard Henderson set = *pset; 265325f49c5fSRichard Henderson 26549be0d080SRichard Henderson set &= ct->regs; 2655bc2b17e6SRichard Henderson if (ct->ialias) { 265625f49c5fSRichard Henderson set &= op->output_pref[ct->alias_index]; 265725f49c5fSRichard Henderson } 265825f49c5fSRichard Henderson /* If the combination is not possible, restart. */ 265925f49c5fSRichard Henderson if (set == 0) { 26609be0d080SRichard Henderson set = ct->regs; 266125f49c5fSRichard Henderson } 266225f49c5fSRichard Henderson *pset = set; 266325f49c5fSRichard Henderson } 266425f49c5fSRichard Henderson break; 2665c896fe29Sbellard } 2666c896fe29Sbellard break; 2667c896fe29Sbellard } 2668bee158cbSRichard Henderson op->life = arg_life; 2669c896fe29Sbellard } 26701ff0a2c5SEvgeny Voevodin } 2671c896fe29Sbellard 26725a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries. */ 2673b83eabeaSRichard Henderson static bool liveness_pass_2(TCGContext *s) 26745a18407fSRichard Henderson { 26755a18407fSRichard Henderson int nb_globals = s->nb_globals; 267615fa08f8SRichard Henderson int nb_temps, i; 26775a18407fSRichard Henderson bool changes = false; 267815fa08f8SRichard Henderson TCGOp *op, *op_next; 26795a18407fSRichard Henderson 26805a18407fSRichard Henderson /* Create a temporary for each indirect global. */ 26815a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 26825a18407fSRichard Henderson TCGTemp *its = &s->temps[i]; 26835a18407fSRichard Henderson if (its->indirect_reg) { 26845a18407fSRichard Henderson TCGTemp *dts = tcg_temp_alloc(s); 26855a18407fSRichard Henderson dts->type = its->type; 26865a18407fSRichard Henderson dts->base_type = its->base_type; 2687b83eabeaSRichard Henderson its->state_ptr = dts; 2688b83eabeaSRichard Henderson } else { 2689b83eabeaSRichard Henderson its->state_ptr = NULL; 26905a18407fSRichard Henderson } 2691b83eabeaSRichard Henderson /* All globals begin dead. */ 2692b83eabeaSRichard Henderson its->state = TS_DEAD; 26935a18407fSRichard Henderson } 2694b83eabeaSRichard Henderson for (nb_temps = s->nb_temps; i < nb_temps; ++i) { 2695b83eabeaSRichard Henderson TCGTemp *its = &s->temps[i]; 2696b83eabeaSRichard Henderson its->state_ptr = NULL; 2697b83eabeaSRichard Henderson its->state = TS_DEAD; 2698b83eabeaSRichard Henderson } 26995a18407fSRichard Henderson 270015fa08f8SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 27015a18407fSRichard Henderson TCGOpcode opc = op->opc; 27025a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 27035a18407fSRichard Henderson TCGLifeData arg_life = op->life; 27045a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 2705b83eabeaSRichard Henderson TCGTemp *arg_ts, *dir_ts; 27065a18407fSRichard Henderson 27075a18407fSRichard Henderson if (opc == INDEX_op_call) { 2708cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2709cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 271090163900SRichard Henderson call_flags = tcg_call_flags(op); 27115a18407fSRichard Henderson } else { 27125a18407fSRichard Henderson nb_iargs = def->nb_iargs; 27135a18407fSRichard Henderson nb_oargs = def->nb_oargs; 27145a18407fSRichard Henderson 27155a18407fSRichard Henderson /* Set flags similar to how calls require. */ 2716b4cb76e6SRichard Henderson if (def->flags & TCG_OPF_COND_BRANCH) { 2717b4cb76e6SRichard Henderson /* Like reading globals: sync_globals */ 2718b4cb76e6SRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 2719b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 27205a18407fSRichard Henderson /* Like writing globals: save_globals */ 27215a18407fSRichard Henderson call_flags = 0; 27225a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 27235a18407fSRichard Henderson /* Like reading globals: sync_globals */ 27245a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 27255a18407fSRichard Henderson } else { 27265a18407fSRichard Henderson /* No effect on globals. */ 27275a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 27285a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 27295a18407fSRichard Henderson } 27305a18407fSRichard Henderson } 27315a18407fSRichard Henderson 27325a18407fSRichard Henderson /* Make sure that input arguments are available. */ 27335a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2734b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2735b83eabeaSRichard Henderson if (arg_ts) { 2736b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2737b83eabeaSRichard Henderson if (dir_ts && arg_ts->state == TS_DEAD) { 2738b83eabeaSRichard Henderson TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32 27395a18407fSRichard Henderson ? INDEX_op_ld_i32 27405a18407fSRichard Henderson : INDEX_op_ld_i64); 2741ac1043f6SEmilio G. Cota TCGOp *lop = tcg_op_insert_before(s, op, lopc); 27425a18407fSRichard Henderson 2743b83eabeaSRichard Henderson lop->args[0] = temp_arg(dir_ts); 2744b83eabeaSRichard Henderson lop->args[1] = temp_arg(arg_ts->mem_base); 2745b83eabeaSRichard Henderson lop->args[2] = arg_ts->mem_offset; 27465a18407fSRichard Henderson 27475a18407fSRichard Henderson /* Loaded, but synced with memory. */ 2748b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 27495a18407fSRichard Henderson } 27505a18407fSRichard Henderson } 27515a18407fSRichard Henderson } 27525a18407fSRichard Henderson 27535a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 27545a18407fSRichard Henderson No action is required except keeping temp_state up to date 27555a18407fSRichard Henderson so that we reload when needed. */ 27565a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2757b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2758b83eabeaSRichard Henderson if (arg_ts) { 2759b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2760b83eabeaSRichard Henderson if (dir_ts) { 2761b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 27625a18407fSRichard Henderson changes = true; 27635a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2764b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 27655a18407fSRichard Henderson } 27665a18407fSRichard Henderson } 27675a18407fSRichard Henderson } 27685a18407fSRichard Henderson } 27695a18407fSRichard Henderson 27705a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 27715a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 27725a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 27735a18407fSRichard Henderson /* Nothing to do */ 27745a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 27755a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 27765a18407fSRichard Henderson /* Liveness should see that globals are synced back, 27775a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. */ 2778b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2779b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2780b83eabeaSRichard Henderson || arg_ts->state != 0); 27815a18407fSRichard Henderson } 27825a18407fSRichard Henderson } else { 27835a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 27845a18407fSRichard Henderson /* Liveness should see that globals are saved back, 27855a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. */ 2786b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2787b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2788b83eabeaSRichard Henderson || arg_ts->state == TS_DEAD); 27895a18407fSRichard Henderson } 27905a18407fSRichard Henderson } 27915a18407fSRichard Henderson 27925a18407fSRichard Henderson /* Outputs become available. */ 279361f15c48SRichard Henderson if (opc == INDEX_op_mov_i32 || opc == INDEX_op_mov_i64) { 279461f15c48SRichard Henderson arg_ts = arg_temp(op->args[0]); 279561f15c48SRichard Henderson dir_ts = arg_ts->state_ptr; 279661f15c48SRichard Henderson if (dir_ts) { 279761f15c48SRichard Henderson op->args[0] = temp_arg(dir_ts); 279861f15c48SRichard Henderson changes = true; 279961f15c48SRichard Henderson 280061f15c48SRichard Henderson /* The output is now live and modified. */ 280161f15c48SRichard Henderson arg_ts->state = 0; 280261f15c48SRichard Henderson 280361f15c48SRichard Henderson if (NEED_SYNC_ARG(0)) { 280461f15c48SRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 280561f15c48SRichard Henderson ? INDEX_op_st_i32 280661f15c48SRichard Henderson : INDEX_op_st_i64); 280761f15c48SRichard Henderson TCGOp *sop = tcg_op_insert_after(s, op, sopc); 280861f15c48SRichard Henderson TCGTemp *out_ts = dir_ts; 280961f15c48SRichard Henderson 281061f15c48SRichard Henderson if (IS_DEAD_ARG(0)) { 281161f15c48SRichard Henderson out_ts = arg_temp(op->args[1]); 281261f15c48SRichard Henderson arg_ts->state = TS_DEAD; 281361f15c48SRichard Henderson tcg_op_remove(s, op); 281461f15c48SRichard Henderson } else { 281561f15c48SRichard Henderson arg_ts->state = TS_MEM; 281661f15c48SRichard Henderson } 281761f15c48SRichard Henderson 281861f15c48SRichard Henderson sop->args[0] = temp_arg(out_ts); 281961f15c48SRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 282061f15c48SRichard Henderson sop->args[2] = arg_ts->mem_offset; 282161f15c48SRichard Henderson } else { 282261f15c48SRichard Henderson tcg_debug_assert(!IS_DEAD_ARG(0)); 282361f15c48SRichard Henderson } 282461f15c48SRichard Henderson } 282561f15c48SRichard Henderson } else { 28265a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 2827b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2828b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2829b83eabeaSRichard Henderson if (!dir_ts) { 28305a18407fSRichard Henderson continue; 28315a18407fSRichard Henderson } 2832b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 28335a18407fSRichard Henderson changes = true; 28345a18407fSRichard Henderson 28355a18407fSRichard Henderson /* The output is now live and modified. */ 2836b83eabeaSRichard Henderson arg_ts->state = 0; 28375a18407fSRichard Henderson 28385a18407fSRichard Henderson /* Sync outputs upon their last write. */ 28395a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 2840b83eabeaSRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 28415a18407fSRichard Henderson ? INDEX_op_st_i32 28425a18407fSRichard Henderson : INDEX_op_st_i64); 2843ac1043f6SEmilio G. Cota TCGOp *sop = tcg_op_insert_after(s, op, sopc); 28445a18407fSRichard Henderson 2845b83eabeaSRichard Henderson sop->args[0] = temp_arg(dir_ts); 2846b83eabeaSRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 2847b83eabeaSRichard Henderson sop->args[2] = arg_ts->mem_offset; 28485a18407fSRichard Henderson 2849b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 28505a18407fSRichard Henderson } 28515a18407fSRichard Henderson /* Drop outputs that are dead. */ 28525a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2853b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 28545a18407fSRichard Henderson } 28555a18407fSRichard Henderson } 28565a18407fSRichard Henderson } 285761f15c48SRichard Henderson } 28585a18407fSRichard Henderson 28595a18407fSRichard Henderson return changes; 28605a18407fSRichard Henderson } 28615a18407fSRichard Henderson 28628d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2863c896fe29Sbellard static void dump_regs(TCGContext *s) 2864c896fe29Sbellard { 2865c896fe29Sbellard TCGTemp *ts; 2866c896fe29Sbellard int i; 2867c896fe29Sbellard char buf[64]; 2868c896fe29Sbellard 2869c896fe29Sbellard for(i = 0; i < s->nb_temps; i++) { 2870c896fe29Sbellard ts = &s->temps[i]; 287143439139SRichard Henderson printf(" %10s: ", tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2872c896fe29Sbellard switch(ts->val_type) { 2873c896fe29Sbellard case TEMP_VAL_REG: 2874c896fe29Sbellard printf("%s", tcg_target_reg_names[ts->reg]); 2875c896fe29Sbellard break; 2876c896fe29Sbellard case TEMP_VAL_MEM: 2877b3a62939SRichard Henderson printf("%d(%s)", (int)ts->mem_offset, 2878b3a62939SRichard Henderson tcg_target_reg_names[ts->mem_base->reg]); 2879c896fe29Sbellard break; 2880c896fe29Sbellard case TEMP_VAL_CONST: 2881bdb38b95SRichard Henderson printf("$0x%" PRIx64, ts->val); 2882c896fe29Sbellard break; 2883c896fe29Sbellard case TEMP_VAL_DEAD: 2884c896fe29Sbellard printf("D"); 2885c896fe29Sbellard break; 2886c896fe29Sbellard default: 2887c896fe29Sbellard printf("???"); 2888c896fe29Sbellard break; 2889c896fe29Sbellard } 2890c896fe29Sbellard printf("\n"); 2891c896fe29Sbellard } 2892c896fe29Sbellard 2893c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2894f8b2f202SRichard Henderson if (s->reg_to_temp[i] != NULL) { 2895c896fe29Sbellard printf("%s: %s\n", 2896c896fe29Sbellard tcg_target_reg_names[i], 2897f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i])); 2898c896fe29Sbellard } 2899c896fe29Sbellard } 2900c896fe29Sbellard } 2901c896fe29Sbellard 2902c896fe29Sbellard static void check_regs(TCGContext *s) 2903c896fe29Sbellard { 2904869938aeSRichard Henderson int reg; 2905b6638662SRichard Henderson int k; 2906c896fe29Sbellard TCGTemp *ts; 2907c896fe29Sbellard char buf[64]; 2908c896fe29Sbellard 2909c896fe29Sbellard for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) { 2910f8b2f202SRichard Henderson ts = s->reg_to_temp[reg]; 2911f8b2f202SRichard Henderson if (ts != NULL) { 2912f8b2f202SRichard Henderson if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) { 2913c896fe29Sbellard printf("Inconsistency for register %s:\n", 2914c896fe29Sbellard tcg_target_reg_names[reg]); 2915b03cce8eSbellard goto fail; 2916c896fe29Sbellard } 2917c896fe29Sbellard } 2918c896fe29Sbellard } 2919c896fe29Sbellard for (k = 0; k < s->nb_temps; k++) { 2920c896fe29Sbellard ts = &s->temps[k]; 2921ee17db83SRichard Henderson if (ts->val_type == TEMP_VAL_REG 2922ee17db83SRichard Henderson && ts->kind != TEMP_FIXED 2923f8b2f202SRichard Henderson && s->reg_to_temp[ts->reg] != ts) { 2924c896fe29Sbellard printf("Inconsistency for temp %s:\n", 2925f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2926b03cce8eSbellard fail: 2927c896fe29Sbellard printf("reg state:\n"); 2928c896fe29Sbellard dump_regs(s); 2929c896fe29Sbellard tcg_abort(); 2930c896fe29Sbellard } 2931c896fe29Sbellard } 2932c896fe29Sbellard } 2933c896fe29Sbellard #endif 2934c896fe29Sbellard 29352272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts) 2936c896fe29Sbellard { 29379b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64) 29389b9c37c3SRichard Henderson /* Sparc64 stack is accessed with offset of 2047 */ 2939b591dc59SBlue Swirl s->current_frame_offset = (s->current_frame_offset + 2940b591dc59SBlue Swirl (tcg_target_long)sizeof(tcg_target_long) - 1) & 2941b591dc59SBlue Swirl ~(sizeof(tcg_target_long) - 1); 2942f44c9960SBlue Swirl #endif 2943b591dc59SBlue Swirl if (s->current_frame_offset + (tcg_target_long)sizeof(tcg_target_long) > 2944b591dc59SBlue Swirl s->frame_end) { 29455ff9d6a4Sbellard tcg_abort(); 2946b591dc59SBlue Swirl } 2947c896fe29Sbellard ts->mem_offset = s->current_frame_offset; 2948b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 2949c896fe29Sbellard ts->mem_allocated = 1; 2950e2c6d1b4SRichard Henderson s->current_frame_offset += sizeof(tcg_target_long); 2951c896fe29Sbellard } 2952c896fe29Sbellard 2953b722452aSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet, TCGRegSet); 2954b3915dbbSRichard Henderson 295559d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 295659d7c14eSRichard Henderson mark it free; otherwise mark it dead. */ 295759d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 2958c896fe29Sbellard { 2959c0522136SRichard Henderson TCGTempVal new_type; 2960c0522136SRichard Henderson 2961c0522136SRichard Henderson switch (ts->kind) { 2962c0522136SRichard Henderson case TEMP_FIXED: 296359d7c14eSRichard Henderson return; 2964c0522136SRichard Henderson case TEMP_GLOBAL: 2965c0522136SRichard Henderson case TEMP_LOCAL: 2966c0522136SRichard Henderson new_type = TEMP_VAL_MEM; 2967c0522136SRichard Henderson break; 2968c0522136SRichard Henderson case TEMP_NORMAL: 2969c0522136SRichard Henderson new_type = free_or_dead < 0 ? TEMP_VAL_MEM : TEMP_VAL_DEAD; 2970c0522136SRichard Henderson break; 2971c0522136SRichard Henderson case TEMP_CONST: 2972c0522136SRichard Henderson new_type = TEMP_VAL_CONST; 2973c0522136SRichard Henderson break; 2974c0522136SRichard Henderson default: 2975c0522136SRichard Henderson g_assert_not_reached(); 297659d7c14eSRichard Henderson } 297759d7c14eSRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 297859d7c14eSRichard Henderson s->reg_to_temp[ts->reg] = NULL; 297959d7c14eSRichard Henderson } 2980c0522136SRichard Henderson ts->val_type = new_type; 298159d7c14eSRichard Henderson } 2982c896fe29Sbellard 298359d7c14eSRichard Henderson /* Mark a temporary as dead. */ 298459d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 298559d7c14eSRichard Henderson { 298659d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 298759d7c14eSRichard Henderson } 298859d7c14eSRichard Henderson 298959d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 299059d7c14eSRichard Henderson registers needs to be allocated to store a constant. If 'free_or_dead' 299159d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 299259d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. */ 299398b4e186SRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs, 299498b4e186SRichard Henderson TCGRegSet preferred_regs, int free_or_dead) 299559d7c14eSRichard Henderson { 2996c0522136SRichard Henderson if (!temp_readonly(ts) && !ts->mem_coherent) { 29977f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 29982272e4a7SRichard Henderson temp_allocate_frame(s, ts); 299959d7c14eSRichard Henderson } 300059d7c14eSRichard Henderson switch (ts->val_type) { 300159d7c14eSRichard Henderson case TEMP_VAL_CONST: 300259d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 300359d7c14eSRichard Henderson require it later in a register, so attempt to store the 300459d7c14eSRichard Henderson constant to memory directly. */ 300559d7c14eSRichard Henderson if (free_or_dead 300659d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 300759d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 300859d7c14eSRichard Henderson break; 300959d7c14eSRichard Henderson } 301059d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 301198b4e186SRichard Henderson allocated_regs, preferred_regs); 301259d7c14eSRichard Henderson /* fallthrough */ 301359d7c14eSRichard Henderson 301459d7c14eSRichard Henderson case TEMP_VAL_REG: 301559d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 301659d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 301759d7c14eSRichard Henderson break; 301859d7c14eSRichard Henderson 301959d7c14eSRichard Henderson case TEMP_VAL_MEM: 302059d7c14eSRichard Henderson break; 302159d7c14eSRichard Henderson 302259d7c14eSRichard Henderson case TEMP_VAL_DEAD: 302359d7c14eSRichard Henderson default: 302459d7c14eSRichard Henderson tcg_abort(); 3025c896fe29Sbellard } 30267f6ceedfSAurelien Jarno ts->mem_coherent = 1; 30277f6ceedfSAurelien Jarno } 302859d7c14eSRichard Henderson if (free_or_dead) { 302959d7c14eSRichard Henderson temp_free_or_dead(s, ts, free_or_dead); 303059d7c14eSRichard Henderson } 303159d7c14eSRichard Henderson } 30327f6ceedfSAurelien Jarno 30337f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 3034b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 30357f6ceedfSAurelien Jarno { 3036f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 3037f8b2f202SRichard Henderson if (ts != NULL) { 303898b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, -1); 3039c896fe29Sbellard } 3040c896fe29Sbellard } 3041c896fe29Sbellard 3042b016486eSRichard Henderson /** 3043b016486eSRichard Henderson * tcg_reg_alloc: 3044b016486eSRichard Henderson * @required_regs: Set of registers in which we must allocate. 3045b016486eSRichard Henderson * @allocated_regs: Set of registers which must be avoided. 3046b016486eSRichard Henderson * @preferred_regs: Set of registers we should prefer. 3047b016486eSRichard Henderson * @rev: True if we search the registers in "indirect" order. 3048b016486eSRichard Henderson * 3049b016486eSRichard Henderson * The allocated register must be in @required_regs & ~@allocated_regs, 3050b016486eSRichard Henderson * but if we can put it in @preferred_regs we may save a move later. 3051b016486eSRichard Henderson */ 3052b016486eSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet required_regs, 3053b016486eSRichard Henderson TCGRegSet allocated_regs, 3054b016486eSRichard Henderson TCGRegSet preferred_regs, bool rev) 3055c896fe29Sbellard { 3056b016486eSRichard Henderson int i, j, f, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 3057b016486eSRichard Henderson TCGRegSet reg_ct[2]; 305891478cefSRichard Henderson const int *order; 3059c896fe29Sbellard 3060b016486eSRichard Henderson reg_ct[1] = required_regs & ~allocated_regs; 3061b016486eSRichard Henderson tcg_debug_assert(reg_ct[1] != 0); 3062b016486eSRichard Henderson reg_ct[0] = reg_ct[1] & preferred_regs; 3063b016486eSRichard Henderson 3064b016486eSRichard Henderson /* Skip the preferred_regs option if it cannot be satisfied, 3065b016486eSRichard Henderson or if the preference made no difference. */ 3066b016486eSRichard Henderson f = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1]; 3067b016486eSRichard Henderson 306891478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 3069c896fe29Sbellard 3070b016486eSRichard Henderson /* Try free registers, preferences first. */ 3071b016486eSRichard Henderson for (j = f; j < 2; j++) { 3072b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 3073b016486eSRichard Henderson 3074b016486eSRichard Henderson if (tcg_regset_single(set)) { 3075b016486eSRichard Henderson /* One register in the set. */ 3076b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 3077b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL) { 3078c896fe29Sbellard return reg; 3079c896fe29Sbellard } 3080b016486eSRichard Henderson } else { 308191478cefSRichard Henderson for (i = 0; i < n; i++) { 3082b016486eSRichard Henderson TCGReg reg = order[i]; 3083b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL && 3084b016486eSRichard Henderson tcg_regset_test_reg(set, reg)) { 3085b016486eSRichard Henderson return reg; 3086b016486eSRichard Henderson } 3087b016486eSRichard Henderson } 3088b016486eSRichard Henderson } 3089b016486eSRichard Henderson } 3090b016486eSRichard Henderson 3091b016486eSRichard Henderson /* We must spill something. */ 3092b016486eSRichard Henderson for (j = f; j < 2; j++) { 3093b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 3094b016486eSRichard Henderson 3095b016486eSRichard Henderson if (tcg_regset_single(set)) { 3096b016486eSRichard Henderson /* One register in the set. */ 3097b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 3098b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3099c896fe29Sbellard return reg; 3100b016486eSRichard Henderson } else { 3101b016486eSRichard Henderson for (i = 0; i < n; i++) { 3102b016486eSRichard Henderson TCGReg reg = order[i]; 3103b016486eSRichard Henderson if (tcg_regset_test_reg(set, reg)) { 3104b016486eSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3105b016486eSRichard Henderson return reg; 3106b016486eSRichard Henderson } 3107b016486eSRichard Henderson } 3108c896fe29Sbellard } 3109c896fe29Sbellard } 3110c896fe29Sbellard 3111c896fe29Sbellard tcg_abort(); 3112c896fe29Sbellard } 3113c896fe29Sbellard 311440ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 311540ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. */ 311640ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 3117b722452aSRichard Henderson TCGRegSet allocated_regs, TCGRegSet preferred_regs) 311840ae5c62SRichard Henderson { 311940ae5c62SRichard Henderson TCGReg reg; 312040ae5c62SRichard Henderson 312140ae5c62SRichard Henderson switch (ts->val_type) { 312240ae5c62SRichard Henderson case TEMP_VAL_REG: 312340ae5c62SRichard Henderson return; 312440ae5c62SRichard Henderson case TEMP_VAL_CONST: 3125b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3126b722452aSRichard Henderson preferred_regs, ts->indirect_base); 31270a6a8bc8SRichard Henderson if (ts->type <= TCG_TYPE_I64) { 312840ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 31290a6a8bc8SRichard Henderson } else { 31304e186175SRichard Henderson uint64_t val = ts->val; 31314e186175SRichard Henderson MemOp vece = MO_64; 31324e186175SRichard Henderson 31334e186175SRichard Henderson /* 31344e186175SRichard Henderson * Find the minimal vector element that matches the constant. 31354e186175SRichard Henderson * The targets will, in general, have to do this search anyway, 31364e186175SRichard Henderson * do this generically. 31374e186175SRichard Henderson */ 31384e186175SRichard Henderson if (val == dup_const(MO_8, val)) { 31394e186175SRichard Henderson vece = MO_8; 31404e186175SRichard Henderson } else if (val == dup_const(MO_16, val)) { 31414e186175SRichard Henderson vece = MO_16; 31420b4286ddSRichard Henderson } else if (val == dup_const(MO_32, val)) { 31434e186175SRichard Henderson vece = MO_32; 31444e186175SRichard Henderson } 31454e186175SRichard Henderson 31464e186175SRichard Henderson tcg_out_dupi_vec(s, ts->type, vece, reg, ts->val); 31470a6a8bc8SRichard Henderson } 314840ae5c62SRichard Henderson ts->mem_coherent = 0; 314940ae5c62SRichard Henderson break; 315040ae5c62SRichard Henderson case TEMP_VAL_MEM: 3151b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3152b722452aSRichard Henderson preferred_regs, ts->indirect_base); 315340ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 315440ae5c62SRichard Henderson ts->mem_coherent = 1; 315540ae5c62SRichard Henderson break; 315640ae5c62SRichard Henderson case TEMP_VAL_DEAD: 315740ae5c62SRichard Henderson default: 315840ae5c62SRichard Henderson tcg_abort(); 315940ae5c62SRichard Henderson } 316040ae5c62SRichard Henderson ts->reg = reg; 316140ae5c62SRichard Henderson ts->val_type = TEMP_VAL_REG; 316240ae5c62SRichard Henderson s->reg_to_temp[reg] = ts; 316340ae5c62SRichard Henderson } 316440ae5c62SRichard Henderson 316559d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 3166e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 316759d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 31681ad80729SAurelien Jarno { 31692c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 3170eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. */ 3171e01fa97dSRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || temp_readonly(ts)); 31721ad80729SAurelien Jarno } 31731ad80729SAurelien Jarno 31749814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 3175641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 3176641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 3177641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 3178641d5fbeSbellard { 3179ac3b8891SRichard Henderson int i, n; 3180641d5fbeSbellard 3181ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 3182b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 3183641d5fbeSbellard } 3184e5097dc8Sbellard } 3185e5097dc8Sbellard 31863d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 31873d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 31883d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 31893d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 31903d5c5f87SAurelien Jarno { 3191ac3b8891SRichard Henderson int i, n; 31923d5c5f87SAurelien Jarno 3193ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 319412b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 319512b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 3196ee17db83SRichard Henderson || ts->kind == TEMP_FIXED 319712b9b11aSRichard Henderson || ts->mem_coherent); 31983d5c5f87SAurelien Jarno } 31993d5c5f87SAurelien Jarno } 32003d5c5f87SAurelien Jarno 3201e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 3202e8996ee0Sbellard all globals are stored at their canonical location. */ 3203e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 3204e5097dc8Sbellard { 3205e5097dc8Sbellard int i; 3206e5097dc8Sbellard 3207c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 3208b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 3209c0522136SRichard Henderson 3210c0522136SRichard Henderson switch (ts->kind) { 3211c0522136SRichard Henderson case TEMP_LOCAL: 3212b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 3213c0522136SRichard Henderson break; 3214c0522136SRichard Henderson case TEMP_NORMAL: 32152c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 3216eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 3217eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3218c0522136SRichard Henderson break; 3219c0522136SRichard Henderson case TEMP_CONST: 3220c0522136SRichard Henderson /* Similarly, we should have freed any allocated register. */ 3221c0522136SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_CONST); 3222c0522136SRichard Henderson break; 3223c0522136SRichard Henderson default: 3224c0522136SRichard Henderson g_assert_not_reached(); 3225c896fe29Sbellard } 3226641d5fbeSbellard } 3227e8996ee0Sbellard 3228e8996ee0Sbellard save_globals(s, allocated_regs); 3229c896fe29Sbellard } 3230c896fe29Sbellard 3231bab1671fSRichard Henderson /* 3232b4cb76e6SRichard Henderson * At a conditional branch, we assume all temporaries are dead and 3233b4cb76e6SRichard Henderson * all globals and local temps are synced to their location. 3234b4cb76e6SRichard Henderson */ 3235b4cb76e6SRichard Henderson static void tcg_reg_alloc_cbranch(TCGContext *s, TCGRegSet allocated_regs) 3236b4cb76e6SRichard Henderson { 3237b4cb76e6SRichard Henderson sync_globals(s, allocated_regs); 3238b4cb76e6SRichard Henderson 3239b4cb76e6SRichard Henderson for (int i = s->nb_globals; i < s->nb_temps; i++) { 3240b4cb76e6SRichard Henderson TCGTemp *ts = &s->temps[i]; 3241b4cb76e6SRichard Henderson /* 3242b4cb76e6SRichard Henderson * The liveness analysis already ensures that temps are dead. 3243b4cb76e6SRichard Henderson * Keep tcg_debug_asserts for safety. 3244b4cb76e6SRichard Henderson */ 3245c0522136SRichard Henderson switch (ts->kind) { 3246c0522136SRichard Henderson case TEMP_LOCAL: 3247b4cb76e6SRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG || ts->mem_coherent); 3248c0522136SRichard Henderson break; 3249c0522136SRichard Henderson case TEMP_NORMAL: 3250b4cb76e6SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3251c0522136SRichard Henderson break; 3252c0522136SRichard Henderson case TEMP_CONST: 3253c0522136SRichard Henderson break; 3254c0522136SRichard Henderson default: 3255c0522136SRichard Henderson g_assert_not_reached(); 3256b4cb76e6SRichard Henderson } 3257b4cb76e6SRichard Henderson } 3258b4cb76e6SRichard Henderson } 3259b4cb76e6SRichard Henderson 3260b4cb76e6SRichard Henderson /* 3261c58f4c97SRichard Henderson * Specialized code generation for INDEX_op_mov_* with a constant. 3262bab1671fSRichard Henderson */ 32630fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 3264ba87719cSRichard Henderson tcg_target_ulong val, TCGLifeData arg_life, 3265ba87719cSRichard Henderson TCGRegSet preferred_regs) 3266e8996ee0Sbellard { 3267d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3268e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 326959d7c14eSRichard Henderson 327059d7c14eSRichard Henderson /* The movi is not explicitly generated here. */ 3271f8b2f202SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 3272f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 3273f8b2f202SRichard Henderson } 3274e8996ee0Sbellard ots->val_type = TEMP_VAL_CONST; 3275e8996ee0Sbellard ots->val = val; 327659d7c14eSRichard Henderson ots->mem_coherent = 0; 3277ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 3278ba87719cSRichard Henderson temp_sync(s, ots, s->reserved_regs, preferred_regs, IS_DEAD_ARG(0)); 327959d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 3280f8bf00f1SRichard Henderson temp_dead(s, ots); 32814c4e1ab2SAurelien Jarno } 3282e8996ee0Sbellard } 3283e8996ee0Sbellard 3284bab1671fSRichard Henderson /* 3285bab1671fSRichard Henderson * Specialized code generation for INDEX_op_mov_*. 3286bab1671fSRichard Henderson */ 3287dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op) 3288c896fe29Sbellard { 3289dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 329069e3706dSRichard Henderson TCGRegSet allocated_regs, preferred_regs; 3291c896fe29Sbellard TCGTemp *ts, *ots; 3292450445d5SRichard Henderson TCGType otype, itype; 3293c896fe29Sbellard 3294d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 329569e3706dSRichard Henderson preferred_regs = op->output_pref[0]; 329643439139SRichard Henderson ots = arg_temp(op->args[0]); 329743439139SRichard Henderson ts = arg_temp(op->args[1]); 3298450445d5SRichard Henderson 3299d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3300e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 3301d63e3b6eSRichard Henderson 3302450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. */ 3303450445d5SRichard Henderson otype = ots->type; 3304450445d5SRichard Henderson itype = ts->type; 3305c896fe29Sbellard 33060fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 33070fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 33080fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 33090fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 33100fe4fca4SPaolo Bonzini temp_dead(s, ts); 33110fe4fca4SPaolo Bonzini } 331269e3706dSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, arg_life, preferred_regs); 33130fe4fca4SPaolo Bonzini return; 33140fe4fca4SPaolo Bonzini } 33150fe4fca4SPaolo Bonzini 33160fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 33170fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 33180fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 33190fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 33200fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 332169e3706dSRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], 332269e3706dSRichard Henderson allocated_regs, preferred_regs); 3323c29c1d7eSAurelien Jarno } 3324c29c1d7eSAurelien Jarno 33250fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 3326d63e3b6eSRichard Henderson if (IS_DEAD_ARG(0)) { 3327c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 3328c29c1d7eSAurelien Jarno liveness analysis disabled). */ 3329eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 3330c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 33312272e4a7SRichard Henderson temp_allocate_frame(s, ots); 3332c29c1d7eSAurelien Jarno } 3333b3a62939SRichard Henderson tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset); 3334c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 3335f8bf00f1SRichard Henderson temp_dead(s, ts); 3336c29c1d7eSAurelien Jarno } 3337f8bf00f1SRichard Henderson temp_dead(s, ots); 3338e8996ee0Sbellard } else { 3339ee17db83SRichard Henderson if (IS_DEAD_ARG(1) && ts->kind != TEMP_FIXED) { 3340c29c1d7eSAurelien Jarno /* the mov can be suppressed */ 3341c29c1d7eSAurelien Jarno if (ots->val_type == TEMP_VAL_REG) { 3342f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 3343c896fe29Sbellard } 3344c29c1d7eSAurelien Jarno ots->reg = ts->reg; 3345f8bf00f1SRichard Henderson temp_dead(s, ts); 3346c29c1d7eSAurelien Jarno } else { 3347c29c1d7eSAurelien Jarno if (ots->val_type != TEMP_VAL_REG) { 3348c29c1d7eSAurelien Jarno /* When allocating a new register, make sure to not spill the 3349c29c1d7eSAurelien Jarno input one. */ 3350c29c1d7eSAurelien Jarno tcg_regset_set_reg(allocated_regs, ts->reg); 3351450445d5SRichard Henderson ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 335269e3706dSRichard Henderson allocated_regs, preferred_regs, 3353b016486eSRichard Henderson ots->indirect_base); 3354c29c1d7eSAurelien Jarno } 335578113e83SRichard Henderson if (!tcg_out_mov(s, otype, ots->reg, ts->reg)) { 3356240c08d0SRichard Henderson /* 3357240c08d0SRichard Henderson * Cross register class move not supported. 3358240c08d0SRichard Henderson * Store the source register into the destination slot 3359240c08d0SRichard Henderson * and leave the destination temp as TEMP_VAL_MEM. 3360240c08d0SRichard Henderson */ 3361e01fa97dSRichard Henderson assert(!temp_readonly(ots)); 3362240c08d0SRichard Henderson if (!ts->mem_allocated) { 3363240c08d0SRichard Henderson temp_allocate_frame(s, ots); 3364240c08d0SRichard Henderson } 3365240c08d0SRichard Henderson tcg_out_st(s, ts->type, ts->reg, 3366240c08d0SRichard Henderson ots->mem_base->reg, ots->mem_offset); 3367240c08d0SRichard Henderson ots->mem_coherent = 1; 3368240c08d0SRichard Henderson temp_free_or_dead(s, ots, -1); 3369240c08d0SRichard Henderson return; 337078113e83SRichard Henderson } 3371c29c1d7eSAurelien Jarno } 3372c896fe29Sbellard ots->val_type = TEMP_VAL_REG; 3373c896fe29Sbellard ots->mem_coherent = 0; 3374f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = ots; 3375ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 337698b4e186SRichard Henderson temp_sync(s, ots, allocated_regs, 0, 0); 3377c29c1d7eSAurelien Jarno } 3378ec7a869dSAurelien Jarno } 3379c896fe29Sbellard } 3380c896fe29Sbellard 3381bab1671fSRichard Henderson /* 3382bab1671fSRichard Henderson * Specialized code generation for INDEX_op_dup_vec. 3383bab1671fSRichard Henderson */ 3384bab1671fSRichard Henderson static void tcg_reg_alloc_dup(TCGContext *s, const TCGOp *op) 3385bab1671fSRichard Henderson { 3386bab1671fSRichard Henderson const TCGLifeData arg_life = op->life; 3387bab1671fSRichard Henderson TCGRegSet dup_out_regs, dup_in_regs; 3388bab1671fSRichard Henderson TCGTemp *its, *ots; 3389bab1671fSRichard Henderson TCGType itype, vtype; 3390d6ecb4a9SRichard Henderson intptr_t endian_fixup; 3391bab1671fSRichard Henderson unsigned vece; 3392bab1671fSRichard Henderson bool ok; 3393bab1671fSRichard Henderson 3394bab1671fSRichard Henderson ots = arg_temp(op->args[0]); 3395bab1671fSRichard Henderson its = arg_temp(op->args[1]); 3396bab1671fSRichard Henderson 3397bab1671fSRichard Henderson /* ENV should not be modified. */ 3398e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 3399bab1671fSRichard Henderson 3400bab1671fSRichard Henderson itype = its->type; 3401bab1671fSRichard Henderson vece = TCGOP_VECE(op); 3402bab1671fSRichard Henderson vtype = TCGOP_VECL(op) + TCG_TYPE_V64; 3403bab1671fSRichard Henderson 3404bab1671fSRichard Henderson if (its->val_type == TEMP_VAL_CONST) { 3405bab1671fSRichard Henderson /* Propagate constant via movi -> dupi. */ 3406bab1671fSRichard Henderson tcg_target_ulong val = its->val; 3407bab1671fSRichard Henderson if (IS_DEAD_ARG(1)) { 3408bab1671fSRichard Henderson temp_dead(s, its); 3409bab1671fSRichard Henderson } 3410bab1671fSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, arg_life, op->output_pref[0]); 3411bab1671fSRichard Henderson return; 3412bab1671fSRichard Henderson } 3413bab1671fSRichard Henderson 34149be0d080SRichard Henderson dup_out_regs = tcg_op_defs[INDEX_op_dup_vec].args_ct[0].regs; 34159be0d080SRichard Henderson dup_in_regs = tcg_op_defs[INDEX_op_dup_vec].args_ct[1].regs; 3416bab1671fSRichard Henderson 3417bab1671fSRichard Henderson /* Allocate the output register now. */ 3418bab1671fSRichard Henderson if (ots->val_type != TEMP_VAL_REG) { 3419bab1671fSRichard Henderson TCGRegSet allocated_regs = s->reserved_regs; 3420bab1671fSRichard Henderson 3421bab1671fSRichard Henderson if (!IS_DEAD_ARG(1) && its->val_type == TEMP_VAL_REG) { 3422bab1671fSRichard Henderson /* Make sure to not spill the input register. */ 3423bab1671fSRichard Henderson tcg_regset_set_reg(allocated_regs, its->reg); 3424bab1671fSRichard Henderson } 3425bab1671fSRichard Henderson ots->reg = tcg_reg_alloc(s, dup_out_regs, allocated_regs, 3426bab1671fSRichard Henderson op->output_pref[0], ots->indirect_base); 3427bab1671fSRichard Henderson ots->val_type = TEMP_VAL_REG; 3428bab1671fSRichard Henderson ots->mem_coherent = 0; 3429bab1671fSRichard Henderson s->reg_to_temp[ots->reg] = ots; 3430bab1671fSRichard Henderson } 3431bab1671fSRichard Henderson 3432bab1671fSRichard Henderson switch (its->val_type) { 3433bab1671fSRichard Henderson case TEMP_VAL_REG: 3434bab1671fSRichard Henderson /* 3435bab1671fSRichard Henderson * The dup constriaints must be broad, covering all possible VECE. 3436bab1671fSRichard Henderson * However, tcg_op_dup_vec() gets to see the VECE and we allow it 3437bab1671fSRichard Henderson * to fail, indicating that extra moves are required for that case. 3438bab1671fSRichard Henderson */ 3439bab1671fSRichard Henderson if (tcg_regset_test_reg(dup_in_regs, its->reg)) { 3440bab1671fSRichard Henderson if (tcg_out_dup_vec(s, vtype, vece, ots->reg, its->reg)) { 3441bab1671fSRichard Henderson goto done; 3442bab1671fSRichard Henderson } 3443bab1671fSRichard Henderson /* Try again from memory or a vector input register. */ 3444bab1671fSRichard Henderson } 3445bab1671fSRichard Henderson if (!its->mem_coherent) { 3446bab1671fSRichard Henderson /* 3447bab1671fSRichard Henderson * The input register is not synced, and so an extra store 3448bab1671fSRichard Henderson * would be required to use memory. Attempt an integer-vector 3449bab1671fSRichard Henderson * register move first. We do not have a TCGRegSet for this. 3450bab1671fSRichard Henderson */ 3451bab1671fSRichard Henderson if (tcg_out_mov(s, itype, ots->reg, its->reg)) { 3452bab1671fSRichard Henderson break; 3453bab1671fSRichard Henderson } 3454bab1671fSRichard Henderson /* Sync the temp back to its slot and load from there. */ 3455bab1671fSRichard Henderson temp_sync(s, its, s->reserved_regs, 0, 0); 3456bab1671fSRichard Henderson } 3457bab1671fSRichard Henderson /* fall through */ 3458bab1671fSRichard Henderson 3459bab1671fSRichard Henderson case TEMP_VAL_MEM: 3460d6ecb4a9SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 3461d6ecb4a9SRichard Henderson endian_fixup = itype == TCG_TYPE_I32 ? 4 : 8; 3462d6ecb4a9SRichard Henderson endian_fixup -= 1 << vece; 3463d6ecb4a9SRichard Henderson #else 3464d6ecb4a9SRichard Henderson endian_fixup = 0; 3465d6ecb4a9SRichard Henderson #endif 3466d6ecb4a9SRichard Henderson if (tcg_out_dupm_vec(s, vtype, vece, ots->reg, its->mem_base->reg, 3467d6ecb4a9SRichard Henderson its->mem_offset + endian_fixup)) { 3468d6ecb4a9SRichard Henderson goto done; 3469d6ecb4a9SRichard Henderson } 3470bab1671fSRichard Henderson tcg_out_ld(s, itype, ots->reg, its->mem_base->reg, its->mem_offset); 3471bab1671fSRichard Henderson break; 3472bab1671fSRichard Henderson 3473bab1671fSRichard Henderson default: 3474bab1671fSRichard Henderson g_assert_not_reached(); 3475bab1671fSRichard Henderson } 3476bab1671fSRichard Henderson 3477bab1671fSRichard Henderson /* We now have a vector input register, so dup must succeed. */ 3478bab1671fSRichard Henderson ok = tcg_out_dup_vec(s, vtype, vece, ots->reg, ots->reg); 3479bab1671fSRichard Henderson tcg_debug_assert(ok); 3480bab1671fSRichard Henderson 3481bab1671fSRichard Henderson done: 3482bab1671fSRichard Henderson if (IS_DEAD_ARG(1)) { 3483bab1671fSRichard Henderson temp_dead(s, its); 3484bab1671fSRichard Henderson } 3485bab1671fSRichard Henderson if (NEED_SYNC_ARG(0)) { 3486bab1671fSRichard Henderson temp_sync(s, ots, s->reserved_regs, 0, 0); 3487bab1671fSRichard Henderson } 3488bab1671fSRichard Henderson if (IS_DEAD_ARG(0)) { 3489bab1671fSRichard Henderson temp_dead(s, ots); 3490bab1671fSRichard Henderson } 3491bab1671fSRichard Henderson } 3492bab1671fSRichard Henderson 3493dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op) 3494c896fe29Sbellard { 3495dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3496dd186292SRichard Henderson const TCGOpDef * const def = &tcg_op_defs[op->opc]; 349782790a87SRichard Henderson TCGRegSet i_allocated_regs; 349882790a87SRichard Henderson TCGRegSet o_allocated_regs; 3499b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 3500b6638662SRichard Henderson TCGReg reg; 3501c896fe29Sbellard TCGArg arg; 3502c896fe29Sbellard const TCGArgConstraint *arg_ct; 3503c896fe29Sbellard TCGTemp *ts; 3504c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 3505c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 3506c896fe29Sbellard 3507c896fe29Sbellard nb_oargs = def->nb_oargs; 3508c896fe29Sbellard nb_iargs = def->nb_iargs; 3509c896fe29Sbellard 3510c896fe29Sbellard /* copy constants */ 3511c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 3512dd186292SRichard Henderson op->args + nb_oargs + nb_iargs, 3513c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 3514c896fe29Sbellard 3515d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 3516d21369f5SRichard Henderson o_allocated_regs = s->reserved_regs; 351782790a87SRichard Henderson 3518c896fe29Sbellard /* satisfy input constraints */ 3519c896fe29Sbellard for (k = 0; k < nb_iargs; k++) { 3520d62816f2SRichard Henderson TCGRegSet i_preferred_regs, o_preferred_regs; 3521d62816f2SRichard Henderson 352266792f90SRichard Henderson i = def->args_ct[nb_oargs + k].sort_index; 3523dd186292SRichard Henderson arg = op->args[i]; 3524c896fe29Sbellard arg_ct = &def->args_ct[i]; 352543439139SRichard Henderson ts = arg_temp(arg); 352640ae5c62SRichard Henderson 352740ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 3528a4fbbd77SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct->ct)) { 3529c896fe29Sbellard /* constant is OK for instruction */ 3530c896fe29Sbellard const_args[i] = 1; 3531c896fe29Sbellard new_args[i] = ts->val; 3532d62816f2SRichard Henderson continue; 3533c896fe29Sbellard } 353440ae5c62SRichard Henderson 3535d62816f2SRichard Henderson i_preferred_regs = o_preferred_regs = 0; 3536bc2b17e6SRichard Henderson if (arg_ct->ialias) { 3537d62816f2SRichard Henderson o_preferred_regs = op->output_pref[arg_ct->alias_index]; 3538c0522136SRichard Henderson 3539c0522136SRichard Henderson /* 3540c0522136SRichard Henderson * If the input is readonly, then it cannot also be an 3541c0522136SRichard Henderson * output and aliased to itself. If the input is not 3542c0522136SRichard Henderson * dead after the instruction, we must allocate a new 3543c0522136SRichard Henderson * register and move it. 3544c0522136SRichard Henderson */ 3545c0522136SRichard Henderson if (temp_readonly(ts) || !IS_DEAD_ARG(i)) { 3546c896fe29Sbellard goto allocate_in_reg; 3547c896fe29Sbellard } 3548d62816f2SRichard Henderson 3549c0522136SRichard Henderson /* 3550c0522136SRichard Henderson * Check if the current register has already been allocated 3551c0522136SRichard Henderson * for another input aliased to an output. 3552c0522136SRichard Henderson */ 3553d62816f2SRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 3554d62816f2SRichard Henderson reg = ts->reg; 3555c0522136SRichard Henderson for (int k2 = 0; k2 < k; k2++) { 3556c0522136SRichard Henderson int i2 = def->args_ct[nb_oargs + k2].sort_index; 3557bc2b17e6SRichard Henderson if (def->args_ct[i2].ialias && reg == new_args[i2]) { 35587e1df267SAurelien Jarno goto allocate_in_reg; 35597e1df267SAurelien Jarno } 35607e1df267SAurelien Jarno } 35615ff9d6a4Sbellard } 3562d62816f2SRichard Henderson i_preferred_regs = o_preferred_regs; 3563866cb6cbSAurelien Jarno } 3564d62816f2SRichard Henderson 35659be0d080SRichard Henderson temp_load(s, ts, arg_ct->regs, i_allocated_regs, i_preferred_regs); 3566c896fe29Sbellard reg = ts->reg; 3567d62816f2SRichard Henderson 3568c0522136SRichard Henderson if (!tcg_regset_test_reg(arg_ct->regs, reg)) { 3569c896fe29Sbellard allocate_in_reg: 3570c0522136SRichard Henderson /* 3571c0522136SRichard Henderson * Allocate a new register matching the constraint 3572c0522136SRichard Henderson * and move the temporary register into it. 3573c0522136SRichard Henderson */ 3574d62816f2SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 3575d62816f2SRichard Henderson i_allocated_regs, 0); 35769be0d080SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->regs, i_allocated_regs, 3577d62816f2SRichard Henderson o_preferred_regs, ts->indirect_base); 357878113e83SRichard Henderson if (!tcg_out_mov(s, ts->type, reg, ts->reg)) { 3579240c08d0SRichard Henderson /* 3580240c08d0SRichard Henderson * Cross register class move not supported. Sync the 3581240c08d0SRichard Henderson * temp back to its slot and load from there. 3582240c08d0SRichard Henderson */ 3583240c08d0SRichard Henderson temp_sync(s, ts, i_allocated_regs, 0, 0); 3584240c08d0SRichard Henderson tcg_out_ld(s, ts->type, reg, 3585240c08d0SRichard Henderson ts->mem_base->reg, ts->mem_offset); 358678113e83SRichard Henderson } 3587c896fe29Sbellard } 3588c896fe29Sbellard new_args[i] = reg; 3589c896fe29Sbellard const_args[i] = 0; 359082790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 3591c896fe29Sbellard } 3592c896fe29Sbellard 3593c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3594866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 3595866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 359643439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3597c896fe29Sbellard } 3598c896fe29Sbellard } 3599c896fe29Sbellard 3600b4cb76e6SRichard Henderson if (def->flags & TCG_OPF_COND_BRANCH) { 3601b4cb76e6SRichard Henderson tcg_reg_alloc_cbranch(s, i_allocated_regs); 3602b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 360382790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 3604a52ad07eSAurelien Jarno } else { 3605c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 3606b03cce8eSbellard /* XXX: permit generic clobber register list ? */ 3607c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3608c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 360982790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 3610c896fe29Sbellard } 3611c896fe29Sbellard } 36123d5c5f87SAurelien Jarno } 36133d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 36143d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 36153d5c5f87SAurelien Jarno an exception. */ 361682790a87SRichard Henderson sync_globals(s, i_allocated_regs); 3617c896fe29Sbellard } 3618c896fe29Sbellard 3619c896fe29Sbellard /* satisfy the output constraints */ 3620c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 362166792f90SRichard Henderson i = def->args_ct[k].sort_index; 3622dd186292SRichard Henderson arg = op->args[i]; 3623c896fe29Sbellard arg_ct = &def->args_ct[i]; 362443439139SRichard Henderson ts = arg_temp(arg); 3625d63e3b6eSRichard Henderson 3626d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3627e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 3628d63e3b6eSRichard Henderson 3629bc2b17e6SRichard Henderson if (arg_ct->oalias && !const_args[arg_ct->alias_index]) { 36305ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 3631bc2b17e6SRichard Henderson } else if (arg_ct->newreg) { 36329be0d080SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->regs, 363382790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 363469e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3635c896fe29Sbellard } else { 36369be0d080SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->regs, o_allocated_regs, 363769e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3638c896fe29Sbellard } 363982790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 3640639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3641f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3642639368ddSAurelien Jarno } 3643c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3644c896fe29Sbellard ts->reg = reg; 3645d63e3b6eSRichard Henderson /* 3646d63e3b6eSRichard Henderson * Temp value is modified, so the value kept in memory is 3647d63e3b6eSRichard Henderson * potentially not the same. 3648d63e3b6eSRichard Henderson */ 3649c896fe29Sbellard ts->mem_coherent = 0; 3650f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3651c896fe29Sbellard new_args[i] = reg; 3652c896fe29Sbellard } 3653e8996ee0Sbellard } 3654c896fe29Sbellard 3655c896fe29Sbellard /* emit instruction */ 3656d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 3657d2fd745fSRichard Henderson tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op), 3658d2fd745fSRichard Henderson new_args, const_args); 3659d2fd745fSRichard Henderson } else { 3660dd186292SRichard Henderson tcg_out_op(s, op->opc, new_args, const_args); 3661d2fd745fSRichard Henderson } 3662c896fe29Sbellard 3663c896fe29Sbellard /* move the outputs in the correct register if needed */ 3664c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 366543439139SRichard Henderson ts = arg_temp(op->args[i]); 3666d63e3b6eSRichard Henderson 3667d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3668e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 3669d63e3b6eSRichard Henderson 3670ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 367198b4e186SRichard Henderson temp_sync(s, ts, o_allocated_regs, 0, IS_DEAD_ARG(i)); 367259d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3673f8bf00f1SRichard Henderson temp_dead(s, ts); 3674ec7a869dSAurelien Jarno } 3675c896fe29Sbellard } 3676c896fe29Sbellard } 3677c896fe29Sbellard 3678efe86b21SRichard Henderson static bool tcg_reg_alloc_dup2(TCGContext *s, const TCGOp *op) 3679efe86b21SRichard Henderson { 3680efe86b21SRichard Henderson const TCGLifeData arg_life = op->life; 3681efe86b21SRichard Henderson TCGTemp *ots, *itsl, *itsh; 3682efe86b21SRichard Henderson TCGType vtype = TCGOP_VECL(op) + TCG_TYPE_V64; 3683efe86b21SRichard Henderson 3684efe86b21SRichard Henderson /* This opcode is only valid for 32-bit hosts, for 64-bit elements. */ 3685efe86b21SRichard Henderson tcg_debug_assert(TCG_TARGET_REG_BITS == 32); 3686efe86b21SRichard Henderson tcg_debug_assert(TCGOP_VECE(op) == MO_64); 3687efe86b21SRichard Henderson 3688efe86b21SRichard Henderson ots = arg_temp(op->args[0]); 3689efe86b21SRichard Henderson itsl = arg_temp(op->args[1]); 3690efe86b21SRichard Henderson itsh = arg_temp(op->args[2]); 3691efe86b21SRichard Henderson 3692efe86b21SRichard Henderson /* ENV should not be modified. */ 3693efe86b21SRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 3694efe86b21SRichard Henderson 3695efe86b21SRichard Henderson /* Allocate the output register now. */ 3696efe86b21SRichard Henderson if (ots->val_type != TEMP_VAL_REG) { 3697efe86b21SRichard Henderson TCGRegSet allocated_regs = s->reserved_regs; 3698efe86b21SRichard Henderson TCGRegSet dup_out_regs = 3699efe86b21SRichard Henderson tcg_op_defs[INDEX_op_dup_vec].args_ct[0].regs; 3700efe86b21SRichard Henderson 3701efe86b21SRichard Henderson /* Make sure to not spill the input registers. */ 3702efe86b21SRichard Henderson if (!IS_DEAD_ARG(1) && itsl->val_type == TEMP_VAL_REG) { 3703efe86b21SRichard Henderson tcg_regset_set_reg(allocated_regs, itsl->reg); 3704efe86b21SRichard Henderson } 3705efe86b21SRichard Henderson if (!IS_DEAD_ARG(2) && itsh->val_type == TEMP_VAL_REG) { 3706efe86b21SRichard Henderson tcg_regset_set_reg(allocated_regs, itsh->reg); 3707efe86b21SRichard Henderson } 3708efe86b21SRichard Henderson 3709efe86b21SRichard Henderson ots->reg = tcg_reg_alloc(s, dup_out_regs, allocated_regs, 3710efe86b21SRichard Henderson op->output_pref[0], ots->indirect_base); 3711efe86b21SRichard Henderson ots->val_type = TEMP_VAL_REG; 3712efe86b21SRichard Henderson ots->mem_coherent = 0; 3713efe86b21SRichard Henderson s->reg_to_temp[ots->reg] = ots; 3714efe86b21SRichard Henderson } 3715efe86b21SRichard Henderson 3716efe86b21SRichard Henderson /* Promote dup2 of immediates to dupi_vec. */ 3717efe86b21SRichard Henderson if (itsl->val_type == TEMP_VAL_CONST && itsh->val_type == TEMP_VAL_CONST) { 3718efe86b21SRichard Henderson uint64_t val = deposit64(itsl->val, 32, 32, itsh->val); 3719efe86b21SRichard Henderson MemOp vece = MO_64; 3720efe86b21SRichard Henderson 3721efe86b21SRichard Henderson if (val == dup_const(MO_8, val)) { 3722efe86b21SRichard Henderson vece = MO_8; 3723efe86b21SRichard Henderson } else if (val == dup_const(MO_16, val)) { 3724efe86b21SRichard Henderson vece = MO_16; 3725efe86b21SRichard Henderson } else if (val == dup_const(MO_32, val)) { 3726efe86b21SRichard Henderson vece = MO_32; 3727efe86b21SRichard Henderson } 3728efe86b21SRichard Henderson 3729efe86b21SRichard Henderson tcg_out_dupi_vec(s, vtype, vece, ots->reg, val); 3730efe86b21SRichard Henderson goto done; 3731efe86b21SRichard Henderson } 3732efe86b21SRichard Henderson 3733efe86b21SRichard Henderson /* If the two inputs form one 64-bit value, try dupm_vec. */ 3734efe86b21SRichard Henderson if (itsl + 1 == itsh && itsl->base_type == TCG_TYPE_I64) { 3735efe86b21SRichard Henderson if (!itsl->mem_coherent) { 3736efe86b21SRichard Henderson temp_sync(s, itsl, s->reserved_regs, 0, 0); 3737efe86b21SRichard Henderson } 3738efe86b21SRichard Henderson if (!itsh->mem_coherent) { 3739efe86b21SRichard Henderson temp_sync(s, itsh, s->reserved_regs, 0, 0); 3740efe86b21SRichard Henderson } 3741efe86b21SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 3742efe86b21SRichard Henderson TCGTemp *its = itsh; 3743efe86b21SRichard Henderson #else 3744efe86b21SRichard Henderson TCGTemp *its = itsl; 3745efe86b21SRichard Henderson #endif 3746efe86b21SRichard Henderson if (tcg_out_dupm_vec(s, vtype, MO_64, ots->reg, 3747efe86b21SRichard Henderson its->mem_base->reg, its->mem_offset)) { 3748efe86b21SRichard Henderson goto done; 3749efe86b21SRichard Henderson } 3750efe86b21SRichard Henderson } 3751efe86b21SRichard Henderson 3752efe86b21SRichard Henderson /* Fall back to generic expansion. */ 3753efe86b21SRichard Henderson return false; 3754efe86b21SRichard Henderson 3755efe86b21SRichard Henderson done: 3756efe86b21SRichard Henderson if (IS_DEAD_ARG(1)) { 3757efe86b21SRichard Henderson temp_dead(s, itsl); 3758efe86b21SRichard Henderson } 3759efe86b21SRichard Henderson if (IS_DEAD_ARG(2)) { 3760efe86b21SRichard Henderson temp_dead(s, itsh); 3761efe86b21SRichard Henderson } 3762efe86b21SRichard Henderson if (NEED_SYNC_ARG(0)) { 3763efe86b21SRichard Henderson temp_sync(s, ots, s->reserved_regs, 0, IS_DEAD_ARG(0)); 3764efe86b21SRichard Henderson } else if (IS_DEAD_ARG(0)) { 3765efe86b21SRichard Henderson temp_dead(s, ots); 3766efe86b21SRichard Henderson } 3767efe86b21SRichard Henderson return true; 3768efe86b21SRichard Henderson } 3769efe86b21SRichard Henderson 3770b03cce8eSbellard #ifdef TCG_TARGET_STACK_GROWSUP 3771b03cce8eSbellard #define STACK_DIR(x) (-(x)) 3772b03cce8eSbellard #else 3773b03cce8eSbellard #define STACK_DIR(x) (x) 3774b03cce8eSbellard #endif 3775b03cce8eSbellard 3776dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op) 3777c896fe29Sbellard { 3778cd9090aaSRichard Henderson const int nb_oargs = TCGOP_CALLO(op); 3779cd9090aaSRichard Henderson const int nb_iargs = TCGOP_CALLI(op); 3780dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3781b6638662SRichard Henderson int flags, nb_regs, i; 3782b6638662SRichard Henderson TCGReg reg; 3783cf066674SRichard Henderson TCGArg arg; 3784c896fe29Sbellard TCGTemp *ts; 3785d3452f1fSRichard Henderson intptr_t stack_offset; 3786d3452f1fSRichard Henderson size_t call_stack_size; 3787cf066674SRichard Henderson tcg_insn_unit *func_addr; 3788cf066674SRichard Henderson int allocate_args; 3789c896fe29Sbellard TCGRegSet allocated_regs; 3790c896fe29Sbellard 3791*fa52e660SRichard Henderson func_addr = tcg_call_func(op); 379290163900SRichard Henderson flags = tcg_call_flags(op); 3793c896fe29Sbellard 37946e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 3795c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 3796c45cb8bbSRichard Henderson nb_regs = nb_iargs; 3797cf066674SRichard Henderson } 3798c896fe29Sbellard 3799c896fe29Sbellard /* assign stack slots first */ 3800c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 3801c896fe29Sbellard call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) & 3802c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 3803b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 3804b03cce8eSbellard if (allocate_args) { 3805345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 3806345649c0SBlue Swirl preallocate call stack */ 3807345649c0SBlue Swirl tcg_abort(); 3808b03cce8eSbellard } 380939cf05d3Sbellard 381039cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 3811c45cb8bbSRichard Henderson for (i = nb_regs; i < nb_iargs; i++) { 3812dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 381339cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP 381439cf05d3Sbellard stack_offset -= sizeof(tcg_target_long); 381539cf05d3Sbellard #endif 381639cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 381743439139SRichard Henderson ts = arg_temp(arg); 381840ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 3819b722452aSRichard Henderson s->reserved_regs, 0); 3820e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 382139cf05d3Sbellard } 382239cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP 382339cf05d3Sbellard stack_offset += sizeof(tcg_target_long); 382439cf05d3Sbellard #endif 3825c896fe29Sbellard } 3826c896fe29Sbellard 3827c896fe29Sbellard /* assign input registers */ 3828d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 3829c896fe29Sbellard for (i = 0; i < nb_regs; i++) { 3830dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 383139cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 383243439139SRichard Henderson ts = arg_temp(arg); 3833c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 383440ae5c62SRichard Henderson 3835c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 3836c896fe29Sbellard if (ts->reg != reg) { 38374250da10SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 383878113e83SRichard Henderson if (!tcg_out_mov(s, ts->type, reg, ts->reg)) { 3839240c08d0SRichard Henderson /* 3840240c08d0SRichard Henderson * Cross register class move not supported. Sync the 3841240c08d0SRichard Henderson * temp back to its slot and load from there. 3842240c08d0SRichard Henderson */ 3843240c08d0SRichard Henderson temp_sync(s, ts, allocated_regs, 0, 0); 3844240c08d0SRichard Henderson tcg_out_ld(s, ts->type, reg, 3845240c08d0SRichard Henderson ts->mem_base->reg, ts->mem_offset); 384678113e83SRichard Henderson } 3847c896fe29Sbellard } 3848c896fe29Sbellard } else { 3849ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 385040ae5c62SRichard Henderson 38514250da10SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 385240ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 3853b722452aSRichard Henderson temp_load(s, ts, arg_set, allocated_regs, 0); 3854c896fe29Sbellard } 385540ae5c62SRichard Henderson 3856c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 3857c896fe29Sbellard } 385839cf05d3Sbellard } 3859c896fe29Sbellard 3860c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3861866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 3862866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 386343439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3864c896fe29Sbellard } 3865c896fe29Sbellard } 3866c896fe29Sbellard 3867c896fe29Sbellard /* clobber call registers */ 3868c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3869c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 3870b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 3871c896fe29Sbellard } 3872c896fe29Sbellard } 3873c896fe29Sbellard 387478505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 387578505279SAurelien Jarno they might be read. */ 387678505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 387778505279SAurelien Jarno /* Nothing to do */ 387878505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 387978505279SAurelien Jarno sync_globals(s, allocated_regs); 388078505279SAurelien Jarno } else { 3881e8996ee0Sbellard save_globals(s, allocated_regs); 3882b9c18f56Saurel32 } 3883c896fe29Sbellard 3884cf066674SRichard Henderson tcg_out_call(s, func_addr); 3885c896fe29Sbellard 3886c896fe29Sbellard /* assign output registers and emit moves if needed */ 3887c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 3888dd186292SRichard Henderson arg = op->args[i]; 388943439139SRichard Henderson ts = arg_temp(arg); 3890d63e3b6eSRichard Henderson 3891d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3892e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 3893d63e3b6eSRichard Henderson 3894c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 3895eabb7b91SAurelien Jarno tcg_debug_assert(s->reg_to_temp[reg] == NULL); 3896639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3897f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3898639368ddSAurelien Jarno } 3899c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3900c896fe29Sbellard ts->reg = reg; 3901c896fe29Sbellard ts->mem_coherent = 0; 3902f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3903ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 390498b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, IS_DEAD_ARG(i)); 390559d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3906f8bf00f1SRichard Henderson temp_dead(s, ts); 3907c896fe29Sbellard } 3908c896fe29Sbellard } 39098c11ad25SAurelien Jarno } 3910c896fe29Sbellard 3911c896fe29Sbellard #ifdef CONFIG_PROFILER 3912c896fe29Sbellard 3913c3fac113SEmilio G. Cota /* avoid copy/paste errors */ 3914c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field) \ 3915c3fac113SEmilio G. Cota do { \ 3916d73415a3SStefan Hajnoczi (to)->field += qatomic_read(&((from)->field)); \ 3917c3fac113SEmilio G. Cota } while (0) 3918c896fe29Sbellard 3919c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field) \ 3920c3fac113SEmilio G. Cota do { \ 3921d73415a3SStefan Hajnoczi typeof((from)->field) val__ = qatomic_read(&((from)->field)); \ 3922c3fac113SEmilio G. Cota if (val__ > (to)->field) { \ 3923c3fac113SEmilio G. Cota (to)->field = val__; \ 3924c3fac113SEmilio G. Cota } \ 3925c3fac113SEmilio G. Cota } while (0) 3926c3fac113SEmilio G. Cota 3927c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */ 3928c3fac113SEmilio G. Cota static inline 3929c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table) 3930c896fe29Sbellard { 39310e2d61cfSRichard Henderson unsigned int n_ctxs = qatomic_read(&tcg_cur_ctxs); 3932c3fac113SEmilio G. Cota unsigned int i; 3933c3fac113SEmilio G. Cota 39343468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 3935d73415a3SStefan Hajnoczi TCGContext *s = qatomic_read(&tcg_ctxs[i]); 39363468b59eSEmilio G. Cota const TCGProfile *orig = &s->prof; 3937c3fac113SEmilio G. Cota 3938c3fac113SEmilio G. Cota if (counters) { 393972fd2efbSEmilio G. Cota PROF_ADD(prof, orig, cpu_exec_time); 3940c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count1); 3941c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count); 3942c3fac113SEmilio G. Cota PROF_ADD(prof, orig, op_count); 3943c3fac113SEmilio G. Cota PROF_MAX(prof, orig, op_count_max); 3944c3fac113SEmilio G. Cota PROF_ADD(prof, orig, temp_count); 3945c3fac113SEmilio G. Cota PROF_MAX(prof, orig, temp_count_max); 3946c3fac113SEmilio G. Cota PROF_ADD(prof, orig, del_op_count); 3947c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_in_len); 3948c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_out_len); 3949c3fac113SEmilio G. Cota PROF_ADD(prof, orig, search_out_len); 3950c3fac113SEmilio G. Cota PROF_ADD(prof, orig, interm_time); 3951c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_time); 3952c3fac113SEmilio G. Cota PROF_ADD(prof, orig, la_time); 3953c3fac113SEmilio G. Cota PROF_ADD(prof, orig, opt_time); 3954c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_count); 3955c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_time); 3956c3fac113SEmilio G. Cota } 3957c3fac113SEmilio G. Cota if (table) { 3958c896fe29Sbellard int i; 3959d70724ceSzhanghailiang 396015fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 3961c3fac113SEmilio G. Cota PROF_ADD(prof, orig, table_op_count[i]); 3962c3fac113SEmilio G. Cota } 3963c3fac113SEmilio G. Cota } 3964c3fac113SEmilio G. Cota } 3965c3fac113SEmilio G. Cota } 3966c3fac113SEmilio G. Cota 3967c3fac113SEmilio G. Cota #undef PROF_ADD 3968c3fac113SEmilio G. Cota #undef PROF_MAX 3969c3fac113SEmilio G. Cota 3970c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof) 3971c3fac113SEmilio G. Cota { 3972c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, true, false); 3973c3fac113SEmilio G. Cota } 3974c3fac113SEmilio G. Cota 3975c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof) 3976c3fac113SEmilio G. Cota { 3977c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, false, true); 3978c3fac113SEmilio G. Cota } 3979c3fac113SEmilio G. Cota 3980d4c51a0aSMarkus Armbruster void tcg_dump_op_count(void) 3981c3fac113SEmilio G. Cota { 3982c3fac113SEmilio G. Cota TCGProfile prof = {}; 3983c3fac113SEmilio G. Cota int i; 3984c3fac113SEmilio G. Cota 3985c3fac113SEmilio G. Cota tcg_profile_snapshot_table(&prof); 3986c3fac113SEmilio G. Cota for (i = 0; i < NB_OPS; i++) { 3987d4c51a0aSMarkus Armbruster qemu_printf("%s %" PRId64 "\n", tcg_op_defs[i].name, 3988c3fac113SEmilio G. Cota prof.table_op_count[i]); 3989c896fe29Sbellard } 3990c896fe29Sbellard } 399172fd2efbSEmilio G. Cota 399272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 399372fd2efbSEmilio G. Cota { 39940e2d61cfSRichard Henderson unsigned int n_ctxs = qatomic_read(&tcg_cur_ctxs); 399572fd2efbSEmilio G. Cota unsigned int i; 399672fd2efbSEmilio G. Cota int64_t ret = 0; 399772fd2efbSEmilio G. Cota 399872fd2efbSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 3999d73415a3SStefan Hajnoczi const TCGContext *s = qatomic_read(&tcg_ctxs[i]); 400072fd2efbSEmilio G. Cota const TCGProfile *prof = &s->prof; 400172fd2efbSEmilio G. Cota 4002d73415a3SStefan Hajnoczi ret += qatomic_read(&prof->cpu_exec_time); 400372fd2efbSEmilio G. Cota } 400472fd2efbSEmilio G. Cota return ret; 400572fd2efbSEmilio G. Cota } 4006246ae24dSMax Filippov #else 4007d4c51a0aSMarkus Armbruster void tcg_dump_op_count(void) 4008246ae24dSMax Filippov { 4009d4c51a0aSMarkus Armbruster qemu_printf("[TCG profiler not compiled]\n"); 4010246ae24dSMax Filippov } 401172fd2efbSEmilio G. Cota 401272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 401372fd2efbSEmilio G. Cota { 401472fd2efbSEmilio G. Cota error_report("%s: TCG profiler not compiled", __func__); 401572fd2efbSEmilio G. Cota exit(EXIT_FAILURE); 401672fd2efbSEmilio G. Cota } 4017c896fe29Sbellard #endif 4018c896fe29Sbellard 4019c896fe29Sbellard 40205bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb) 4021c896fe29Sbellard { 4022c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER 4023c3fac113SEmilio G. Cota TCGProfile *prof = &s->prof; 4024c3fac113SEmilio G. Cota #endif 402515fa08f8SRichard Henderson int i, num_insns; 402615fa08f8SRichard Henderson TCGOp *op; 4027c896fe29Sbellard 402804fe6400SRichard Henderson #ifdef CONFIG_PROFILER 402904fe6400SRichard Henderson { 4030c1f543b7SEmilio G. Cota int n = 0; 403104fe6400SRichard Henderson 403215fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 403315fa08f8SRichard Henderson n++; 403415fa08f8SRichard Henderson } 4035d73415a3SStefan Hajnoczi qatomic_set(&prof->op_count, prof->op_count + n); 4036c3fac113SEmilio G. Cota if (n > prof->op_count_max) { 4037d73415a3SStefan Hajnoczi qatomic_set(&prof->op_count_max, n); 403804fe6400SRichard Henderson } 403904fe6400SRichard Henderson 404004fe6400SRichard Henderson n = s->nb_temps; 4041d73415a3SStefan Hajnoczi qatomic_set(&prof->temp_count, prof->temp_count + n); 4042c3fac113SEmilio G. Cota if (n > prof->temp_count_max) { 4043d73415a3SStefan Hajnoczi qatomic_set(&prof->temp_count_max, n); 404404fe6400SRichard Henderson } 404504fe6400SRichard Henderson } 404604fe6400SRichard Henderson #endif 404704fe6400SRichard Henderson 4048c896fe29Sbellard #ifdef DEBUG_DISAS 4049d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 4050d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 4051fc59d2d8SRobert Foley FILE *logfile = qemu_log_lock(); 405293fcfe39Saliguori qemu_log("OP:\n"); 40531894f69aSRichard Henderson tcg_dump_ops(s, false); 405493fcfe39Saliguori qemu_log("\n"); 4055fc59d2d8SRobert Foley qemu_log_unlock(logfile); 4056c896fe29Sbellard } 4057c896fe29Sbellard #endif 4058c896fe29Sbellard 4059bef16ab4SRichard Henderson #ifdef CONFIG_DEBUG_TCG 4060bef16ab4SRichard Henderson /* Ensure all labels referenced have been emitted. */ 4061bef16ab4SRichard Henderson { 4062bef16ab4SRichard Henderson TCGLabel *l; 4063bef16ab4SRichard Henderson bool error = false; 4064bef16ab4SRichard Henderson 4065bef16ab4SRichard Henderson QSIMPLEQ_FOREACH(l, &s->labels, next) { 4066bef16ab4SRichard Henderson if (unlikely(!l->present) && l->refs) { 4067bef16ab4SRichard Henderson qemu_log_mask(CPU_LOG_TB_OP, 4068bef16ab4SRichard Henderson "$L%d referenced but not present.\n", l->id); 4069bef16ab4SRichard Henderson error = true; 4070bef16ab4SRichard Henderson } 4071bef16ab4SRichard Henderson } 4072bef16ab4SRichard Henderson assert(!error); 4073bef16ab4SRichard Henderson } 4074bef16ab4SRichard Henderson #endif 4075bef16ab4SRichard Henderson 4076c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 4077d73415a3SStefan Hajnoczi qatomic_set(&prof->opt_time, prof->opt_time - profile_getclock()); 4078c5cc28ffSAurelien Jarno #endif 4079c5cc28ffSAurelien Jarno 40808f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 4081c45cb8bbSRichard Henderson tcg_optimize(s); 40828f2e8c07SKirill Batuzov #endif 40838f2e8c07SKirill Batuzov 4084a23a9ec6Sbellard #ifdef CONFIG_PROFILER 4085d73415a3SStefan Hajnoczi qatomic_set(&prof->opt_time, prof->opt_time + profile_getclock()); 4086d73415a3SStefan Hajnoczi qatomic_set(&prof->la_time, prof->la_time - profile_getclock()); 4087a23a9ec6Sbellard #endif 4088c5cc28ffSAurelien Jarno 4089b4fc67c7SRichard Henderson reachable_code_pass(s); 4090b83eabeaSRichard Henderson liveness_pass_1(s); 40915a18407fSRichard Henderson 40925a18407fSRichard Henderson if (s->nb_indirects > 0) { 40935a18407fSRichard Henderson #ifdef DEBUG_DISAS 40945a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 40955a18407fSRichard Henderson && qemu_log_in_addr_range(tb->pc))) { 4096fc59d2d8SRobert Foley FILE *logfile = qemu_log_lock(); 40975a18407fSRichard Henderson qemu_log("OP before indirect lowering:\n"); 40981894f69aSRichard Henderson tcg_dump_ops(s, false); 40995a18407fSRichard Henderson qemu_log("\n"); 4100fc59d2d8SRobert Foley qemu_log_unlock(logfile); 41015a18407fSRichard Henderson } 41025a18407fSRichard Henderson #endif 41035a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 4104b83eabeaSRichard Henderson if (liveness_pass_2(s)) { 41055a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 4106b83eabeaSRichard Henderson liveness_pass_1(s); 41075a18407fSRichard Henderson } 41085a18407fSRichard Henderson } 4109c5cc28ffSAurelien Jarno 4110a23a9ec6Sbellard #ifdef CONFIG_PROFILER 4111d73415a3SStefan Hajnoczi qatomic_set(&prof->la_time, prof->la_time + profile_getclock()); 4112a23a9ec6Sbellard #endif 4113c896fe29Sbellard 4114c896fe29Sbellard #ifdef DEBUG_DISAS 4115d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 4116d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 4117fc59d2d8SRobert Foley FILE *logfile = qemu_log_lock(); 4118c5cc28ffSAurelien Jarno qemu_log("OP after optimization and liveness analysis:\n"); 41191894f69aSRichard Henderson tcg_dump_ops(s, true); 412093fcfe39Saliguori qemu_log("\n"); 4121fc59d2d8SRobert Foley qemu_log_unlock(logfile); 4122c896fe29Sbellard } 4123c896fe29Sbellard #endif 4124c896fe29Sbellard 4125c896fe29Sbellard tcg_reg_alloc_start(s); 4126c896fe29Sbellard 4127db0c51a3SRichard Henderson /* 4128db0c51a3SRichard Henderson * Reset the buffer pointers when restarting after overflow. 4129db0c51a3SRichard Henderson * TODO: Move this into translate-all.c with the rest of the 4130db0c51a3SRichard Henderson * buffer management. Having only this done here is confusing. 4131db0c51a3SRichard Henderson */ 4132db0c51a3SRichard Henderson s->code_buf = tcg_splitwx_to_rw(tb->tc.ptr); 4133db0c51a3SRichard Henderson s->code_ptr = s->code_buf; 4134c896fe29Sbellard 4135659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 41366001f772SLaurent Vivier QSIMPLEQ_INIT(&s->ldst_labels); 4137659ef5cbSRichard Henderson #endif 413857a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 413957a26946SRichard Henderson s->pool_labels = NULL; 414057a26946SRichard Henderson #endif 41419ecefc84SRichard Henderson 4142fca8a500SRichard Henderson num_insns = -1; 414315fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 4144c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 4145b3db8758Sblueswir1 4146c896fe29Sbellard #ifdef CONFIG_PROFILER 4147d73415a3SStefan Hajnoczi qatomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1); 4148c896fe29Sbellard #endif 4149c45cb8bbSRichard Henderson 4150c896fe29Sbellard switch (opc) { 4151c896fe29Sbellard case INDEX_op_mov_i32: 4152c896fe29Sbellard case INDEX_op_mov_i64: 4153d2fd745fSRichard Henderson case INDEX_op_mov_vec: 4154dd186292SRichard Henderson tcg_reg_alloc_mov(s, op); 4155c896fe29Sbellard break; 4156bab1671fSRichard Henderson case INDEX_op_dup_vec: 4157bab1671fSRichard Henderson tcg_reg_alloc_dup(s, op); 4158bab1671fSRichard Henderson break; 4159765b842aSRichard Henderson case INDEX_op_insn_start: 4160fca8a500SRichard Henderson if (num_insns >= 0) { 41619f754620SRichard Henderson size_t off = tcg_current_code_size(s); 41629f754620SRichard Henderson s->gen_insn_end_off[num_insns] = off; 41639f754620SRichard Henderson /* Assert that we do not overflow our stored offset. */ 41649f754620SRichard Henderson assert(s->gen_insn_end_off[num_insns] == off); 4165fca8a500SRichard Henderson } 4166fca8a500SRichard Henderson num_insns++; 4167bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 4168bad729e2SRichard Henderson target_ulong a; 4169bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 4170efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 4171bad729e2SRichard Henderson #else 4172efee3746SRichard Henderson a = op->args[i]; 4173bad729e2SRichard Henderson #endif 4174fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 4175bad729e2SRichard Henderson } 4176c896fe29Sbellard break; 41775ff9d6a4Sbellard case INDEX_op_discard: 417843439139SRichard Henderson temp_dead(s, arg_temp(op->args[0])); 41795ff9d6a4Sbellard break; 4180c896fe29Sbellard case INDEX_op_set_label: 4181e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 418292ab8e7dSRichard Henderson tcg_out_label(s, arg_label(op->args[0])); 4183c896fe29Sbellard break; 4184c896fe29Sbellard case INDEX_op_call: 4185dd186292SRichard Henderson tcg_reg_alloc_call(s, op); 4186c45cb8bbSRichard Henderson break; 4187efe86b21SRichard Henderson case INDEX_op_dup2_vec: 4188efe86b21SRichard Henderson if (tcg_reg_alloc_dup2(s, op)) { 4189efe86b21SRichard Henderson break; 4190efe86b21SRichard Henderson } 4191efe86b21SRichard Henderson /* fall through */ 4192c896fe29Sbellard default: 419325c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. */ 4194be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 4195c896fe29Sbellard /* Note: in order to speed up the code, it would be much 4196c896fe29Sbellard faster to have specialized register allocator functions for 4197c896fe29Sbellard some common argument patterns */ 4198dd186292SRichard Henderson tcg_reg_alloc_op(s, op); 4199c896fe29Sbellard break; 4200c896fe29Sbellard } 42018d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 4202c896fe29Sbellard check_regs(s); 4203c896fe29Sbellard #endif 4204b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. The assumption is that any 4205b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 4206b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 4207b125f9dcSRichard Henderson generating code without having to check during generation. */ 4208644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 4209b125f9dcSRichard Henderson return -1; 4210b125f9dcSRichard Henderson } 42116e6c4efeSRichard Henderson /* Test for TB overflow, as seen by gen_insn_end_off. */ 42126e6c4efeSRichard Henderson if (unlikely(tcg_current_code_size(s) > UINT16_MAX)) { 42136e6c4efeSRichard Henderson return -2; 42146e6c4efeSRichard Henderson } 4215c896fe29Sbellard } 4216fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 4217fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 4218c45cb8bbSRichard Henderson 4219b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 4220659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 4221aeee05f5SRichard Henderson i = tcg_out_ldst_finalize(s); 4222aeee05f5SRichard Henderson if (i < 0) { 4223aeee05f5SRichard Henderson return i; 422423dceda6SRichard Henderson } 4225659ef5cbSRichard Henderson #endif 422657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 42271768987bSRichard Henderson i = tcg_out_pool_finalize(s); 42281768987bSRichard Henderson if (i < 0) { 42291768987bSRichard Henderson return i; 423057a26946SRichard Henderson } 423157a26946SRichard Henderson #endif 42327ecd02a0SRichard Henderson if (!tcg_resolve_relocs(s)) { 42337ecd02a0SRichard Henderson return -2; 42347ecd02a0SRichard Henderson } 4235c896fe29Sbellard 4236df5d2b16SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 4237c896fe29Sbellard /* flush instruction cache */ 4238db0c51a3SRichard Henderson flush_idcache_range((uintptr_t)tcg_splitwx_to_rx(s->code_buf), 4239db0c51a3SRichard Henderson (uintptr_t)s->code_buf, 42401da8de39SRichard Henderson tcg_ptr_byte_diff(s->code_ptr, s->code_buf)); 4241df5d2b16SRichard Henderson #endif 42422aeabc08SStefan Weil 42431813e175SRichard Henderson return tcg_current_code_size(s); 4244c896fe29Sbellard } 4245c896fe29Sbellard 4246a23a9ec6Sbellard #ifdef CONFIG_PROFILER 42473de2faa9SMarkus Armbruster void tcg_dump_info(void) 4248a23a9ec6Sbellard { 4249c3fac113SEmilio G. Cota TCGProfile prof = {}; 4250c3fac113SEmilio G. Cota const TCGProfile *s; 4251c3fac113SEmilio G. Cota int64_t tb_count; 4252c3fac113SEmilio G. Cota int64_t tb_div_count; 4253c3fac113SEmilio G. Cota int64_t tot; 4254c3fac113SEmilio G. Cota 4255c3fac113SEmilio G. Cota tcg_profile_snapshot_counters(&prof); 4256c3fac113SEmilio G. Cota s = &prof; 4257c3fac113SEmilio G. Cota tb_count = s->tb_count; 4258c3fac113SEmilio G. Cota tb_div_count = tb_count ? tb_count : 1; 4259c3fac113SEmilio G. Cota tot = s->interm_time + s->code_time; 4260a23a9ec6Sbellard 42613de2faa9SMarkus Armbruster qemu_printf("JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n", 4262a23a9ec6Sbellard tot, tot / 2.4e9); 42633de2faa9SMarkus Armbruster qemu_printf("translated TBs %" PRId64 " (aborted=%" PRId64 42643de2faa9SMarkus Armbruster " %0.1f%%)\n", 4265fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 4266fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 4267fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 42683de2faa9SMarkus Armbruster qemu_printf("avg ops/TB %0.1f max=%d\n", 4269fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 42703de2faa9SMarkus Armbruster qemu_printf("deleted ops/TB %0.2f\n", 4271fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 42723de2faa9SMarkus Armbruster qemu_printf("avg temps/TB %0.2f max=%d\n", 4273fca8a500SRichard Henderson (double)s->temp_count / tb_div_count, s->temp_count_max); 42743de2faa9SMarkus Armbruster qemu_printf("avg host code/TB %0.1f\n", 4275fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 42763de2faa9SMarkus Armbruster qemu_printf("avg search data/TB %0.1f\n", 4277fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 4278a23a9ec6Sbellard 42793de2faa9SMarkus Armbruster qemu_printf("cycles/op %0.1f\n", 4280a23a9ec6Sbellard s->op_count ? (double)tot / s->op_count : 0); 42813de2faa9SMarkus Armbruster qemu_printf("cycles/in byte %0.1f\n", 4282a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 42833de2faa9SMarkus Armbruster qemu_printf("cycles/out byte %0.1f\n", 4284a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 42853de2faa9SMarkus Armbruster qemu_printf("cycles/search byte %0.1f\n", 4286fca8a500SRichard Henderson s->search_out_len ? (double)tot / s->search_out_len : 0); 4287fca8a500SRichard Henderson if (tot == 0) { 4288a23a9ec6Sbellard tot = 1; 4289fca8a500SRichard Henderson } 42903de2faa9SMarkus Armbruster qemu_printf(" gen_interm time %0.1f%%\n", 4291a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 42923de2faa9SMarkus Armbruster qemu_printf(" gen_code time %0.1f%%\n", 4293a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 42943de2faa9SMarkus Armbruster qemu_printf("optim./code time %0.1f%%\n", 4295c5cc28ffSAurelien Jarno (double)s->opt_time / (s->code_time ? s->code_time : 1) 4296c5cc28ffSAurelien Jarno * 100.0); 42973de2faa9SMarkus Armbruster qemu_printf("liveness/code time %0.1f%%\n", 4298a23a9ec6Sbellard (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0); 42993de2faa9SMarkus Armbruster qemu_printf("cpu_restore count %" PRId64 "\n", 4300a23a9ec6Sbellard s->restore_count); 43013de2faa9SMarkus Armbruster qemu_printf(" avg cycles %0.1f\n", 4302a23a9ec6Sbellard s->restore_count ? (double)s->restore_time / s->restore_count : 0); 4303a23a9ec6Sbellard } 4304a23a9ec6Sbellard #else 43053de2faa9SMarkus Armbruster void tcg_dump_info(void) 4306a23a9ec6Sbellard { 43073de2faa9SMarkus Armbruster qemu_printf("[TCG profiler not compiled]\n"); 4308a23a9ec6Sbellard } 4309a23a9ec6Sbellard #endif 4310813da627SRichard Henderson 4311813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 43125872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 43135872bbf2SRichard Henderson 43145872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 43155872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 43165872bbf2SRichard Henderson 43175872bbf2SRichard Henderson (2) Define tcg_register_jit. This should create a buffer containing 43185872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 43195872bbf2SRichard Henderson prologue unwind info for the tcg machine. 43205872bbf2SRichard Henderson 43215872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 43225872bbf2SRichard Henderson */ 4323813da627SRichard Henderson 4324813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */ 4325813da627SRichard Henderson typedef enum { 4326813da627SRichard Henderson JIT_NOACTION = 0, 4327813da627SRichard Henderson JIT_REGISTER_FN, 4328813da627SRichard Henderson JIT_UNREGISTER_FN 4329813da627SRichard Henderson } jit_actions_t; 4330813da627SRichard Henderson 4331813da627SRichard Henderson struct jit_code_entry { 4332813da627SRichard Henderson struct jit_code_entry *next_entry; 4333813da627SRichard Henderson struct jit_code_entry *prev_entry; 4334813da627SRichard Henderson const void *symfile_addr; 4335813da627SRichard Henderson uint64_t symfile_size; 4336813da627SRichard Henderson }; 4337813da627SRichard Henderson 4338813da627SRichard Henderson struct jit_descriptor { 4339813da627SRichard Henderson uint32_t version; 4340813da627SRichard Henderson uint32_t action_flag; 4341813da627SRichard Henderson struct jit_code_entry *relevant_entry; 4342813da627SRichard Henderson struct jit_code_entry *first_entry; 4343813da627SRichard Henderson }; 4344813da627SRichard Henderson 4345813da627SRichard Henderson void __jit_debug_register_code(void) __attribute__((noinline)); 4346813da627SRichard Henderson void __jit_debug_register_code(void) 4347813da627SRichard Henderson { 4348813da627SRichard Henderson asm(""); 4349813da627SRichard Henderson } 4350813da627SRichard Henderson 4351813da627SRichard Henderson /* Must statically initialize the version, because GDB may check 4352813da627SRichard Henderson the version before we can set it. */ 4353813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 }; 4354813da627SRichard Henderson 4355813da627SRichard Henderson /* End GDB interface. */ 4356813da627SRichard Henderson 4357813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 4358813da627SRichard Henderson { 4359813da627SRichard Henderson const char *p = strtab + 1; 4360813da627SRichard Henderson 4361813da627SRichard Henderson while (1) { 4362813da627SRichard Henderson if (strcmp(p, str) == 0) { 4363813da627SRichard Henderson return p - strtab; 4364813da627SRichard Henderson } 4365813da627SRichard Henderson p += strlen(p) + 1; 4366813da627SRichard Henderson } 4367813da627SRichard Henderson } 4368813da627SRichard Henderson 4369755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf_ptr, size_t buf_size, 43702c90784aSRichard Henderson const void *debug_frame, 43712c90784aSRichard Henderson size_t debug_frame_size) 4372813da627SRichard Henderson { 43735872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 43745872bbf2SRichard Henderson uint32_t len; 43755872bbf2SRichard Henderson uint16_t version; 43765872bbf2SRichard Henderson uint32_t abbrev; 43775872bbf2SRichard Henderson uint8_t ptr_size; 43785872bbf2SRichard Henderson uint8_t cu_die; 43795872bbf2SRichard Henderson uint16_t cu_lang; 43805872bbf2SRichard Henderson uintptr_t cu_low_pc; 43815872bbf2SRichard Henderson uintptr_t cu_high_pc; 43825872bbf2SRichard Henderson uint8_t fn_die; 43835872bbf2SRichard Henderson char fn_name[16]; 43845872bbf2SRichard Henderson uintptr_t fn_low_pc; 43855872bbf2SRichard Henderson uintptr_t fn_high_pc; 43865872bbf2SRichard Henderson uint8_t cu_eoc; 43875872bbf2SRichard Henderson }; 4388813da627SRichard Henderson 4389813da627SRichard Henderson struct ElfImage { 4390813da627SRichard Henderson ElfW(Ehdr) ehdr; 4391813da627SRichard Henderson ElfW(Phdr) phdr; 43925872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 43935872bbf2SRichard Henderson ElfW(Sym) sym[2]; 43945872bbf2SRichard Henderson struct DebugInfo di; 43955872bbf2SRichard Henderson uint8_t da[24]; 43965872bbf2SRichard Henderson char str[80]; 43975872bbf2SRichard Henderson }; 43985872bbf2SRichard Henderson 43995872bbf2SRichard Henderson struct ElfImage *img; 44005872bbf2SRichard Henderson 44015872bbf2SRichard Henderson static const struct ElfImage img_template = { 44025872bbf2SRichard Henderson .ehdr = { 44035872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 44045872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 44055872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 44065872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 44075872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 44085872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 44095872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 44105872bbf2SRichard Henderson .e_type = ET_EXEC, 44115872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 44125872bbf2SRichard Henderson .e_version = EV_CURRENT, 44135872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 44145872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 44155872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 44165872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 44175872bbf2SRichard Henderson .e_phnum = 1, 44185872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 44195872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 44205872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 4421abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 4422abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 4423abbb3eaeSRichard Henderson #endif 4424abbb3eaeSRichard Henderson #ifdef ELF_OSABI 4425abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 4426abbb3eaeSRichard Henderson #endif 44275872bbf2SRichard Henderson }, 44285872bbf2SRichard Henderson .phdr = { 44295872bbf2SRichard Henderson .p_type = PT_LOAD, 44305872bbf2SRichard Henderson .p_flags = PF_X, 44315872bbf2SRichard Henderson }, 44325872bbf2SRichard Henderson .shdr = { 44335872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 44345872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 44355872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 44365872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 44375872bbf2SRichard Henderson will not look for contents. We can record any address. */ 44385872bbf2SRichard Henderson [1] = { /* .text */ 44395872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 44405872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 44415872bbf2SRichard Henderson }, 44425872bbf2SRichard Henderson [2] = { /* .debug_info */ 44435872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 44445872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 44455872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 44465872bbf2SRichard Henderson }, 44475872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 44485872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 44495872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 44505872bbf2SRichard Henderson .sh_size = sizeof(img->da), 44515872bbf2SRichard Henderson }, 44525872bbf2SRichard Henderson [4] = { /* .debug_frame */ 44535872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 44545872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 44555872bbf2SRichard Henderson }, 44565872bbf2SRichard Henderson [5] = { /* .symtab */ 44575872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 44585872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 44595872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 44605872bbf2SRichard Henderson .sh_info = 1, 44615872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 44625872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 44635872bbf2SRichard Henderson }, 44645872bbf2SRichard Henderson [6] = { /* .strtab */ 44655872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 44665872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, str), 44675872bbf2SRichard Henderson .sh_size = sizeof(img->str), 44685872bbf2SRichard Henderson } 44695872bbf2SRichard Henderson }, 44705872bbf2SRichard Henderson .sym = { 44715872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 44725872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 44735872bbf2SRichard Henderson .st_shndx = 1, 44745872bbf2SRichard Henderson } 44755872bbf2SRichard Henderson }, 44765872bbf2SRichard Henderson .di = { 44775872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 44785872bbf2SRichard Henderson .version = 2, 44795872bbf2SRichard Henderson .ptr_size = sizeof(void *), 44805872bbf2SRichard Henderson .cu_die = 1, 44815872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 44825872bbf2SRichard Henderson .fn_die = 2, 44835872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 44845872bbf2SRichard Henderson }, 44855872bbf2SRichard Henderson .da = { 44865872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 44875872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 44885872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 44895872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 44905872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 44915872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 44925872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 44935872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 44945872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 44955872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 44965872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 44975872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 44985872bbf2SRichard Henderson 0 /* no more abbrev */ 44995872bbf2SRichard Henderson }, 45005872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 45015872bbf2SRichard Henderson ".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 4502813da627SRichard Henderson }; 4503813da627SRichard Henderson 4504813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 4505813da627SRichard Henderson static struct jit_code_entry one_entry; 4506813da627SRichard Henderson 45075872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 4508813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 45092c90784aSRichard Henderson DebugFrameHeader *dfh; 4510813da627SRichard Henderson 45115872bbf2SRichard Henderson img = g_malloc(img_size); 45125872bbf2SRichard Henderson *img = img_template; 4513813da627SRichard Henderson 45145872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 45155872bbf2SRichard Henderson img->phdr.p_paddr = buf; 45165872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 4517813da627SRichard Henderson 45185872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 45195872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 45205872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 4521813da627SRichard Henderson 45225872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 45235872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 45245872bbf2SRichard Henderson 45255872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 45265872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 45275872bbf2SRichard Henderson 45285872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 45295872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 45305872bbf2SRichard Henderson 45315872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 45325872bbf2SRichard Henderson img->sym[1].st_value = buf; 45335872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 45345872bbf2SRichard Henderson 45355872bbf2SRichard Henderson img->di.cu_low_pc = buf; 453645aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 45375872bbf2SRichard Henderson img->di.fn_low_pc = buf; 453845aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 4539813da627SRichard Henderson 45402c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 45412c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 45422c90784aSRichard Henderson dfh->fde.func_start = buf; 45432c90784aSRichard Henderson dfh->fde.func_len = buf_size; 45442c90784aSRichard Henderson 4545813da627SRichard Henderson #ifdef DEBUG_JIT 4546813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 4547813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 4548813da627SRichard Henderson { 4549813da627SRichard Henderson FILE *f = fopen("/tmp/qemu.jit", "w+b"); 4550813da627SRichard Henderson if (f) { 45515872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 4552813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. */ 4553813da627SRichard Henderson } 4554813da627SRichard Henderson fclose(f); 4555813da627SRichard Henderson } 4556813da627SRichard Henderson } 4557813da627SRichard Henderson #endif 4558813da627SRichard Henderson 4559813da627SRichard Henderson one_entry.symfile_addr = img; 4560813da627SRichard Henderson one_entry.symfile_size = img_size; 4561813da627SRichard Henderson 4562813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 4563813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 4564813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 4565813da627SRichard Henderson __jit_debug_register_code(); 4566813da627SRichard Henderson } 4567813da627SRichard Henderson #else 45685872bbf2SRichard Henderson /* No support for the feature. Provide the entry point expected by exec.c, 45695872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 4570813da627SRichard Henderson 4571755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf, size_t size, 45722c90784aSRichard Henderson const void *debug_frame, 45732c90784aSRichard Henderson size_t debug_frame_size) 4574813da627SRichard Henderson { 4575813da627SRichard Henderson } 4576813da627SRichard Henderson 4577755bf9e5SRichard Henderson void tcg_register_jit(const void *buf, size_t buf_size) 4578813da627SRichard Henderson { 4579813da627SRichard Henderson } 4580813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 4581db432672SRichard Henderson 4582db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec 4583db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...) 4584db432672SRichard Henderson { 4585db432672SRichard Henderson g_assert_not_reached(); 4586db432672SRichard Henderson } 4587db432672SRichard Henderson #endif 4588