1c896fe29Sbellard /* 2c896fe29Sbellard * Tiny Code Generator for QEMU 3c896fe29Sbellard * 4c896fe29Sbellard * Copyright (c) 2008 Fabrice Bellard 5c896fe29Sbellard * 6c896fe29Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7c896fe29Sbellard * of this software and associated documentation files (the "Software"), to deal 8c896fe29Sbellard * in the Software without restriction, including without limitation the rights 9c896fe29Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10c896fe29Sbellard * copies of the Software, and to permit persons to whom the Software is 11c896fe29Sbellard * furnished to do so, subject to the following conditions: 12c896fe29Sbellard * 13c896fe29Sbellard * The above copyright notice and this permission notice shall be included in 14c896fe29Sbellard * all copies or substantial portions of the Software. 15c896fe29Sbellard * 16c896fe29Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17c896fe29Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18c896fe29Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19c896fe29Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20c896fe29Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21c896fe29Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22c896fe29Sbellard * THE SOFTWARE. 23c896fe29Sbellard */ 24c896fe29Sbellard 25c896fe29Sbellard /* define it to use liveness analysis (better code) */ 268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS 27c896fe29Sbellard 28757e725bSPeter Maydell #include "qemu/osdep.h" 29cca82982Saurel32 30813da627SRichard Henderson /* Define to jump the ELF file used to communicate with GDB. */ 31813da627SRichard Henderson #undef DEBUG_JIT 32813da627SRichard Henderson 3372fd2efbSEmilio G. 
Cota #include "qemu/error-report.h" 34f348b6d1SVeronia Bahaa #include "qemu/cutils.h" 351de7afc9SPaolo Bonzini #include "qemu/host-utils.h" 36d4c51a0aSMarkus Armbruster #include "qemu/qemu-print.h" 371de7afc9SPaolo Bonzini #include "qemu/timer.h" 38084cfca1SRichard Henderson #include "qemu/cacheflush.h" 39ad768e6fSPeter Maydell #include "qemu/cacheinfo.h" 40c896fe29Sbellard 41c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU 42c896fe29Sbellard CPU definitions. Currently they are used for qemu_ld/st 43c896fe29Sbellard instructions */ 44c896fe29Sbellard #define NO_CPU_IO_DEFS 45c896fe29Sbellard 4663c91552SPaolo Bonzini #include "exec/exec-all.h" 47dcb32f1dSPhilippe Mathieu-Daudé #include "tcg/tcg-op.h" 48813da627SRichard Henderson 49edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX 50813da627SRichard Henderson # define ELF_CLASS ELFCLASS32 51edee2579SRichard Henderson #else 52edee2579SRichard Henderson # define ELF_CLASS ELFCLASS64 53813da627SRichard Henderson #endif 54e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 55813da627SRichard Henderson # define ELF_DATA ELFDATA2MSB 56813da627SRichard Henderson #else 57813da627SRichard Henderson # define ELF_DATA ELFDATA2LSB 58813da627SRichard Henderson #endif 59813da627SRichard Henderson 60c896fe29Sbellard #include "elf.h" 61508127e2SPaolo Bonzini #include "exec/log.h" 62d2ba8026SRichard Henderson #include "tcg/tcg-ldst.h" 635ff7258cSRichard Henderson #include "tcg-internal.h" 64c896fe29Sbellard 6522f15579SRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 6622f15579SRichard Henderson #include <ffi.h> 6722f15579SRichard Henderson #endif 6822f15579SRichard Henderson 69139c1837SPaolo Bonzini /* Forward declarations for functions declared in tcg-target.c.inc and 70ce151109SPeter Maydell used here. 
*/ 71e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s); 72e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s); 736ac17786SRichard Henderson static bool patch_reloc(tcg_insn_unit *code_ptr, int type, 742ba7fae2SRichard Henderson intptr_t value, intptr_t addend); 75c896fe29Sbellard 76497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts. */ 77497a22ebSRichard Henderson typedef struct { 78497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 79497a22ebSRichard Henderson uint32_t id; 80497a22ebSRichard Henderson uint8_t version; 81497a22ebSRichard Henderson char augmentation[1]; 82497a22ebSRichard Henderson uint8_t code_align; 83497a22ebSRichard Henderson uint8_t data_align; 84497a22ebSRichard Henderson uint8_t return_column; 85497a22ebSRichard Henderson } DebugFrameCIE; 86497a22ebSRichard Henderson 87497a22ebSRichard Henderson typedef struct QEMU_PACKED { 88497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 89497a22ebSRichard Henderson uint32_t cie_offset; 90edee2579SRichard Henderson uintptr_t func_start; 91edee2579SRichard Henderson uintptr_t func_len; 92497a22ebSRichard Henderson } DebugFrameFDEHeader; 93497a22ebSRichard Henderson 942c90784aSRichard Henderson typedef struct QEMU_PACKED { 952c90784aSRichard Henderson DebugFrameCIE cie; 962c90784aSRichard Henderson DebugFrameFDEHeader fde; 972c90784aSRichard Henderson } DebugFrameHeader; 982c90784aSRichard Henderson 99755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf, size_t size, 1002c90784aSRichard Henderson const void *debug_frame, 1012c90784aSRichard Henderson size_t debug_frame_size) 102813da627SRichard Henderson __attribute__((unused)); 103813da627SRichard Henderson 104139c1837SPaolo Bonzini /* Forward declarations for functions declared and used in tcg-target.c.inc. 
*/ 1052a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1, 106a05b5b9bSRichard Henderson intptr_t arg2); 10778113e83SRichard Henderson static bool tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg); 108c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type, 1092a534affSRichard Henderson TCGReg ret, tcg_target_long arg); 1105e8892dbSMiroslav Rezanina static void tcg_out_op(TCGContext *s, TCGOpcode opc, 1115e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1125e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]); 113d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec 114e7632cfaSRichard Henderson static bool tcg_out_dup_vec(TCGContext *s, TCGType type, unsigned vece, 115e7632cfaSRichard Henderson TCGReg dst, TCGReg src); 116d6ecb4a9SRichard Henderson static bool tcg_out_dupm_vec(TCGContext *s, TCGType type, unsigned vece, 117d6ecb4a9SRichard Henderson TCGReg dst, TCGReg base, intptr_t offset); 1184e186175SRichard Henderson static void tcg_out_dupi_vec(TCGContext *s, TCGType type, unsigned vece, 1194e186175SRichard Henderson TCGReg dst, int64_t arg); 1205e8892dbSMiroslav Rezanina static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, 1215e8892dbSMiroslav Rezanina unsigned vecl, unsigned vece, 1225e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1235e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]); 124d2fd745fSRichard Henderson #else 125e7632cfaSRichard Henderson static inline bool tcg_out_dup_vec(TCGContext *s, TCGType type, unsigned vece, 126e7632cfaSRichard Henderson TCGReg dst, TCGReg src) 127e7632cfaSRichard Henderson { 128e7632cfaSRichard Henderson g_assert_not_reached(); 129e7632cfaSRichard Henderson } 130d6ecb4a9SRichard Henderson static inline bool tcg_out_dupm_vec(TCGContext *s, TCGType type, unsigned vece, 131d6ecb4a9SRichard Henderson TCGReg dst, TCGReg base, intptr_t offset) 132d6ecb4a9SRichard Henderson { 
133d6ecb4a9SRichard Henderson g_assert_not_reached(); 134d6ecb4a9SRichard Henderson } 1354e186175SRichard Henderson static inline void tcg_out_dupi_vec(TCGContext *s, TCGType type, unsigned vece, 1364e186175SRichard Henderson TCGReg dst, int64_t arg) 137e7632cfaSRichard Henderson { 138e7632cfaSRichard Henderson g_assert_not_reached(); 139e7632cfaSRichard Henderson } 1405e8892dbSMiroslav Rezanina static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, 1415e8892dbSMiroslav Rezanina unsigned vecl, unsigned vece, 1425e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1435e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]) 144d2fd745fSRichard Henderson { 145d2fd745fSRichard Henderson g_assert_not_reached(); 146d2fd745fSRichard Henderson } 147d2fd745fSRichard Henderson #endif 1482a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, 149a05b5b9bSRichard Henderson intptr_t arg2); 15059d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val, 15159d7c14eSRichard Henderson TCGReg base, intptr_t ofs); 1527b7d8b2dSRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 1537b7d8b2dSRichard Henderson static void tcg_out_call(TCGContext *s, const tcg_insn_unit *target, 1547b7d8b2dSRichard Henderson ffi_cif *cif); 1557b7d8b2dSRichard Henderson #else 1562be7d76bSRichard Henderson static void tcg_out_call(TCGContext *s, const tcg_insn_unit *target); 1577b7d8b2dSRichard Henderson #endif 158a4fbbd77SRichard Henderson static bool tcg_target_const_match(int64_t val, TCGType type, int ct); 159659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 160aeee05f5SRichard Henderson static int tcg_out_ldst_finalize(TCGContext *s); 161659ef5cbSRichard Henderson #endif 162c896fe29Sbellard 16342eb6dfcSRichard Henderson TCGContext tcg_init_ctx; 16442eb6dfcSRichard Henderson __thread TCGContext *tcg_ctx; 16542eb6dfcSRichard Henderson 1665ff7258cSRichard Henderson TCGContext **tcg_ctxs; 
1670e2d61cfSRichard Henderson unsigned int tcg_cur_ctxs; 1680e2d61cfSRichard Henderson unsigned int tcg_max_ctxs; 1691c2adb95SRichard Henderson TCGv_env cpu_env = 0; 170c8bc1168SRichard Henderson const void *tcg_code_gen_epilogue; 171db0c51a3SRichard Henderson uintptr_t tcg_splitwx_diff; 172df2cce29SEmilio G. Cota 173b91ccb31SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 174b91ccb31SRichard Henderson tcg_prologue_fn *tcg_qemu_tb_exec; 175b91ccb31SRichard Henderson #endif 176b91ccb31SRichard Henderson 177d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT]; 178b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 179c896fe29Sbellard 1801813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1814196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 182c896fe29Sbellard { 183c896fe29Sbellard *s->code_ptr++ = v; 184c896fe29Sbellard } 185c896fe29Sbellard 1864196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1874196dca6SPeter Maydell uint8_t v) 1885c53bb81SPeter Maydell { 1891813e175SRichard Henderson *p = v; 1905c53bb81SPeter Maydell } 1911813e175SRichard Henderson #endif 1925c53bb81SPeter Maydell 1931813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1944196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 195c896fe29Sbellard { 1961813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1971813e175SRichard Henderson *s->code_ptr++ = v; 1981813e175SRichard Henderson } else { 1991813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2004387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2011813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 2021813e175SRichard Henderson } 203c896fe29Sbellard } 204c896fe29Sbellard 2054196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 2064196dca6SPeter Maydell 
uint16_t v) 2075c53bb81SPeter Maydell { 2081813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 2091813e175SRichard Henderson *p = v; 2101813e175SRichard Henderson } else { 2115c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2125c53bb81SPeter Maydell } 2131813e175SRichard Henderson } 2141813e175SRichard Henderson #endif 2155c53bb81SPeter Maydell 2161813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 2174196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 218c896fe29Sbellard { 2191813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2201813e175SRichard Henderson *s->code_ptr++ = v; 2211813e175SRichard Henderson } else { 2221813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2234387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2241813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 2251813e175SRichard Henderson } 226c896fe29Sbellard } 227c896fe29Sbellard 2284196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 2294196dca6SPeter Maydell uint32_t v) 2305c53bb81SPeter Maydell { 2311813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2321813e175SRichard Henderson *p = v; 2331813e175SRichard Henderson } else { 2345c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2355c53bb81SPeter Maydell } 2361813e175SRichard Henderson } 2371813e175SRichard Henderson #endif 2385c53bb81SPeter Maydell 2391813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 2404196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 241ac26eb69SRichard Henderson { 2421813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2431813e175SRichard Henderson *s->code_ptr++ = v; 2441813e175SRichard Henderson } else { 2451813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2464387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2471813e175SRichard Henderson s->code_ptr = p + (8 / 
TCG_TARGET_INSN_UNIT_SIZE); 2481813e175SRichard Henderson } 249ac26eb69SRichard Henderson } 250ac26eb69SRichard Henderson 2514196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 2524196dca6SPeter Maydell uint64_t v) 2535c53bb81SPeter Maydell { 2541813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2551813e175SRichard Henderson *p = v; 2561813e175SRichard Henderson } else { 2575c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2585c53bb81SPeter Maydell } 2591813e175SRichard Henderson } 2601813e175SRichard Henderson #endif 2615c53bb81SPeter Maydell 262c896fe29Sbellard /* label relocation processing */ 263c896fe29Sbellard 2641813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 265bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 266c896fe29Sbellard { 2677ecd02a0SRichard Henderson TCGRelocation *r = tcg_malloc(sizeof(TCGRelocation)); 268c896fe29Sbellard 269c896fe29Sbellard r->type = type; 270c896fe29Sbellard r->ptr = code_ptr; 271c896fe29Sbellard r->addend = addend; 2727ecd02a0SRichard Henderson QSIMPLEQ_INSERT_TAIL(&l->relocs, r, next); 273c896fe29Sbellard } 274c896fe29Sbellard 27592ab8e7dSRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l) 276c896fe29Sbellard { 277eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 278c896fe29Sbellard l->has_value = 1; 27992ab8e7dSRichard Henderson l->u.value_ptr = tcg_splitwx_to_rx(s->code_ptr); 280c896fe29Sbellard } 281c896fe29Sbellard 28242a268c2SRichard Henderson TCGLabel *gen_new_label(void) 283c896fe29Sbellard { 284b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 28551e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 286c896fe29Sbellard 2877ecd02a0SRichard Henderson memset(l, 0, sizeof(TCGLabel)); 2887ecd02a0SRichard Henderson l->id = s->nb_labels++; 2897ecd02a0SRichard Henderson QSIMPLEQ_INIT(&l->relocs); 2907ecd02a0SRichard Henderson 291bef16ab4SRichard Henderson QSIMPLEQ_INSERT_TAIL(&s->labels, l, next); 29242a268c2SRichard Henderson 29342a268c2SRichard Henderson return l; 294c896fe29Sbellard } 295c896fe29Sbellard 2967ecd02a0SRichard Henderson static bool tcg_resolve_relocs(TCGContext *s) 2977ecd02a0SRichard Henderson { 2987ecd02a0SRichard Henderson TCGLabel *l; 2997ecd02a0SRichard Henderson 3007ecd02a0SRichard Henderson QSIMPLEQ_FOREACH(l, &s->labels, next) { 3017ecd02a0SRichard Henderson TCGRelocation *r; 3027ecd02a0SRichard Henderson uintptr_t value = l->u.value; 3037ecd02a0SRichard Henderson 3047ecd02a0SRichard Henderson QSIMPLEQ_FOREACH(r, &l->relocs, next) { 3057ecd02a0SRichard Henderson if (!patch_reloc(r->ptr, r->type, value, r->addend)) { 3067ecd02a0SRichard Henderson return false; 3077ecd02a0SRichard Henderson } 3087ecd02a0SRichard Henderson } 3097ecd02a0SRichard Henderson } 3107ecd02a0SRichard Henderson return true; 3117ecd02a0SRichard Henderson } 3127ecd02a0SRichard Henderson 3139f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which) 3149f754620SRichard Henderson { 315f14bed3fSRichard Henderson /* 316f14bed3fSRichard Henderson * We will check for overflow at the end of the opcode loop in 317f14bed3fSRichard Henderson * tcg_gen_code, where we bound tcg_current_code_size to UINT16_MAX. 318f14bed3fSRichard Henderson */ 319f14bed3fSRichard Henderson s->tb_jmp_reset_offset[which] = tcg_current_code_size(s); 3209f754620SRichard Henderson } 3219f754620SRichard Henderson 322db6b7d0cSRichard Henderson /* Signal overflow, starting over with fewer guest insns. 
*/ 3238905770bSMarc-André Lureau static G_NORETURN 3248905770bSMarc-André Lureau void tcg_raise_tb_overflow(TCGContext *s) 325db6b7d0cSRichard Henderson { 326db6b7d0cSRichard Henderson siglongjmp(s->jmp_trans, -2); 327db6b7d0cSRichard Henderson } 328db6b7d0cSRichard Henderson 3294c22e840SRichard Henderson #define C_PFX1(P, A) P##A 3304c22e840SRichard Henderson #define C_PFX2(P, A, B) P##A##_##B 3314c22e840SRichard Henderson #define C_PFX3(P, A, B, C) P##A##_##B##_##C 3324c22e840SRichard Henderson #define C_PFX4(P, A, B, C, D) P##A##_##B##_##C##_##D 3334c22e840SRichard Henderson #define C_PFX5(P, A, B, C, D, E) P##A##_##B##_##C##_##D##_##E 3344c22e840SRichard Henderson #define C_PFX6(P, A, B, C, D, E, F) P##A##_##B##_##C##_##D##_##E##_##F 3354c22e840SRichard Henderson 3364c22e840SRichard Henderson /* Define an enumeration for the various combinations. */ 3374c22e840SRichard Henderson 3384c22e840SRichard Henderson #define C_O0_I1(I1) C_PFX1(c_o0_i1_, I1), 3394c22e840SRichard Henderson #define C_O0_I2(I1, I2) C_PFX2(c_o0_i2_, I1, I2), 3404c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) C_PFX3(c_o0_i3_, I1, I2, I3), 3414c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) C_PFX4(c_o0_i4_, I1, I2, I3, I4), 3424c22e840SRichard Henderson 3434c22e840SRichard Henderson #define C_O1_I1(O1, I1) C_PFX2(c_o1_i1_, O1, I1), 3444c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) C_PFX3(c_o1_i2_, O1, I1, I2), 3454c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) C_PFX4(c_o1_i3_, O1, I1, I2, I3), 3464c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) C_PFX5(c_o1_i4_, O1, I1, I2, I3, I4), 3474c22e840SRichard Henderson 3484c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) C_PFX3(c_n1_i2_, O1, I1, I2), 3494c22e840SRichard Henderson 3504c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) C_PFX3(c_o2_i1_, O1, O2, I1), 3514c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) C_PFX4(c_o2_i2_, O1, O2, I1, I2), 3524c22e840SRichard Henderson #define 
C_O2_I3(O1, O2, I1, I2, I3) C_PFX5(c_o2_i3_, O1, O2, I1, I2, I3), 3534c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) C_PFX6(c_o2_i4_, O1, O2, I1, I2, I3, I4), 3544c22e840SRichard Henderson 3554c22e840SRichard Henderson typedef enum { 3564c22e840SRichard Henderson #include "tcg-target-con-set.h" 3574c22e840SRichard Henderson } TCGConstraintSetIndex; 3584c22e840SRichard Henderson 3594c22e840SRichard Henderson static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode); 3604c22e840SRichard Henderson 3614c22e840SRichard Henderson #undef C_O0_I1 3624c22e840SRichard Henderson #undef C_O0_I2 3634c22e840SRichard Henderson #undef C_O0_I3 3644c22e840SRichard Henderson #undef C_O0_I4 3654c22e840SRichard Henderson #undef C_O1_I1 3664c22e840SRichard Henderson #undef C_O1_I2 3674c22e840SRichard Henderson #undef C_O1_I3 3684c22e840SRichard Henderson #undef C_O1_I4 3694c22e840SRichard Henderson #undef C_N1_I2 3704c22e840SRichard Henderson #undef C_O2_I1 3714c22e840SRichard Henderson #undef C_O2_I2 3724c22e840SRichard Henderson #undef C_O2_I3 3734c22e840SRichard Henderson #undef C_O2_I4 3744c22e840SRichard Henderson 3754c22e840SRichard Henderson /* Put all of the constraint sets into an array, indexed by the enum. 
*/ 3764c22e840SRichard Henderson 3774c22e840SRichard Henderson #define C_O0_I1(I1) { .args_ct_str = { #I1 } }, 3784c22e840SRichard Henderson #define C_O0_I2(I1, I2) { .args_ct_str = { #I1, #I2 } }, 3794c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) { .args_ct_str = { #I1, #I2, #I3 } }, 3804c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) { .args_ct_str = { #I1, #I2, #I3, #I4 } }, 3814c22e840SRichard Henderson 3824c22e840SRichard Henderson #define C_O1_I1(O1, I1) { .args_ct_str = { #O1, #I1 } }, 3834c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) { .args_ct_str = { #O1, #I1, #I2 } }, 3844c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) { .args_ct_str = { #O1, #I1, #I2, #I3 } }, 3854c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) { .args_ct_str = { #O1, #I1, #I2, #I3, #I4 } }, 3864c22e840SRichard Henderson 3874c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) { .args_ct_str = { "&" #O1, #I1, #I2 } }, 3884c22e840SRichard Henderson 3894c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) { .args_ct_str = { #O1, #O2, #I1 } }, 3904c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) { .args_ct_str = { #O1, #O2, #I1, #I2 } }, 3914c22e840SRichard Henderson #define C_O2_I3(O1, O2, I1, I2, I3) { .args_ct_str = { #O1, #O2, #I1, #I2, #I3 } }, 3924c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) { .args_ct_str = { #O1, #O2, #I1, #I2, #I3, #I4 } }, 3934c22e840SRichard Henderson 3944c22e840SRichard Henderson static const TCGTargetOpDef constraint_sets[] = { 3954c22e840SRichard Henderson #include "tcg-target-con-set.h" 3964c22e840SRichard Henderson }; 3974c22e840SRichard Henderson 3984c22e840SRichard Henderson 3994c22e840SRichard Henderson #undef C_O0_I1 4004c22e840SRichard Henderson #undef C_O0_I2 4014c22e840SRichard Henderson #undef C_O0_I3 4024c22e840SRichard Henderson #undef C_O0_I4 4034c22e840SRichard Henderson #undef C_O1_I1 4044c22e840SRichard Henderson #undef C_O1_I2 4054c22e840SRichard Henderson 
#undef C_O1_I3 4064c22e840SRichard Henderson #undef C_O1_I4 4074c22e840SRichard Henderson #undef C_N1_I2 4084c22e840SRichard Henderson #undef C_O2_I1 4094c22e840SRichard Henderson #undef C_O2_I2 4104c22e840SRichard Henderson #undef C_O2_I3 4114c22e840SRichard Henderson #undef C_O2_I4 4124c22e840SRichard Henderson 4134c22e840SRichard Henderson /* Expand the enumerator to be returned from tcg_target_op_def(). */ 4144c22e840SRichard Henderson 4154c22e840SRichard Henderson #define C_O0_I1(I1) C_PFX1(c_o0_i1_, I1) 4164c22e840SRichard Henderson #define C_O0_I2(I1, I2) C_PFX2(c_o0_i2_, I1, I2) 4174c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) C_PFX3(c_o0_i3_, I1, I2, I3) 4184c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) C_PFX4(c_o0_i4_, I1, I2, I3, I4) 4194c22e840SRichard Henderson 4204c22e840SRichard Henderson #define C_O1_I1(O1, I1) C_PFX2(c_o1_i1_, O1, I1) 4214c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) C_PFX3(c_o1_i2_, O1, I1, I2) 4224c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) C_PFX4(c_o1_i3_, O1, I1, I2, I3) 4234c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) C_PFX5(c_o1_i4_, O1, I1, I2, I3, I4) 4244c22e840SRichard Henderson 4254c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) C_PFX3(c_n1_i2_, O1, I1, I2) 4264c22e840SRichard Henderson 4274c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) C_PFX3(c_o2_i1_, O1, O2, I1) 4284c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) C_PFX4(c_o2_i2_, O1, O2, I1, I2) 4294c22e840SRichard Henderson #define C_O2_I3(O1, O2, I1, I2, I3) C_PFX5(c_o2_i3_, O1, O2, I1, I2, I3) 4304c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) C_PFX6(c_o2_i4_, O1, O2, I1, I2, I3, I4) 4314c22e840SRichard Henderson 432139c1837SPaolo Bonzini #include "tcg-target.c.inc" 433c896fe29Sbellard 43438b47b19SEmilio G. Cota static void alloc_tcg_plugin_context(TCGContext *s) 43538b47b19SEmilio G. Cota { 43638b47b19SEmilio G. Cota #ifdef CONFIG_PLUGIN 43738b47b19SEmilio G. 
Cota s->plugin_tb = g_new0(struct qemu_plugin_tb, 1); 43838b47b19SEmilio G. Cota s->plugin_tb->insns = 43938b47b19SEmilio G. Cota g_ptr_array_new_with_free_func(qemu_plugin_insn_cleanup_fn); 44038b47b19SEmilio G. Cota #endif 44138b47b19SEmilio G. Cota } 44238b47b19SEmilio G. Cota 443e8feb96fSEmilio G. Cota /* 4443468b59eSEmilio G. Cota * All TCG threads except the parent (i.e. the one that called tcg_context_init 4453468b59eSEmilio G. Cota * and registered the target's TCG globals) must register with this function 4463468b59eSEmilio G. Cota * before initiating translation. 4473468b59eSEmilio G. Cota * 4483468b59eSEmilio G. Cota * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation 4493468b59eSEmilio G. Cota * of tcg_region_init() for the reasoning behind this. 4503468b59eSEmilio G. Cota * 4513468b59eSEmilio G. Cota * In softmmu each caller registers its context in tcg_ctxs[]. Note that in 4523468b59eSEmilio G. Cota * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context 4533468b59eSEmilio G. Cota * is not used anymore for translation once this function is called. 4543468b59eSEmilio G. Cota * 4553468b59eSEmilio G. Cota * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates 4563468b59eSEmilio G. Cota * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode. 4573468b59eSEmilio G. Cota */ 4583468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 4593468b59eSEmilio G. Cota void tcg_register_thread(void) 4603468b59eSEmilio G. Cota { 4613468b59eSEmilio G. Cota tcg_ctx = &tcg_init_ctx; 4623468b59eSEmilio G. Cota } 4633468b59eSEmilio G. Cota #else 4643468b59eSEmilio G. Cota void tcg_register_thread(void) 4653468b59eSEmilio G. Cota { 4663468b59eSEmilio G. Cota TCGContext *s = g_malloc(sizeof(*s)); 4673468b59eSEmilio G. Cota unsigned int i, n; 4683468b59eSEmilio G. Cota 4693468b59eSEmilio G. Cota *s = tcg_init_ctx; 4703468b59eSEmilio G. Cota 4713468b59eSEmilio G. Cota /* Relink mem_base. 
*/ 4723468b59eSEmilio G. Cota for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) { 4733468b59eSEmilio G. Cota if (tcg_init_ctx.temps[i].mem_base) { 4743468b59eSEmilio G. Cota ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps; 4753468b59eSEmilio G. Cota tcg_debug_assert(b >= 0 && b < n); 4763468b59eSEmilio G. Cota s->temps[i].mem_base = &s->temps[b]; 4773468b59eSEmilio G. Cota } 4783468b59eSEmilio G. Cota } 4793468b59eSEmilio G. Cota 4803468b59eSEmilio G. Cota /* Claim an entry in tcg_ctxs */ 4810e2d61cfSRichard Henderson n = qatomic_fetch_inc(&tcg_cur_ctxs); 4820e2d61cfSRichard Henderson g_assert(n < tcg_max_ctxs); 483d73415a3SStefan Hajnoczi qatomic_set(&tcg_ctxs[n], s); 4843468b59eSEmilio G. Cota 48538b47b19SEmilio G. Cota if (n > 0) { 48638b47b19SEmilio G. Cota alloc_tcg_plugin_context(s); 487bf042e8eSRichard Henderson tcg_region_initial_alloc(s); 48838b47b19SEmilio G. Cota } 48938b47b19SEmilio G. Cota 4903468b59eSEmilio G. Cota tcg_ctx = s; 4913468b59eSEmilio G. Cota } 4923468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */ 4933468b59eSEmilio G. 
Cota 494c896fe29Sbellard /* pool based memory allocation */ 495c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 496c896fe29Sbellard { 497c896fe29Sbellard TCGPool *p; 498c896fe29Sbellard int pool_size; 499c896fe29Sbellard 500c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 501c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 5027267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 503c896fe29Sbellard p->size = size; 5044055299eSKirill Batuzov p->next = s->pool_first_large; 5054055299eSKirill Batuzov s->pool_first_large = p; 5064055299eSKirill Batuzov return p->data; 507c896fe29Sbellard } else { 508c896fe29Sbellard p = s->pool_current; 509c896fe29Sbellard if (!p) { 510c896fe29Sbellard p = s->pool_first; 511c896fe29Sbellard if (!p) 512c896fe29Sbellard goto new_pool; 513c896fe29Sbellard } else { 514c896fe29Sbellard if (!p->next) { 515c896fe29Sbellard new_pool: 516c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 5177267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 518c896fe29Sbellard p->size = pool_size; 519c896fe29Sbellard p->next = NULL; 520a813e36fSRichard Henderson if (s->pool_current) { 521c896fe29Sbellard s->pool_current->next = p; 522a813e36fSRichard Henderson } else { 523c896fe29Sbellard s->pool_first = p; 524a813e36fSRichard Henderson } 525c896fe29Sbellard } else { 526c896fe29Sbellard p = p->next; 527c896fe29Sbellard } 528c896fe29Sbellard } 529c896fe29Sbellard } 530c896fe29Sbellard s->pool_current = p; 531c896fe29Sbellard s->pool_cur = p->data + size; 532c896fe29Sbellard s->pool_end = p->data + p->size; 533c896fe29Sbellard return p->data; 534c896fe29Sbellard } 535c896fe29Sbellard 536c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 537c896fe29Sbellard { 5384055299eSKirill Batuzov TCGPool *p, *t; 5394055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 5404055299eSKirill Batuzov t = p->next; 5414055299eSKirill Batuzov g_free(p); 5424055299eSKirill Batuzov } 5434055299eSKirill 
Batuzov s->pool_first_large = NULL; 544c896fe29Sbellard s->pool_cur = s->pool_end = NULL; 545c896fe29Sbellard s->pool_current = NULL; 546c896fe29Sbellard } 547c896fe29Sbellard 5482ef6175aSRichard Henderson #include "exec/helper-proto.h" 5492ef6175aSRichard Henderson 550100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 5512ef6175aSRichard Henderson #include "exec/helper-tcg.h" 552100b5e01SRichard Henderson }; 553619205fdSEmilio G. Cota static GHashTable *helper_table; 554100b5e01SRichard Henderson 55522f15579SRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 55622f15579SRichard Henderson static GHashTable *ffi_table; 55722f15579SRichard Henderson 55822f15579SRichard Henderson static ffi_type * const typecode_to_ffi[8] = { 55922f15579SRichard Henderson [dh_typecode_void] = &ffi_type_void, 56022f15579SRichard Henderson [dh_typecode_i32] = &ffi_type_uint32, 56122f15579SRichard Henderson [dh_typecode_s32] = &ffi_type_sint32, 56222f15579SRichard Henderson [dh_typecode_i64] = &ffi_type_uint64, 56322f15579SRichard Henderson [dh_typecode_s64] = &ffi_type_sint64, 56422f15579SRichard Henderson [dh_typecode_ptr] = &ffi_type_pointer, 56522f15579SRichard Henderson }; 56622f15579SRichard Henderson #endif 56722f15579SRichard Henderson 56891478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 569f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 5701c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 5711c2adb95SRichard Henderson TCGReg reg, const char *name); 57291478cefSRichard Henderson 57343b972b7SRichard Henderson static void tcg_context_init(unsigned max_cpus) 574c896fe29Sbellard { 575a76aabd3SRichard Henderson TCGContext *s = &tcg_init_ctx; 576100b5e01SRichard Henderson int op, total_args, n, i; 577c896fe29Sbellard TCGOpDef *def; 578c896fe29Sbellard TCGArgConstraint *args_ct; 5791c2adb95SRichard Henderson TCGTemp *ts; 580c896fe29Sbellard 
581c896fe29Sbellard memset(s, 0, sizeof(*s)); 582c896fe29Sbellard s->nb_globals = 0; 583c896fe29Sbellard 584c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 585c896fe29Sbellard space */ 586c896fe29Sbellard total_args = 0; 587c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 588c896fe29Sbellard def = &tcg_op_defs[op]; 589c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 590c896fe29Sbellard total_args += n; 591c896fe29Sbellard } 592c896fe29Sbellard 593bc2b17e6SRichard Henderson args_ct = g_new0(TCGArgConstraint, total_args); 594c896fe29Sbellard 595c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 596c896fe29Sbellard def = &tcg_op_defs[op]; 597c896fe29Sbellard def->args_ct = args_ct; 598c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 599c896fe29Sbellard args_ct += n; 600c896fe29Sbellard } 601c896fe29Sbellard 6025cd8f621SRichard Henderson /* Register helpers. */ 60384fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 604619205fdSEmilio G. Cota helper_table = g_hash_table_new(NULL, NULL); 60584fd9dd3SRichard Henderson 606100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 60784fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 60872866e82SRichard Henderson (gpointer)&all_helpers[i]); 609100b5e01SRichard Henderson } 6105cd8f621SRichard Henderson 61122f15579SRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 61222f15579SRichard Henderson /* g_direct_hash/equal for direct comparisons on uint32_t. 
*/ 61322f15579SRichard Henderson ffi_table = g_hash_table_new(NULL, NULL); 61422f15579SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 61522f15579SRichard Henderson struct { 61622f15579SRichard Henderson ffi_cif cif; 61722f15579SRichard Henderson ffi_type *args[]; 61822f15579SRichard Henderson } *ca; 61922f15579SRichard Henderson uint32_t typemask = all_helpers[i].typemask; 62022f15579SRichard Henderson gpointer hash = (gpointer)(uintptr_t)typemask; 62122f15579SRichard Henderson ffi_status status; 62222f15579SRichard Henderson int nargs; 62322f15579SRichard Henderson 62422f15579SRichard Henderson if (g_hash_table_lookup(ffi_table, hash)) { 62522f15579SRichard Henderson continue; 62622f15579SRichard Henderson } 62722f15579SRichard Henderson 62822f15579SRichard Henderson /* Ignoring the return type, find the last non-zero field. */ 62922f15579SRichard Henderson nargs = 32 - clz32(typemask >> 3); 63022f15579SRichard Henderson nargs = DIV_ROUND_UP(nargs, 3); 63122f15579SRichard Henderson 63222f15579SRichard Henderson ca = g_malloc0(sizeof(*ca) + nargs * sizeof(ffi_type *)); 63322f15579SRichard Henderson ca->cif.rtype = typecode_to_ffi[typemask & 7]; 63422f15579SRichard Henderson ca->cif.nargs = nargs; 63522f15579SRichard Henderson 63622f15579SRichard Henderson if (nargs != 0) { 63722f15579SRichard Henderson ca->cif.arg_types = ca->args; 6389dd1d56eSIcenowy Zheng for (int j = 0; j < nargs; ++j) { 6399dd1d56eSIcenowy Zheng int typecode = extract32(typemask, (j + 1) * 3, 3); 6409dd1d56eSIcenowy Zheng ca->args[j] = typecode_to_ffi[typecode]; 64122f15579SRichard Henderson } 64222f15579SRichard Henderson } 64322f15579SRichard Henderson 64422f15579SRichard Henderson status = ffi_prep_cif(&ca->cif, FFI_DEFAULT_ABI, nargs, 64522f15579SRichard Henderson ca->cif.rtype, ca->cif.arg_types); 64622f15579SRichard Henderson assert(status == FFI_OK); 64722f15579SRichard Henderson 64822f15579SRichard Henderson g_hash_table_insert(ffi_table, hash, (gpointer)&ca->cif); 
64922f15579SRichard Henderson } 65022f15579SRichard Henderson #endif 65122f15579SRichard Henderson 652c896fe29Sbellard tcg_target_init(s); 653f69d277eSRichard Henderson process_op_defs(s); 65491478cefSRichard Henderson 65591478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 65691478cefSRichard Henderson the start of tcg_target_reg_alloc_order. */ 65791478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 65891478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 65991478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 66091478cefSRichard Henderson break; 66191478cefSRichard Henderson } 66291478cefSRichard Henderson } 66391478cefSRichard Henderson for (i = 0; i < n; ++i) { 66491478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 66591478cefSRichard Henderson } 66691478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 66791478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 66891478cefSRichard Henderson } 669b1311c4aSEmilio G. Cota 67038b47b19SEmilio G. Cota alloc_tcg_plugin_context(s); 67138b47b19SEmilio G. Cota 672b1311c4aSEmilio G. Cota tcg_ctx = s; 6733468b59eSEmilio G. Cota /* 6743468b59eSEmilio G. Cota * In user-mode we simply share the init context among threads, since we 6753468b59eSEmilio G. Cota * use a single region. See the documentation tcg_region_init() for the 6763468b59eSEmilio G. Cota * reasoning behind this. 6773468b59eSEmilio G. Cota * In softmmu we will have at most max_cpus TCG threads. 6783468b59eSEmilio G. Cota */ 6793468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 680df2cce29SEmilio G. Cota tcg_ctxs = &tcg_ctx; 6810e2d61cfSRichard Henderson tcg_cur_ctxs = 1; 6820e2d61cfSRichard Henderson tcg_max_ctxs = 1; 6833468b59eSEmilio G. 
Cota #else 6840e2d61cfSRichard Henderson tcg_max_ctxs = max_cpus; 6850e2d61cfSRichard Henderson tcg_ctxs = g_new0(TCGContext *, max_cpus); 6863468b59eSEmilio G. Cota #endif 6871c2adb95SRichard Henderson 6881c2adb95SRichard Henderson tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0)); 6891c2adb95SRichard Henderson ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env"); 6901c2adb95SRichard Henderson cpu_env = temp_tcgv_ptr(ts); 6919002ec79SRichard Henderson } 692b03cce8eSbellard 69343b972b7SRichard Henderson void tcg_init(size_t tb_size, int splitwx, unsigned max_cpus) 694a76aabd3SRichard Henderson { 69543b972b7SRichard Henderson tcg_context_init(max_cpus); 69643b972b7SRichard Henderson tcg_region_init(tb_size, splitwx, max_cpus); 697a76aabd3SRichard Henderson } 698a76aabd3SRichard Henderson 6996e3b2bfdSEmilio G. Cota /* 7006e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 7016e3b2bfdSEmilio G. Cota * sure that TBs and code are on different cache lines. 7026e3b2bfdSEmilio G. Cota */ 7036e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 7046e3b2bfdSEmilio G. Cota { 7056e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 7066e3b2bfdSEmilio G. Cota TranslationBlock *tb; 7076e3b2bfdSEmilio G. Cota void *next; 7086e3b2bfdSEmilio G. Cota 709e8feb96fSEmilio G. Cota retry: 7106e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 7116e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 7126e3b2bfdSEmilio G. Cota 7136e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 714e8feb96fSEmilio G. Cota if (tcg_region_alloc(s)) { 7156e3b2bfdSEmilio G. Cota return NULL; 7166e3b2bfdSEmilio G. Cota } 717e8feb96fSEmilio G. Cota goto retry; 718e8feb96fSEmilio G. Cota } 719d73415a3SStefan Hajnoczi qatomic_set(&s->code_gen_ptr, next); 72057a26946SRichard Henderson s->data_gen_ptr = NULL; 7216e3b2bfdSEmilio G. 
Cota return tb; 7226e3b2bfdSEmilio G. Cota } 7236e3b2bfdSEmilio G. Cota 7249002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 7259002ec79SRichard Henderson { 726b0a0794aSRichard Henderson size_t prologue_size; 7278163b749SRichard Henderson 728b0a0794aSRichard Henderson s->code_ptr = s->code_gen_ptr; 729b0a0794aSRichard Henderson s->code_buf = s->code_gen_ptr; 7305b38ee31SRichard Henderson s->data_gen_ptr = NULL; 731b91ccb31SRichard Henderson 732b91ccb31SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 733b0a0794aSRichard Henderson tcg_qemu_tb_exec = (tcg_prologue_fn *)tcg_splitwx_to_rx(s->code_ptr); 734b91ccb31SRichard Henderson #endif 7358163b749SRichard Henderson 7365b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 7375b38ee31SRichard Henderson s->pool_labels = NULL; 7385b38ee31SRichard Henderson #endif 7395b38ee31SRichard Henderson 740653b87ebSRoman Bolshakov qemu_thread_jit_write(); 7418163b749SRichard Henderson /* Generate the prologue. */ 742b03cce8eSbellard tcg_target_qemu_prologue(s); 7435b38ee31SRichard Henderson 7445b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 7455b38ee31SRichard Henderson /* Allow the prologue to put e.g. guest_base into a pool entry. 
*/ 7465b38ee31SRichard Henderson { 7471768987bSRichard Henderson int result = tcg_out_pool_finalize(s); 7481768987bSRichard Henderson tcg_debug_assert(result == 0); 7495b38ee31SRichard Henderson } 7505b38ee31SRichard Henderson #endif 7515b38ee31SRichard Henderson 752b0a0794aSRichard Henderson prologue_size = tcg_current_code_size(s); 753b0a0794aSRichard Henderson 754df5d2b16SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 755b0a0794aSRichard Henderson flush_idcache_range((uintptr_t)tcg_splitwx_to_rx(s->code_buf), 756b0a0794aSRichard Henderson (uintptr_t)s->code_buf, prologue_size); 757df5d2b16SRichard Henderson #endif 7588163b749SRichard Henderson 759d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 760d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 761c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 76278b54858SRichard Henderson if (logfile) { 76378b54858SRichard Henderson fprintf(logfile, "PROLOGUE: [size=%zu]\n", prologue_size); 7645b38ee31SRichard Henderson if (s->data_gen_ptr) { 765b0a0794aSRichard Henderson size_t code_size = s->data_gen_ptr - s->code_gen_ptr; 7665b38ee31SRichard Henderson size_t data_size = prologue_size - code_size; 7675b38ee31SRichard Henderson size_t i; 7685b38ee31SRichard Henderson 76978b54858SRichard Henderson disas(logfile, s->code_gen_ptr, code_size); 7705b38ee31SRichard Henderson 7715b38ee31SRichard Henderson for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) { 7725b38ee31SRichard Henderson if (sizeof(tcg_target_ulong) == 8) { 77378b54858SRichard Henderson fprintf(logfile, 77478b54858SRichard Henderson "0x%08" PRIxPTR ": .quad 0x%016" PRIx64 "\n", 7755b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 7765b38ee31SRichard Henderson *(uint64_t *)(s->data_gen_ptr + i)); 7775b38ee31SRichard Henderson } else { 77878b54858SRichard Henderson fprintf(logfile, 77978b54858SRichard Henderson "0x%08" PRIxPTR ": .long 0x%08x\n", 7805b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 
7815b38ee31SRichard Henderson *(uint32_t *)(s->data_gen_ptr + i)); 7825b38ee31SRichard Henderson } 7835b38ee31SRichard Henderson } 7845b38ee31SRichard Henderson } else { 78578b54858SRichard Henderson disas(logfile, s->code_gen_ptr, prologue_size); 7865b38ee31SRichard Henderson } 78778b54858SRichard Henderson fprintf(logfile, "\n"); 788fc59d2d8SRobert Foley qemu_log_unlock(logfile); 789d6b64b2bSRichard Henderson } 79078b54858SRichard Henderson } 791d6b64b2bSRichard Henderson #endif 792cedbcb01SEmilio G. Cota 7936eea0434SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 7946eea0434SRichard Henderson /* 7956eea0434SRichard Henderson * Assert that goto_ptr is implemented completely, setting an epilogue. 7966eea0434SRichard Henderson * For tci, we use NULL as the signal to return from the interpreter, 7976eea0434SRichard Henderson * so skip this check. 7986eea0434SRichard Henderson */ 7998b5c2b62SRichard Henderson tcg_debug_assert(tcg_code_gen_epilogue != NULL); 8006eea0434SRichard Henderson #endif 801d1c74ab3SRichard Henderson 802d1c74ab3SRichard Henderson tcg_region_prologue_set(s); 803c896fe29Sbellard } 804c896fe29Sbellard 805c896fe29Sbellard void tcg_func_start(TCGContext *s) 806c896fe29Sbellard { 807c896fe29Sbellard tcg_pool_reset(s); 808c896fe29Sbellard s->nb_temps = s->nb_globals; 8090ec9eabcSRichard Henderson 8100ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. */ 8110ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 8120ec9eabcSRichard Henderson 813c0522136SRichard Henderson /* No constant temps have been previously allocated. 
*/ 814c0522136SRichard Henderson for (int i = 0; i < TCG_TYPE_COUNT; ++i) { 815c0522136SRichard Henderson if (s->const_table[i]) { 816c0522136SRichard Henderson g_hash_table_remove_all(s->const_table[i]); 817c0522136SRichard Henderson } 818c0522136SRichard Henderson } 819c0522136SRichard Henderson 820abebf925SRichard Henderson s->nb_ops = 0; 821c896fe29Sbellard s->nb_labels = 0; 822c896fe29Sbellard s->current_frame_offset = s->frame_start; 823c896fe29Sbellard 8240a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 8250a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 8260a209d4bSRichard Henderson #endif 8270a209d4bSRichard Henderson 82815fa08f8SRichard Henderson QTAILQ_INIT(&s->ops); 82915fa08f8SRichard Henderson QTAILQ_INIT(&s->free_ops); 830bef16ab4SRichard Henderson QSIMPLEQ_INIT(&s->labels); 831c896fe29Sbellard } 832c896fe29Sbellard 833ae30e866SRichard Henderson static TCGTemp *tcg_temp_alloc(TCGContext *s) 8347ca4b752SRichard Henderson { 8357ca4b752SRichard Henderson int n = s->nb_temps++; 836ae30e866SRichard Henderson 837ae30e866SRichard Henderson if (n >= TCG_MAX_TEMPS) { 838db6b7d0cSRichard Henderson tcg_raise_tb_overflow(s); 839ae30e866SRichard Henderson } 8407ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 8417ca4b752SRichard Henderson } 8427ca4b752SRichard Henderson 843ae30e866SRichard Henderson static TCGTemp *tcg_global_alloc(TCGContext *s) 8447ca4b752SRichard Henderson { 845fa477d25SRichard Henderson TCGTemp *ts; 846fa477d25SRichard Henderson 8477ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 848ae30e866SRichard Henderson tcg_debug_assert(s->nb_globals < TCG_MAX_TEMPS); 8497ca4b752SRichard Henderson s->nb_globals++; 850fa477d25SRichard Henderson ts = tcg_temp_alloc(s); 851ee17db83SRichard Henderson ts->kind = TEMP_GLOBAL; 852fa477d25SRichard Henderson 853fa477d25SRichard Henderson return ts; 854c896fe29Sbellard } 855c896fe29Sbellard 856085272b3SRichard Henderson static TCGTemp 
*tcg_global_reg_new_internal(TCGContext *s, TCGType type, 857b6638662SRichard Henderson TCGReg reg, const char *name) 858c896fe29Sbellard { 859c896fe29Sbellard TCGTemp *ts; 860c896fe29Sbellard 861b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 862c896fe29Sbellard tcg_abort(); 863b3a62939SRichard Henderson } 8647ca4b752SRichard Henderson 8657ca4b752SRichard Henderson ts = tcg_global_alloc(s); 866c896fe29Sbellard ts->base_type = type; 867c896fe29Sbellard ts->type = type; 868ee17db83SRichard Henderson ts->kind = TEMP_FIXED; 869c896fe29Sbellard ts->reg = reg; 870c896fe29Sbellard ts->name = name; 871c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 8727ca4b752SRichard Henderson 873085272b3SRichard Henderson return ts; 874a7812ae4Spbrook } 875a7812ae4Spbrook 876b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 877a7812ae4Spbrook { 878b3a62939SRichard Henderson s->frame_start = start; 879b3a62939SRichard Henderson s->frame_end = start + size; 880085272b3SRichard Henderson s->frame_temp 881085272b3SRichard Henderson = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 882b3a62939SRichard Henderson } 883a7812ae4Spbrook 884085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 885e1ccc054SRichard Henderson intptr_t offset, const char *name) 886c896fe29Sbellard { 887b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 888dc41aa7dSRichard Henderson TCGTemp *base_ts = tcgv_ptr_temp(base); 8897ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 890aef85402SRichard Henderson int indirect_reg = 0; 891c896fe29Sbellard 892c0522136SRichard Henderson switch (base_ts->kind) { 893c0522136SRichard Henderson case TEMP_FIXED: 894c0522136SRichard Henderson break; 895c0522136SRichard Henderson case TEMP_GLOBAL: 8965a18407fSRichard Henderson /* We do not support double-indirect registers. 
*/ 8975a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 898b3915dbbSRichard Henderson base_ts->indirect_base = 1; 8995a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 9005a18407fSRichard Henderson ? 2 : 1); 9015a18407fSRichard Henderson indirect_reg = 1; 902c0522136SRichard Henderson break; 903c0522136SRichard Henderson default: 904c0522136SRichard Henderson g_assert_not_reached(); 905b3915dbbSRichard Henderson } 906b3915dbbSRichard Henderson 9077ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 9087ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 909c896fe29Sbellard char buf[64]; 9107ca4b752SRichard Henderson 9117ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 912c896fe29Sbellard ts->type = TCG_TYPE_I32; 913b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 914c896fe29Sbellard ts->mem_allocated = 1; 915b3a62939SRichard Henderson ts->mem_base = base_ts; 916aef85402SRichard Henderson ts->mem_offset = offset; 917c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 918c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 919c896fe29Sbellard ts->name = strdup(buf); 920c896fe29Sbellard 9217ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 9227ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 9237ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 924b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 9257ca4b752SRichard Henderson ts2->mem_allocated = 1; 9267ca4b752SRichard Henderson ts2->mem_base = base_ts; 927aef85402SRichard Henderson ts2->mem_offset = offset + 4; 928fac87bd2SRichard Henderson ts2->temp_subindex = 1; 929c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 930c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 931120c1084SRichard Henderson ts2->name = strdup(buf); 9327ca4b752SRichard Henderson } else { 933c896fe29Sbellard ts->base_type = type; 934c896fe29Sbellard ts->type = type; 935b3915dbbSRichard Henderson 
ts->indirect_reg = indirect_reg; 936c896fe29Sbellard ts->mem_allocated = 1; 937b3a62939SRichard Henderson ts->mem_base = base_ts; 938c896fe29Sbellard ts->mem_offset = offset; 939c896fe29Sbellard ts->name = name; 940c896fe29Sbellard } 941085272b3SRichard Henderson return ts; 942c896fe29Sbellard } 943c896fe29Sbellard 9445bfa8034SRichard Henderson TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local) 945c896fe29Sbellard { 946b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 947ee17db83SRichard Henderson TCGTempKind kind = temp_local ? TEMP_LOCAL : TEMP_NORMAL; 948c896fe29Sbellard TCGTemp *ts; 949641d5fbeSbellard int idx, k; 950c896fe29Sbellard 9510ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 9520ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 9530ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 9540ec9eabcSRichard Henderson /* There is already an available temp with the right type. */ 9550ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 9560ec9eabcSRichard Henderson 957e8996ee0Sbellard ts = &s->temps[idx]; 958e8996ee0Sbellard ts->temp_allocated = 1; 9597ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 960ee17db83SRichard Henderson tcg_debug_assert(ts->kind == kind); 961e8996ee0Sbellard } else { 9627ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 9637ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 9647ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 9657ca4b752SRichard Henderson 966c896fe29Sbellard ts->base_type = type; 967c896fe29Sbellard ts->type = TCG_TYPE_I32; 968e8996ee0Sbellard ts->temp_allocated = 1; 969ee17db83SRichard Henderson ts->kind = kind; 9707ca4b752SRichard Henderson 9717ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 9727ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 9737ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 9747ca4b752SRichard Henderson ts2->temp_allocated = 1; 
975fac87bd2SRichard Henderson ts2->temp_subindex = 1; 976ee17db83SRichard Henderson ts2->kind = kind; 9777ca4b752SRichard Henderson } else { 978c896fe29Sbellard ts->base_type = type; 979c896fe29Sbellard ts->type = type; 980e8996ee0Sbellard ts->temp_allocated = 1; 981ee17db83SRichard Henderson ts->kind = kind; 982c896fe29Sbellard } 983e8996ee0Sbellard } 98427bfd83cSPeter Maydell 98527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 98627bfd83cSPeter Maydell s->temps_in_use++; 98727bfd83cSPeter Maydell #endif 988085272b3SRichard Henderson return ts; 989c896fe29Sbellard } 990c896fe29Sbellard 991d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type) 992d2fd745fSRichard Henderson { 993d2fd745fSRichard Henderson TCGTemp *t; 994d2fd745fSRichard Henderson 995d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG 996d2fd745fSRichard Henderson switch (type) { 997d2fd745fSRichard Henderson case TCG_TYPE_V64: 998d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v64); 999d2fd745fSRichard Henderson break; 1000d2fd745fSRichard Henderson case TCG_TYPE_V128: 1001d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v128); 1002d2fd745fSRichard Henderson break; 1003d2fd745fSRichard Henderson case TCG_TYPE_V256: 1004d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v256); 1005d2fd745fSRichard Henderson break; 1006d2fd745fSRichard Henderson default: 1007d2fd745fSRichard Henderson g_assert_not_reached(); 1008d2fd745fSRichard Henderson } 1009d2fd745fSRichard Henderson #endif 1010d2fd745fSRichard Henderson 1011d2fd745fSRichard Henderson t = tcg_temp_new_internal(type, 0); 1012d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1013d2fd745fSRichard Henderson } 1014d2fd745fSRichard Henderson 1015d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp. 
*/ 1016d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match) 1017d2fd745fSRichard Henderson { 1018d2fd745fSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 1019d2fd745fSRichard Henderson 1020d2fd745fSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 1021d2fd745fSRichard Henderson 1022d2fd745fSRichard Henderson t = tcg_temp_new_internal(t->base_type, 0); 1023d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1024d2fd745fSRichard Henderson } 1025d2fd745fSRichard Henderson 10265bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts) 1027c896fe29Sbellard { 1028b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 1029085272b3SRichard Henderson int k, idx; 1030c896fe29Sbellard 1031c7482438SRichard Henderson switch (ts->kind) { 1032c7482438SRichard Henderson case TEMP_CONST: 1033c7482438SRichard Henderson /* 1034c7482438SRichard Henderson * In order to simplify users of tcg_constant_*, 1035c7482438SRichard Henderson * silently ignore free. 1036c7482438SRichard Henderson */ 1037c0522136SRichard Henderson return; 1038c7482438SRichard Henderson case TEMP_NORMAL: 1039c7482438SRichard Henderson case TEMP_LOCAL: 1040c7482438SRichard Henderson break; 1041c7482438SRichard Henderson default: 1042c7482438SRichard Henderson g_assert_not_reached(); 1043c0522136SRichard Henderson } 1044c0522136SRichard Henderson 104527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 104627bfd83cSPeter Maydell s->temps_in_use--; 104727bfd83cSPeter Maydell if (s->temps_in_use < 0) { 104827bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 104927bfd83cSPeter Maydell } 105027bfd83cSPeter Maydell #endif 105127bfd83cSPeter Maydell 1052eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 1053e8996ee0Sbellard ts->temp_allocated = 0; 10540ec9eabcSRichard Henderson 1055085272b3SRichard Henderson idx = temp_idx(ts); 1056ee17db83SRichard Henderson k = ts->base_type + (ts->kind == TEMP_NORMAL ? 
0 : TCG_TYPE_COUNT); 10570ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 1058e8996ee0Sbellard } 1059e8996ee0Sbellard 1060c0522136SRichard Henderson TCGTemp *tcg_constant_internal(TCGType type, int64_t val) 1061c0522136SRichard Henderson { 1062c0522136SRichard Henderson TCGContext *s = tcg_ctx; 1063c0522136SRichard Henderson GHashTable *h = s->const_table[type]; 1064c0522136SRichard Henderson TCGTemp *ts; 1065c0522136SRichard Henderson 1066c0522136SRichard Henderson if (h == NULL) { 1067c0522136SRichard Henderson h = g_hash_table_new(g_int64_hash, g_int64_equal); 1068c0522136SRichard Henderson s->const_table[type] = h; 1069c0522136SRichard Henderson } 1070c0522136SRichard Henderson 1071c0522136SRichard Henderson ts = g_hash_table_lookup(h, &val); 1072c0522136SRichard Henderson if (ts == NULL) { 1073aef85402SRichard Henderson int64_t *val_ptr; 1074aef85402SRichard Henderson 1075c0522136SRichard Henderson ts = tcg_temp_alloc(s); 1076c0522136SRichard Henderson 1077c0522136SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 1078c0522136SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 1079c0522136SRichard Henderson 1080aef85402SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 1081aef85402SRichard Henderson 1082c0522136SRichard Henderson ts->base_type = TCG_TYPE_I64; 1083c0522136SRichard Henderson ts->type = TCG_TYPE_I32; 1084c0522136SRichard Henderson ts->kind = TEMP_CONST; 1085c0522136SRichard Henderson ts->temp_allocated = 1; 1086c0522136SRichard Henderson 1087c0522136SRichard Henderson ts2->base_type = TCG_TYPE_I64; 1088c0522136SRichard Henderson ts2->type = TCG_TYPE_I32; 1089c0522136SRichard Henderson ts2->kind = TEMP_CONST; 1090c0522136SRichard Henderson ts2->temp_allocated = 1; 1091fac87bd2SRichard Henderson ts2->temp_subindex = 1; 1092aef85402SRichard Henderson 1093aef85402SRichard Henderson /* 1094aef85402SRichard Henderson * Retain the full value of the 64-bit constant in the low 1095aef85402SRichard Henderson * part, 
so that the hash table works. Actual uses will 1096aef85402SRichard Henderson * truncate the value to the low part. 1097aef85402SRichard Henderson */ 1098aef85402SRichard Henderson ts[HOST_BIG_ENDIAN].val = val; 1099aef85402SRichard Henderson ts[!HOST_BIG_ENDIAN].val = val >> 32; 1100aef85402SRichard Henderson val_ptr = &ts[HOST_BIG_ENDIAN].val; 1101c0522136SRichard Henderson } else { 1102c0522136SRichard Henderson ts->base_type = type; 1103c0522136SRichard Henderson ts->type = type; 1104c0522136SRichard Henderson ts->kind = TEMP_CONST; 1105c0522136SRichard Henderson ts->temp_allocated = 1; 1106c0522136SRichard Henderson ts->val = val; 1107aef85402SRichard Henderson val_ptr = &ts->val; 1108c0522136SRichard Henderson } 1109aef85402SRichard Henderson g_hash_table_insert(h, val_ptr, ts); 1110c0522136SRichard Henderson } 1111c0522136SRichard Henderson 1112c0522136SRichard Henderson return ts; 1113c0522136SRichard Henderson } 1114c0522136SRichard Henderson 1115c0522136SRichard Henderson TCGv_vec tcg_constant_vec(TCGType type, unsigned vece, int64_t val) 1116c0522136SRichard Henderson { 1117c0522136SRichard Henderson val = dup_const(vece, val); 1118c0522136SRichard Henderson return temp_tcgv_vec(tcg_constant_internal(type, val)); 1119c0522136SRichard Henderson } 1120c0522136SRichard Henderson 112188d4005bSRichard Henderson TCGv_vec tcg_constant_vec_matching(TCGv_vec match, unsigned vece, int64_t val) 112288d4005bSRichard Henderson { 112388d4005bSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 112488d4005bSRichard Henderson 112588d4005bSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 112688d4005bSRichard Henderson return tcg_constant_vec(t->base_type, vece, val); 112788d4005bSRichard Henderson } 112888d4005bSRichard Henderson 1129a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 1130a7812ae4Spbrook { 1131a7812ae4Spbrook TCGv_i32 t0; 1132a7812ae4Spbrook t0 = tcg_temp_new_i32(); 1133e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 1134e8996ee0Sbellard return 
t0; 1135c896fe29Sbellard } 1136c896fe29Sbellard 1137a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 1138c896fe29Sbellard { 1139a7812ae4Spbrook TCGv_i64 t0; 1140a7812ae4Spbrook t0 = tcg_temp_new_i64(); 1141e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 1142e8996ee0Sbellard return t0; 1143c896fe29Sbellard } 1144c896fe29Sbellard 1145a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 1146bdffd4a9Saurel32 { 1147a7812ae4Spbrook TCGv_i32 t0; 1148a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 1149bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 1150bdffd4a9Saurel32 return t0; 1151bdffd4a9Saurel32 } 1152bdffd4a9Saurel32 1153a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 1154bdffd4a9Saurel32 { 1155a7812ae4Spbrook TCGv_i64 t0; 1156a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 1157bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 1158bdffd4a9Saurel32 return t0; 1159bdffd4a9Saurel32 } 1160bdffd4a9Saurel32 116127bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 116227bfd83cSPeter Maydell void tcg_clear_temp_count(void) 116327bfd83cSPeter Maydell { 1164b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 116527bfd83cSPeter Maydell s->temps_in_use = 0; 116627bfd83cSPeter Maydell } 116727bfd83cSPeter Maydell 116827bfd83cSPeter Maydell int tcg_check_temp_count(void) 116927bfd83cSPeter Maydell { 1170b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 117127bfd83cSPeter Maydell if (s->temps_in_use) { 117227bfd83cSPeter Maydell /* Clear the count so that we don't give another 117327bfd83cSPeter Maydell * warning immediately next time around. 117427bfd83cSPeter Maydell */ 117527bfd83cSPeter Maydell s->temps_in_use = 0; 117627bfd83cSPeter Maydell return 1; 117727bfd83cSPeter Maydell } 117827bfd83cSPeter Maydell return 0; 117927bfd83cSPeter Maydell } 118027bfd83cSPeter Maydell #endif 118127bfd83cSPeter Maydell 1182be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream. 1183be0f34b5SRichard Henderson Test the runtime variable that controls each opcode. 
*/ 1184be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 1185be0f34b5SRichard Henderson { 1186d2fd745fSRichard Henderson const bool have_vec 1187d2fd745fSRichard Henderson = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256; 1188d2fd745fSRichard Henderson 1189be0f34b5SRichard Henderson switch (op) { 1190be0f34b5SRichard Henderson case INDEX_op_discard: 1191be0f34b5SRichard Henderson case INDEX_op_set_label: 1192be0f34b5SRichard Henderson case INDEX_op_call: 1193be0f34b5SRichard Henderson case INDEX_op_br: 1194be0f34b5SRichard Henderson case INDEX_op_mb: 1195be0f34b5SRichard Henderson case INDEX_op_insn_start: 1196be0f34b5SRichard Henderson case INDEX_op_exit_tb: 1197be0f34b5SRichard Henderson case INDEX_op_goto_tb: 1198f4e01e30SRichard Henderson case INDEX_op_goto_ptr: 1199be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 1200be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 1201be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 1202be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 1203be0f34b5SRichard Henderson return true; 1204be0f34b5SRichard Henderson 120507ce0b05SRichard Henderson case INDEX_op_qemu_st8_i32: 120607ce0b05SRichard Henderson return TCG_TARGET_HAS_qemu_st8_i32; 120707ce0b05SRichard Henderson 1208be0f34b5SRichard Henderson case INDEX_op_mov_i32: 1209be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 1210be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 1211be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 1212be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 1213be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 1214be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 1215be0f34b5SRichard Henderson case INDEX_op_ld_i32: 1216be0f34b5SRichard Henderson case INDEX_op_st8_i32: 1217be0f34b5SRichard Henderson case INDEX_op_st16_i32: 1218be0f34b5SRichard Henderson case INDEX_op_st_i32: 1219be0f34b5SRichard Henderson case INDEX_op_add_i32: 1220be0f34b5SRichard Henderson case INDEX_op_sub_i32: 
1221be0f34b5SRichard Henderson case INDEX_op_mul_i32: 1222be0f34b5SRichard Henderson case INDEX_op_and_i32: 1223be0f34b5SRichard Henderson case INDEX_op_or_i32: 1224be0f34b5SRichard Henderson case INDEX_op_xor_i32: 1225be0f34b5SRichard Henderson case INDEX_op_shl_i32: 1226be0f34b5SRichard Henderson case INDEX_op_shr_i32: 1227be0f34b5SRichard Henderson case INDEX_op_sar_i32: 1228be0f34b5SRichard Henderson return true; 1229be0f34b5SRichard Henderson 1230be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 1231be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 1232be0f34b5SRichard Henderson case INDEX_op_div_i32: 1233be0f34b5SRichard Henderson case INDEX_op_divu_i32: 1234be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 1235be0f34b5SRichard Henderson case INDEX_op_rem_i32: 1236be0f34b5SRichard Henderson case INDEX_op_remu_i32: 1237be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 1238be0f34b5SRichard Henderson case INDEX_op_div2_i32: 1239be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 1240be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 1241be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 1242be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 1243be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 1244be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 1245be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 1246be0f34b5SRichard Henderson case INDEX_op_extract_i32: 1247be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 1248be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 1249be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 1250fce1296fSRichard Henderson case INDEX_op_extract2_i32: 1251fce1296fSRichard Henderson return TCG_TARGET_HAS_extract2_i32; 1252be0f34b5SRichard Henderson case INDEX_op_add2_i32: 1253be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 1254be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 1255be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 
1256be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 1257be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 1258be0f34b5SRichard Henderson case INDEX_op_muls2_i32: 1259be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 1260be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 1261be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 1262be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 1263be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 1264be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 1265be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 1266be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 1267be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 1268be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 1269be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 1270be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 1271be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 1272be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 1273be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 1274be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 1275be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 1276be0f34b5SRichard Henderson case INDEX_op_not_i32: 1277be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 1278be0f34b5SRichard Henderson case INDEX_op_neg_i32: 1279be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 1280be0f34b5SRichard Henderson case INDEX_op_andc_i32: 1281be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 1282be0f34b5SRichard Henderson case INDEX_op_orc_i32: 1283be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 1284be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 1285be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 1286be0f34b5SRichard Henderson case INDEX_op_nand_i32: 1287be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 1288be0f34b5SRichard Henderson case INDEX_op_nor_i32: 1289be0f34b5SRichard Henderson 
return TCG_TARGET_HAS_nor_i32; 1290be0f34b5SRichard Henderson case INDEX_op_clz_i32: 1291be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i32; 1292be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 1293be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 1294be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 1295be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 1296be0f34b5SRichard Henderson 1297be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 1298be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 1299be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 1300be0f34b5SRichard Henderson 1301be0f34b5SRichard Henderson case INDEX_op_mov_i64: 1302be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 1303be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 1304be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 1305be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 1306be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 1307be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 1308be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 1309be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 1310be0f34b5SRichard Henderson case INDEX_op_ld_i64: 1311be0f34b5SRichard Henderson case INDEX_op_st8_i64: 1312be0f34b5SRichard Henderson case INDEX_op_st16_i64: 1313be0f34b5SRichard Henderson case INDEX_op_st32_i64: 1314be0f34b5SRichard Henderson case INDEX_op_st_i64: 1315be0f34b5SRichard Henderson case INDEX_op_add_i64: 1316be0f34b5SRichard Henderson case INDEX_op_sub_i64: 1317be0f34b5SRichard Henderson case INDEX_op_mul_i64: 1318be0f34b5SRichard Henderson case INDEX_op_and_i64: 1319be0f34b5SRichard Henderson case INDEX_op_or_i64: 1320be0f34b5SRichard Henderson case INDEX_op_xor_i64: 1321be0f34b5SRichard Henderson case INDEX_op_shl_i64: 1322be0f34b5SRichard Henderson case INDEX_op_shr_i64: 1323be0f34b5SRichard Henderson case INDEX_op_sar_i64: 1324be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 1325be0f34b5SRichard Henderson case 
INDEX_op_extu_i32_i64: 1326be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 1327be0f34b5SRichard Henderson 1328be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 1329be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 1330be0f34b5SRichard Henderson case INDEX_op_div_i64: 1331be0f34b5SRichard Henderson case INDEX_op_divu_i64: 1332be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 1333be0f34b5SRichard Henderson case INDEX_op_rem_i64: 1334be0f34b5SRichard Henderson case INDEX_op_remu_i64: 1335be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 1336be0f34b5SRichard Henderson case INDEX_op_div2_i64: 1337be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 1338be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 1339be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 1340be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 1341be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 1342be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 1343be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 1344be0f34b5SRichard Henderson case INDEX_op_extract_i64: 1345be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 1346be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 1347be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 1348fce1296fSRichard Henderson case INDEX_op_extract2_i64: 1349fce1296fSRichard Henderson return TCG_TARGET_HAS_extract2_i64; 1350be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 1351be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 1352be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 1353be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 1354be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 1355be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 1356be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 1357be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i64; 1358be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 
1359be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 1360be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 1361be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 1362be0f34b5SRichard Henderson case INDEX_op_ext16u_i64: 1363be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 1364be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 1365be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 1366be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 1367be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 1368be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 1369be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 1370be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 1371be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 1372be0f34b5SRichard Henderson case INDEX_op_not_i64: 1373be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 1374be0f34b5SRichard Henderson case INDEX_op_neg_i64: 1375be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 1376be0f34b5SRichard Henderson case INDEX_op_andc_i64: 1377be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 1378be0f34b5SRichard Henderson case INDEX_op_orc_i64: 1379be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 1380be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 1381be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 1382be0f34b5SRichard Henderson case INDEX_op_nand_i64: 1383be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 1384be0f34b5SRichard Henderson case INDEX_op_nor_i64: 1385be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 1386be0f34b5SRichard Henderson case INDEX_op_clz_i64: 1387be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 1388be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 1389be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 1390be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 1391be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 1392be0f34b5SRichard Henderson 
case INDEX_op_add2_i64: 1393be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 1394be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 1395be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 1396be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 1397be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 1398be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 1399be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 1400be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 1401be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 1402be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 1403be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 1404be0f34b5SRichard Henderson 1405d2fd745fSRichard Henderson case INDEX_op_mov_vec: 1406d2fd745fSRichard Henderson case INDEX_op_dup_vec: 140737ee55a0SRichard Henderson case INDEX_op_dupm_vec: 1408d2fd745fSRichard Henderson case INDEX_op_ld_vec: 1409d2fd745fSRichard Henderson case INDEX_op_st_vec: 1410d2fd745fSRichard Henderson case INDEX_op_add_vec: 1411d2fd745fSRichard Henderson case INDEX_op_sub_vec: 1412d2fd745fSRichard Henderson case INDEX_op_and_vec: 1413d2fd745fSRichard Henderson case INDEX_op_or_vec: 1414d2fd745fSRichard Henderson case INDEX_op_xor_vec: 1415212be173SRichard Henderson case INDEX_op_cmp_vec: 1416d2fd745fSRichard Henderson return have_vec; 1417d2fd745fSRichard Henderson case INDEX_op_dup2_vec: 1418d2fd745fSRichard Henderson return have_vec && TCG_TARGET_REG_BITS == 32; 1419d2fd745fSRichard Henderson case INDEX_op_not_vec: 1420d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_not_vec; 1421d2fd745fSRichard Henderson case INDEX_op_neg_vec: 1422d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_neg_vec; 1423bcefc902SRichard Henderson case INDEX_op_abs_vec: 1424bcefc902SRichard Henderson return have_vec && TCG_TARGET_HAS_abs_vec; 1425d2fd745fSRichard Henderson case INDEX_op_andc_vec: 1426d2fd745fSRichard Henderson return have_vec && 
TCG_TARGET_HAS_andc_vec; 1427d2fd745fSRichard Henderson case INDEX_op_orc_vec: 1428d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_orc_vec; 1429ed523473SRichard Henderson case INDEX_op_nand_vec: 1430ed523473SRichard Henderson return have_vec && TCG_TARGET_HAS_nand_vec; 1431ed523473SRichard Henderson case INDEX_op_nor_vec: 1432ed523473SRichard Henderson return have_vec && TCG_TARGET_HAS_nor_vec; 1433ed523473SRichard Henderson case INDEX_op_eqv_vec: 1434ed523473SRichard Henderson return have_vec && TCG_TARGET_HAS_eqv_vec; 14353774030aSRichard Henderson case INDEX_op_mul_vec: 14363774030aSRichard Henderson return have_vec && TCG_TARGET_HAS_mul_vec; 1437d0ec9796SRichard Henderson case INDEX_op_shli_vec: 1438d0ec9796SRichard Henderson case INDEX_op_shri_vec: 1439d0ec9796SRichard Henderson case INDEX_op_sari_vec: 1440d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shi_vec; 1441d0ec9796SRichard Henderson case INDEX_op_shls_vec: 1442d0ec9796SRichard Henderson case INDEX_op_shrs_vec: 1443d0ec9796SRichard Henderson case INDEX_op_sars_vec: 1444d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shs_vec; 1445d0ec9796SRichard Henderson case INDEX_op_shlv_vec: 1446d0ec9796SRichard Henderson case INDEX_op_shrv_vec: 1447d0ec9796SRichard Henderson case INDEX_op_sarv_vec: 1448d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shv_vec; 1449b0f7e744SRichard Henderson case INDEX_op_rotli_vec: 1450b0f7e744SRichard Henderson return have_vec && TCG_TARGET_HAS_roti_vec; 145123850a74SRichard Henderson case INDEX_op_rotls_vec: 145223850a74SRichard Henderson return have_vec && TCG_TARGET_HAS_rots_vec; 14535d0ceda9SRichard Henderson case INDEX_op_rotlv_vec: 14545d0ceda9SRichard Henderson case INDEX_op_rotrv_vec: 14555d0ceda9SRichard Henderson return have_vec && TCG_TARGET_HAS_rotv_vec; 14568afaf050SRichard Henderson case INDEX_op_ssadd_vec: 14578afaf050SRichard Henderson case INDEX_op_usadd_vec: 14588afaf050SRichard Henderson case 
INDEX_op_sssub_vec: 14598afaf050SRichard Henderson case INDEX_op_ussub_vec: 14608afaf050SRichard Henderson return have_vec && TCG_TARGET_HAS_sat_vec; 1461dd0a0fcdSRichard Henderson case INDEX_op_smin_vec: 1462dd0a0fcdSRichard Henderson case INDEX_op_umin_vec: 1463dd0a0fcdSRichard Henderson case INDEX_op_smax_vec: 1464dd0a0fcdSRichard Henderson case INDEX_op_umax_vec: 1465dd0a0fcdSRichard Henderson return have_vec && TCG_TARGET_HAS_minmax_vec; 146638dc1294SRichard Henderson case INDEX_op_bitsel_vec: 146738dc1294SRichard Henderson return have_vec && TCG_TARGET_HAS_bitsel_vec; 1468f75da298SRichard Henderson case INDEX_op_cmpsel_vec: 1469f75da298SRichard Henderson return have_vec && TCG_TARGET_HAS_cmpsel_vec; 1470d2fd745fSRichard Henderson 1471db432672SRichard Henderson default: 1472db432672SRichard Henderson tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS); 1473db432672SRichard Henderson return true; 1474be0f34b5SRichard Henderson } 1475be0f34b5SRichard Henderson } 1476be0f34b5SRichard Henderson 147739cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 147839cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 147939cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 1480ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args) 1481c896fe29Sbellard { 148275e8b9b7SRichard Henderson int i, real_args, nb_rets, pi; 14833e92aa34SRichard Henderson unsigned typemask; 14843e92aa34SRichard Henderson const TCGHelperInfo *info; 148575e8b9b7SRichard Henderson TCGOp *op; 1486afb49896SRichard Henderson 1487619205fdSEmilio G. Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 14887319d83aSRichard Henderson typemask = info->typemask; 14892bece2c8SRichard Henderson 149038b47b19SEmilio G. Cota #ifdef CONFIG_PLUGIN 149138b47b19SEmilio G. Cota /* detect non-plugin helpers */ 149238b47b19SEmilio G. 
Cota if (tcg_ctx->plugin_insn && unlikely(strncmp(info->name, "plugin_", 7))) { 149338b47b19SEmilio G. Cota tcg_ctx->plugin_insn->calls_helpers = true; 149438b47b19SEmilio G. Cota } 149538b47b19SEmilio G. Cota #endif 149638b47b19SEmilio G. Cota 1497eb8b0224SRichard Henderson if (TCG_TARGET_CALL_ARG_I32 == TCG_CALL_ARG_EXTEND) { 14982bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 14997319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 15007319d83aSRichard Henderson bool is_32bit = (argtype & ~1) == dh_typecode_i32; 15017319d83aSRichard Henderson bool is_signed = argtype & 1; 15027319d83aSRichard Henderson 15037319d83aSRichard Henderson if (is_32bit) { 15042bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 150518cf3d07SRichard Henderson TCGv_i32 orig = temp_tcgv_i32(args[i]); 15062bece2c8SRichard Henderson if (is_signed) { 150718cf3d07SRichard Henderson tcg_gen_ext_i32_i64(temp, orig); 15082bece2c8SRichard Henderson } else { 150918cf3d07SRichard Henderson tcg_gen_extu_i32_i64(temp, orig); 15102bece2c8SRichard Henderson } 1511ae8b75dcSRichard Henderson args[i] = tcgv_i64_temp(temp); 15122bece2c8SRichard Henderson } 15132bece2c8SRichard Henderson } 1514eb8b0224SRichard Henderson } 15152bece2c8SRichard Henderson 151615fa08f8SRichard Henderson op = tcg_emit_op(INDEX_op_call); 151775e8b9b7SRichard Henderson 151875e8b9b7SRichard Henderson pi = 0; 1519ae8b75dcSRichard Henderson if (ret != NULL) { 15207319d83aSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (typemask & 6) == dh_typecode_i64) { 1521ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1522ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1523a7812ae4Spbrook nb_rets = 2; 152434b1a49cSRichard Henderson } else { 1525ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1526a7812ae4Spbrook nb_rets = 1; 1527a7812ae4Spbrook } 1528a7812ae4Spbrook } else { 1529a7812ae4Spbrook nb_rets = 0; 1530a7812ae4Spbrook } 1531cd9090aaSRichard Henderson 
TCGOP_CALLO(op) = nb_rets; 153275e8b9b7SRichard Henderson 1533a7812ae4Spbrook real_args = 0; 1534a7812ae4Spbrook for (i = 0; i < nargs; i++) { 15357319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 1536*e2a9dd6bSRichard Henderson TCGCallArgumentKind kind; 1537*e2a9dd6bSRichard Henderson TCGType type; 15387319d83aSRichard Henderson 1539*e2a9dd6bSRichard Henderson switch (argtype) { 1540*e2a9dd6bSRichard Henderson case dh_typecode_i32: 1541*e2a9dd6bSRichard Henderson case dh_typecode_s32: 1542*e2a9dd6bSRichard Henderson type = TCG_TYPE_I32; 1543*e2a9dd6bSRichard Henderson break; 1544*e2a9dd6bSRichard Henderson case dh_typecode_i64: 1545*e2a9dd6bSRichard Henderson case dh_typecode_s64: 1546*e2a9dd6bSRichard Henderson type = TCG_TYPE_I64; 1547*e2a9dd6bSRichard Henderson break; 1548*e2a9dd6bSRichard Henderson case dh_typecode_ptr: 1549*e2a9dd6bSRichard Henderson type = TCG_TYPE_PTR; 1550*e2a9dd6bSRichard Henderson break; 1551*e2a9dd6bSRichard Henderson default: 1552*e2a9dd6bSRichard Henderson g_assert_not_reached(); 1553c8eef960SRichard Henderson } 15547b7d8b2dSRichard Henderson 1555*e2a9dd6bSRichard Henderson switch (type) { 1556*e2a9dd6bSRichard Henderson case TCG_TYPE_I32: 1557*e2a9dd6bSRichard Henderson kind = TCG_TARGET_CALL_ARG_I32; 1558*e2a9dd6bSRichard Henderson break; 1559*e2a9dd6bSRichard Henderson case TCG_TYPE_I64: 1560*e2a9dd6bSRichard Henderson kind = TCG_TARGET_CALL_ARG_I64; 1561*e2a9dd6bSRichard Henderson break; 1562*e2a9dd6bSRichard Henderson default: 1563*e2a9dd6bSRichard Henderson g_assert_not_reached(); 1564*e2a9dd6bSRichard Henderson } 1565*e2a9dd6bSRichard Henderson 1566*e2a9dd6bSRichard Henderson switch (kind) { 1567*e2a9dd6bSRichard Henderson case TCG_CALL_ARG_EVEN: 1568*e2a9dd6bSRichard Henderson if (real_args & 1) { 156975e8b9b7SRichard Henderson op->args[pi++] = TCG_CALL_DUMMY_ARG; 1570ebd486d5Smalc real_args++; 157139cf05d3Sbellard } 1572*e2a9dd6bSRichard Henderson /* fall through */ 1573*e2a9dd6bSRichard Henderson 
case TCG_CALL_ARG_NORMAL: 1574*e2a9dd6bSRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 1575aef85402SRichard Henderson op->args[pi++] = temp_arg(args[i]); 1576aef85402SRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1577a7812ae4Spbrook real_args += 2; 1578*e2a9dd6bSRichard Henderson break; 15792bece2c8SRichard Henderson } 1580ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1581a7812ae4Spbrook real_args++; 1582*e2a9dd6bSRichard Henderson break; 1583*e2a9dd6bSRichard Henderson default: 1584*e2a9dd6bSRichard Henderson g_assert_not_reached(); 1585*e2a9dd6bSRichard Henderson } 1586c896fe29Sbellard } 158775e8b9b7SRichard Henderson op->args[pi++] = (uintptr_t)func; 15883e92aa34SRichard Henderson op->args[pi++] = (uintptr_t)info; 1589cd9090aaSRichard Henderson TCGOP_CALLI(op) = real_args; 1590a7812ae4Spbrook 159175e8b9b7SRichard Henderson /* Make sure the fields didn't overflow. */ 1592cd9090aaSRichard Henderson tcg_debug_assert(TCGOP_CALLI(op) == real_args); 159375e8b9b7SRichard Henderson tcg_debug_assert(pi <= ARRAY_SIZE(op->args)); 15942bece2c8SRichard Henderson 1595eb8b0224SRichard Henderson if (TCG_TARGET_CALL_ARG_I32 == TCG_CALL_ARG_EXTEND) { 15962bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 15977319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 15987319d83aSRichard Henderson bool is_32bit = (argtype & ~1) == dh_typecode_i32; 15997319d83aSRichard Henderson 16007319d83aSRichard Henderson if (is_32bit) { 1601085272b3SRichard Henderson tcg_temp_free_internal(args[i]); 16022bece2c8SRichard Henderson } 16032bece2c8SRichard Henderson } 1604eb8b0224SRichard Henderson } 1605a7812ae4Spbrook } 1606c896fe29Sbellard 16078fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1608c896fe29Sbellard { 1609ac3b8891SRichard Henderson int i, n; 1610ac3b8891SRichard Henderson 1611ee17db83SRichard Henderson for (i = 0, n = s->nb_temps; i < n; i++) { 1612ee17db83SRichard Henderson TCGTemp 
*ts = &s->temps[i]; 1613ee17db83SRichard Henderson TCGTempVal val = TEMP_VAL_MEM; 1614ee17db83SRichard Henderson 1615ee17db83SRichard Henderson switch (ts->kind) { 1616c0522136SRichard Henderson case TEMP_CONST: 1617c0522136SRichard Henderson val = TEMP_VAL_CONST; 1618c0522136SRichard Henderson break; 1619ee17db83SRichard Henderson case TEMP_FIXED: 1620ee17db83SRichard Henderson val = TEMP_VAL_REG; 1621ee17db83SRichard Henderson break; 1622ee17db83SRichard Henderson case TEMP_GLOBAL: 1623ee17db83SRichard Henderson break; 1624ee17db83SRichard Henderson case TEMP_NORMAL: 1625c7482438SRichard Henderson case TEMP_EBB: 1626ee17db83SRichard Henderson val = TEMP_VAL_DEAD; 1627ee17db83SRichard Henderson /* fall through */ 1628ee17db83SRichard Henderson case TEMP_LOCAL: 1629e8996ee0Sbellard ts->mem_allocated = 0; 1630ee17db83SRichard Henderson break; 1631ee17db83SRichard Henderson default: 1632ee17db83SRichard Henderson g_assert_not_reached(); 1633ee17db83SRichard Henderson } 1634ee17db83SRichard Henderson ts->val_type = val; 1635e8996ee0Sbellard } 1636f8b2f202SRichard Henderson 1637f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1638c896fe29Sbellard } 1639c896fe29Sbellard 1640f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1641f8b2f202SRichard Henderson TCGTemp *ts) 1642c896fe29Sbellard { 16431807f4c4SRichard Henderson int idx = temp_idx(ts); 1644ac56dd48Spbrook 1645ee17db83SRichard Henderson switch (ts->kind) { 1646ee17db83SRichard Henderson case TEMP_FIXED: 1647ee17db83SRichard Henderson case TEMP_GLOBAL: 1648ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1649ee17db83SRichard Henderson break; 1650ee17db83SRichard Henderson case TEMP_LOCAL: 1651641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1652ee17db83SRichard Henderson break; 1653c7482438SRichard Henderson case TEMP_EBB: 1654c7482438SRichard Henderson snprintf(buf, buf_size, "ebb%d", idx - s->nb_globals); 
1655c7482438SRichard Henderson break; 1656ee17db83SRichard Henderson case TEMP_NORMAL: 1657ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1658ee17db83SRichard Henderson break; 1659c0522136SRichard Henderson case TEMP_CONST: 1660c0522136SRichard Henderson switch (ts->type) { 1661c0522136SRichard Henderson case TCG_TYPE_I32: 1662c0522136SRichard Henderson snprintf(buf, buf_size, "$0x%x", (int32_t)ts->val); 1663c0522136SRichard Henderson break; 1664c0522136SRichard Henderson #if TCG_TARGET_REG_BITS > 32 1665c0522136SRichard Henderson case TCG_TYPE_I64: 1666c0522136SRichard Henderson snprintf(buf, buf_size, "$0x%" PRIx64, ts->val); 1667c0522136SRichard Henderson break; 1668c0522136SRichard Henderson #endif 1669c0522136SRichard Henderson case TCG_TYPE_V64: 1670c0522136SRichard Henderson case TCG_TYPE_V128: 1671c0522136SRichard Henderson case TCG_TYPE_V256: 1672c0522136SRichard Henderson snprintf(buf, buf_size, "v%d$0x%" PRIx64, 1673c0522136SRichard Henderson 64 << (ts->type - TCG_TYPE_V64), ts->val); 1674c0522136SRichard Henderson break; 1675c0522136SRichard Henderson default: 1676c0522136SRichard Henderson g_assert_not_reached(); 1677c0522136SRichard Henderson } 1678c0522136SRichard Henderson break; 1679c896fe29Sbellard } 1680c896fe29Sbellard return buf; 1681c896fe29Sbellard } 1682c896fe29Sbellard 168343439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf, 168443439139SRichard Henderson int buf_size, TCGArg arg) 1685f8b2f202SRichard Henderson { 168643439139SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg)); 1687f8b2f202SRichard Henderson } 1688f8b2f202SRichard Henderson 1689f48f3edeSblueswir1 static const char * const cond_name[] = 1690f48f3edeSblueswir1 { 16910aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 16920aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1693f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1694f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1695f48f3edeSblueswir1 
[TCG_COND_LT] = "lt", 1696f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1697f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1698f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1699f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1700f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1701f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1702f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1703f48f3edeSblueswir1 }; 1704f48f3edeSblueswir1 1705f713d6adSRichard Henderson static const char * const ldst_name[] = 1706f713d6adSRichard Henderson { 1707f713d6adSRichard Henderson [MO_UB] = "ub", 1708f713d6adSRichard Henderson [MO_SB] = "sb", 1709f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1710f713d6adSRichard Henderson [MO_LESW] = "lesw", 1711f713d6adSRichard Henderson [MO_LEUL] = "leul", 1712f713d6adSRichard Henderson [MO_LESL] = "lesl", 1713fc313c64SFrédéric Pétrot [MO_LEUQ] = "leq", 1714f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1715f713d6adSRichard Henderson [MO_BESW] = "besw", 1716f713d6adSRichard Henderson [MO_BEUL] = "beul", 1717f713d6adSRichard Henderson [MO_BESL] = "besl", 1718fc313c64SFrédéric Pétrot [MO_BEUQ] = "beq", 1719f713d6adSRichard Henderson }; 1720f713d6adSRichard Henderson 17211f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 172252bf9771Stony.nguyen@bt.com #ifdef TARGET_ALIGNED_ONLY 17231f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "un+", 17241f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 17251f00b27fSSergey Sorokin #else 17261f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 17271f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 17281f00b27fSSergey Sorokin #endif 17291f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 17301f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 17311f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 17321f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 17331f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 17341f00b27fSSergey Sorokin [MO_ALIGN_64 >> 
MO_ASHIFT] = "al64+", 17351f00b27fSSergey Sorokin }; 17361f00b27fSSergey Sorokin 1737587195bdSRichard Henderson static const char bswap_flag_name[][6] = { 1738587195bdSRichard Henderson [TCG_BSWAP_IZ] = "iz", 1739587195bdSRichard Henderson [TCG_BSWAP_OZ] = "oz", 1740587195bdSRichard Henderson [TCG_BSWAP_OS] = "os", 1741587195bdSRichard Henderson [TCG_BSWAP_IZ | TCG_BSWAP_OZ] = "iz,oz", 1742587195bdSRichard Henderson [TCG_BSWAP_IZ | TCG_BSWAP_OS] = "iz,os", 1743587195bdSRichard Henderson }; 1744587195bdSRichard Henderson 1745b016486eSRichard Henderson static inline bool tcg_regset_single(TCGRegSet d) 1746b016486eSRichard Henderson { 1747b016486eSRichard Henderson return (d & (d - 1)) == 0; 1748b016486eSRichard Henderson } 1749b016486eSRichard Henderson 1750b016486eSRichard Henderson static inline TCGReg tcg_regset_first(TCGRegSet d) 1751b016486eSRichard Henderson { 1752b016486eSRichard Henderson if (TCG_TARGET_NB_REGS <= 32) { 1753b016486eSRichard Henderson return ctz32(d); 1754b016486eSRichard Henderson } else { 1755b016486eSRichard Henderson return ctz64(d); 1756b016486eSRichard Henderson } 1757b016486eSRichard Henderson } 1758b016486eSRichard Henderson 1759b7a83ff8SRichard Henderson /* Return only the number of characters output -- no error return. */ 1760b7a83ff8SRichard Henderson #define ne_fprintf(...) \ 1761b7a83ff8SRichard Henderson ({ int ret_ = fprintf(__VA_ARGS__); ret_ >= 0 ? 
ret_ : 0; }) 1762b7a83ff8SRichard Henderson 1763b7a83ff8SRichard Henderson static void tcg_dump_ops(TCGContext *s, FILE *f, bool have_prefs) 1764c896fe29Sbellard { 1765c896fe29Sbellard char buf[128]; 1766c45cb8bbSRichard Henderson TCGOp *op; 1767c896fe29Sbellard 176815fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 1769c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1770c45cb8bbSRichard Henderson const TCGOpDef *def; 1771c45cb8bbSRichard Henderson TCGOpcode c; 1772bdfb460eSRichard Henderson int col = 0; 1773c45cb8bbSRichard Henderson 1774c45cb8bbSRichard Henderson c = op->opc; 1775c896fe29Sbellard def = &tcg_op_defs[c]; 1776c45cb8bbSRichard Henderson 1777765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 1778b016486eSRichard Henderson nb_oargs = 0; 1779b7a83ff8SRichard Henderson col += ne_fprintf(f, "\n ----"); 17809aef40edSRichard Henderson 17819aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 17829aef40edSRichard Henderson target_ulong a; 17837e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 1784efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 17857e4597d7Sbellard #else 1786efee3746SRichard Henderson a = op->args[i]; 17877e4597d7Sbellard #endif 1788b7a83ff8SRichard Henderson col += ne_fprintf(f, " " TARGET_FMT_lx, a); 1789eeacee4dSBlue Swirl } 17907e4597d7Sbellard } else if (c == INDEX_op_call) { 17913e92aa34SRichard Henderson const TCGHelperInfo *info = tcg_call_info(op); 1792fa52e660SRichard Henderson void *func = tcg_call_func(op); 17933e92aa34SRichard Henderson 1794c896fe29Sbellard /* variable number of arguments */ 1795cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 1796cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 1797c896fe29Sbellard nb_cargs = def->nb_cargs; 1798b03cce8eSbellard 1799b7a83ff8SRichard Henderson col += ne_fprintf(f, " %s ", def->name); 18003e92aa34SRichard Henderson 18013e92aa34SRichard Henderson /* 
18023e92aa34SRichard Henderson * Print the function name from TCGHelperInfo, if available. 18033e92aa34SRichard Henderson * Note that plugins have a template function for the info, 18043e92aa34SRichard Henderson * but the actual function pointer comes from the plugin. 18053e92aa34SRichard Henderson */ 18063e92aa34SRichard Henderson if (func == info->func) { 1807b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s", info->name); 18083e92aa34SRichard Henderson } else { 1809b7a83ff8SRichard Henderson col += ne_fprintf(f, "plugin(%p)", func); 18103e92aa34SRichard Henderson } 18113e92aa34SRichard Henderson 1812b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%x,$%d", info->flags, nb_oargs); 1813b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 1814b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", tcg_get_arg_str(s, buf, sizeof(buf), 1815efee3746SRichard Henderson op->args[i])); 1816b03cce8eSbellard } 1817cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1818efee3746SRichard Henderson TCGArg arg = op->args[nb_oargs + i]; 1819cf066674SRichard Henderson const char *t = "<dummy>"; 1820cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 182143439139SRichard Henderson t = tcg_get_arg_str(s, buf, sizeof(buf), arg); 1822b03cce8eSbellard } 1823b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", t); 1824e8996ee0Sbellard } 1825b03cce8eSbellard } else { 1826b7a83ff8SRichard Henderson col += ne_fprintf(f, " %s ", def->name); 1827c45cb8bbSRichard Henderson 1828c896fe29Sbellard nb_oargs = def->nb_oargs; 1829c896fe29Sbellard nb_iargs = def->nb_iargs; 1830c896fe29Sbellard nb_cargs = def->nb_cargs; 1831c896fe29Sbellard 1832d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 1833b7a83ff8SRichard Henderson col += ne_fprintf(f, "v%d,e%d,", 64 << TCGOP_VECL(op), 1834d2fd745fSRichard Henderson 8 << TCGOP_VECE(op)); 1835d2fd745fSRichard Henderson } 1836d2fd745fSRichard Henderson 1837c896fe29Sbellard k = 0; 1838c896fe29Sbellard for (i = 0; i < nb_oargs; 
i++) { 1839b7a83ff8SRichard Henderson const char *sep = k ? "," : ""; 1840b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s%s", sep, 1841b7a83ff8SRichard Henderson tcg_get_arg_str(s, buf, sizeof(buf), 1842efee3746SRichard Henderson op->args[k++])); 1843c896fe29Sbellard } 1844c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1845b7a83ff8SRichard Henderson const char *sep = k ? "," : ""; 1846b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s%s", sep, 1847b7a83ff8SRichard Henderson tcg_get_arg_str(s, buf, sizeof(buf), 1848efee3746SRichard Henderson op->args[k++])); 1849c896fe29Sbellard } 1850be210acbSRichard Henderson switch (c) { 1851be210acbSRichard Henderson case INDEX_op_brcond_i32: 1852ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1853ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1854be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1855be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1856ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1857be210acbSRichard Henderson case INDEX_op_setcond_i64: 1858ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1859212be173SRichard Henderson case INDEX_op_cmp_vec: 1860f75da298SRichard Henderson case INDEX_op_cmpsel_vec: 1861efee3746SRichard Henderson if (op->args[k] < ARRAY_SIZE(cond_name) 1862efee3746SRichard Henderson && cond_name[op->args[k]]) { 1863b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", cond_name[op->args[k++]]); 1864eeacee4dSBlue Swirl } else { 1865b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%" TCG_PRIlx, op->args[k++]); 1866eeacee4dSBlue Swirl } 1867f48f3edeSblueswir1 i = 1; 1868be210acbSRichard Henderson break; 1869f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1870f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 187107ce0b05SRichard Henderson case INDEX_op_qemu_st8_i32: 1872f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 1873f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 187459227d5dSRichard Henderson { 18759002ffcbSRichard Henderson 
MemOpIdx oi = op->args[k++]; 187614776ab5STony Nguyen MemOp op = get_memop(oi); 187759227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 187859227d5dSRichard Henderson 187959c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 1880b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%x,%u", op, ix); 188159c4b7e8SRichard Henderson } else { 18821f00b27fSSergey Sorokin const char *s_al, *s_op; 18831f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 188459c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 1885b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s%s,%u", s_al, s_op, ix); 1886f713d6adSRichard Henderson } 1887f713d6adSRichard Henderson i = 1; 188859227d5dSRichard Henderson } 1889f713d6adSRichard Henderson break; 1890587195bdSRichard Henderson case INDEX_op_bswap16_i32: 1891587195bdSRichard Henderson case INDEX_op_bswap16_i64: 1892587195bdSRichard Henderson case INDEX_op_bswap32_i32: 1893587195bdSRichard Henderson case INDEX_op_bswap32_i64: 1894587195bdSRichard Henderson case INDEX_op_bswap64_i64: 1895587195bdSRichard Henderson { 1896587195bdSRichard Henderson TCGArg flags = op->args[k]; 1897587195bdSRichard Henderson const char *name = NULL; 1898587195bdSRichard Henderson 1899587195bdSRichard Henderson if (flags < ARRAY_SIZE(bswap_flag_name)) { 1900587195bdSRichard Henderson name = bswap_flag_name[flags]; 1901587195bdSRichard Henderson } 1902587195bdSRichard Henderson if (name) { 1903b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", name); 1904587195bdSRichard Henderson } else { 1905b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%" TCG_PRIlx, flags); 1906587195bdSRichard Henderson } 1907587195bdSRichard Henderson i = k = 1; 1908587195bdSRichard Henderson } 1909587195bdSRichard Henderson break; 1910be210acbSRichard Henderson default: 1911f48f3edeSblueswir1 i = 0; 1912be210acbSRichard Henderson break; 1913be210acbSRichard Henderson } 191451e3972cSRichard Henderson switch (c) { 
191551e3972cSRichard Henderson case INDEX_op_set_label: 191651e3972cSRichard Henderson case INDEX_op_br: 191751e3972cSRichard Henderson case INDEX_op_brcond_i32: 191851e3972cSRichard Henderson case INDEX_op_brcond_i64: 191951e3972cSRichard Henderson case INDEX_op_brcond2_i32: 1920b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s$L%d", k ? "," : "", 1921efee3746SRichard Henderson arg_label(op->args[k])->id); 192251e3972cSRichard Henderson i++, k++; 192351e3972cSRichard Henderson break; 192451e3972cSRichard Henderson default: 192551e3972cSRichard Henderson break; 1926eeacee4dSBlue Swirl } 192751e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 1928b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s$0x%" TCG_PRIlx, k ? "," : "", 1929b7a83ff8SRichard Henderson op->args[k]); 1930bdfb460eSRichard Henderson } 1931bdfb460eSRichard Henderson } 1932bdfb460eSRichard Henderson 19331894f69aSRichard Henderson if (have_prefs || op->life) { 19341894f69aSRichard Henderson for (; col < 40; ++col) { 1935b7a83ff8SRichard Henderson putc(' ', f); 1936bdfb460eSRichard Henderson } 19371894f69aSRichard Henderson } 19381894f69aSRichard Henderson 19391894f69aSRichard Henderson if (op->life) { 19401894f69aSRichard Henderson unsigned life = op->life; 1941bdfb460eSRichard Henderson 1942bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 1943b7a83ff8SRichard Henderson ne_fprintf(f, " sync:"); 1944bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 1945bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 1946b7a83ff8SRichard Henderson ne_fprintf(f, " %d", i); 1947bdfb460eSRichard Henderson } 1948bdfb460eSRichard Henderson } 1949bdfb460eSRichard Henderson } 1950bdfb460eSRichard Henderson life /= DEAD_ARG; 1951bdfb460eSRichard Henderson if (life) { 1952b7a83ff8SRichard Henderson ne_fprintf(f, " dead:"); 1953bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 1954bdfb460eSRichard Henderson if (life & 1) { 1955b7a83ff8SRichard Henderson ne_fprintf(f, " %d", i); 
1956bdfb460eSRichard Henderson } 1957bdfb460eSRichard Henderson } 1958c896fe29Sbellard } 1959b03cce8eSbellard } 19601894f69aSRichard Henderson 19611894f69aSRichard Henderson if (have_prefs) { 19621894f69aSRichard Henderson for (i = 0; i < nb_oargs; ++i) { 19631894f69aSRichard Henderson TCGRegSet set = op->output_pref[i]; 19641894f69aSRichard Henderson 19651894f69aSRichard Henderson if (i == 0) { 1966b7a83ff8SRichard Henderson ne_fprintf(f, " pref="); 19671894f69aSRichard Henderson } else { 1968b7a83ff8SRichard Henderson ne_fprintf(f, ","); 19691894f69aSRichard Henderson } 19701894f69aSRichard Henderson if (set == 0) { 1971b7a83ff8SRichard Henderson ne_fprintf(f, "none"); 19721894f69aSRichard Henderson } else if (set == MAKE_64BIT_MASK(0, TCG_TARGET_NB_REGS)) { 1973b7a83ff8SRichard Henderson ne_fprintf(f, "all"); 19741894f69aSRichard Henderson #ifdef CONFIG_DEBUG_TCG 19751894f69aSRichard Henderson } else if (tcg_regset_single(set)) { 19761894f69aSRichard Henderson TCGReg reg = tcg_regset_first(set); 1977b7a83ff8SRichard Henderson ne_fprintf(f, "%s", tcg_target_reg_names[reg]); 19781894f69aSRichard Henderson #endif 19791894f69aSRichard Henderson } else if (TCG_TARGET_NB_REGS <= 32) { 1980b7a83ff8SRichard Henderson ne_fprintf(f, "0x%x", (uint32_t)set); 19811894f69aSRichard Henderson } else { 1982b7a83ff8SRichard Henderson ne_fprintf(f, "0x%" PRIx64, (uint64_t)set); 19831894f69aSRichard Henderson } 19841894f69aSRichard Henderson } 19851894f69aSRichard Henderson } 19861894f69aSRichard Henderson 1987b7a83ff8SRichard Henderson putc('\n', f); 1988c896fe29Sbellard } 1989c896fe29Sbellard } 1990c896fe29Sbellard 1991c896fe29Sbellard /* we give more priority to constraints with less registers */ 1992c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 1993c896fe29Sbellard { 199474a11790SRichard Henderson const TCGArgConstraint *arg_ct = &def->args_ct[k]; 199529f5e925SRichard Henderson int n = ctpop64(arg_ct->regs); 1996c896fe29Sbellard 
199729f5e925SRichard Henderson /* 199829f5e925SRichard Henderson * Sort constraints of a single register first, which includes output 199929f5e925SRichard Henderson * aliases (which must exactly match the input already allocated). 200029f5e925SRichard Henderson */ 200129f5e925SRichard Henderson if (n == 1 || arg_ct->oalias) { 200229f5e925SRichard Henderson return INT_MAX; 2003c896fe29Sbellard } 200429f5e925SRichard Henderson 200529f5e925SRichard Henderson /* 200629f5e925SRichard Henderson * Sort register pairs next, first then second immediately after. 200729f5e925SRichard Henderson * Arbitrarily sort multiple pairs by the index of the first reg; 200829f5e925SRichard Henderson * there shouldn't be many pairs. 200929f5e925SRichard Henderson */ 201029f5e925SRichard Henderson switch (arg_ct->pair) { 201129f5e925SRichard Henderson case 1: 201229f5e925SRichard Henderson case 3: 201329f5e925SRichard Henderson return (k + 1) * 2; 201429f5e925SRichard Henderson case 2: 201529f5e925SRichard Henderson return (arg_ct->pair_index + 1) * 2 - 1; 201629f5e925SRichard Henderson } 201729f5e925SRichard Henderson 201829f5e925SRichard Henderson /* Finally, sort by decreasing register count. 
*/ 201929f5e925SRichard Henderson assert(n > 1); 202029f5e925SRichard Henderson return -n; 2021c896fe29Sbellard } 2022c896fe29Sbellard 2023c896fe29Sbellard /* sort from highest priority to lowest */ 2024c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 2025c896fe29Sbellard { 202666792f90SRichard Henderson int i, j; 202766792f90SRichard Henderson TCGArgConstraint *a = def->args_ct; 2028c896fe29Sbellard 202966792f90SRichard Henderson for (i = 0; i < n; i++) { 203066792f90SRichard Henderson a[start + i].sort_index = start + i; 203166792f90SRichard Henderson } 203266792f90SRichard Henderson if (n <= 1) { 2033c896fe29Sbellard return; 203466792f90SRichard Henderson } 2035c896fe29Sbellard for (i = 0; i < n - 1; i++) { 2036c896fe29Sbellard for (j = i + 1; j < n; j++) { 203766792f90SRichard Henderson int p1 = get_constraint_priority(def, a[start + i].sort_index); 203866792f90SRichard Henderson int p2 = get_constraint_priority(def, a[start + j].sort_index); 2039c896fe29Sbellard if (p1 < p2) { 204066792f90SRichard Henderson int tmp = a[start + i].sort_index; 204166792f90SRichard Henderson a[start + i].sort_index = a[start + j].sort_index; 204266792f90SRichard Henderson a[start + j].sort_index = tmp; 2043c896fe29Sbellard } 2044c896fe29Sbellard } 2045c896fe29Sbellard } 2046c896fe29Sbellard } 2047c896fe29Sbellard 2048f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 2049c896fe29Sbellard { 2050a9751609SRichard Henderson TCGOpcode op; 2051c896fe29Sbellard 2052f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 2053f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 2054f69d277eSRichard Henderson const TCGTargetOpDef *tdefs; 205529f5e925SRichard Henderson bool saw_alias_pair = false; 205629f5e925SRichard Henderson int i, o, i2, o2, nb_args; 2057f69d277eSRichard Henderson 2058f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 2059f69d277eSRichard Henderson continue; 2060f69d277eSRichard Henderson } 
2061f69d277eSRichard Henderson 2062c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 2063f69d277eSRichard Henderson if (nb_args == 0) { 2064f69d277eSRichard Henderson continue; 2065f69d277eSRichard Henderson } 2066f69d277eSRichard Henderson 20674c22e840SRichard Henderson /* 20684c22e840SRichard Henderson * Macro magic should make it impossible, but double-check that 20694c22e840SRichard Henderson * the array index is in range. Since the signness of an enum 20704c22e840SRichard Henderson * is implementation defined, force the result to unsigned. 20714c22e840SRichard Henderson */ 20724c22e840SRichard Henderson unsigned con_set = tcg_target_op_def(op); 20734c22e840SRichard Henderson tcg_debug_assert(con_set < ARRAY_SIZE(constraint_sets)); 20744c22e840SRichard Henderson tdefs = &constraint_sets[con_set]; 2075f69d277eSRichard Henderson 2076c896fe29Sbellard for (i = 0; i < nb_args; i++) { 2077f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 20788940ea0dSPhilippe Mathieu-Daudé bool input_p = i >= def->nb_oargs; 20798940ea0dSPhilippe Mathieu-Daudé 2080f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 2081eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 2082f69d277eSRichard Henderson 208317280ff4SRichard Henderson switch (*ct_str) { 208417280ff4SRichard Henderson case '0' ... '9': 20858940ea0dSPhilippe Mathieu-Daudé o = *ct_str - '0'; 20868940ea0dSPhilippe Mathieu-Daudé tcg_debug_assert(input_p); 20878940ea0dSPhilippe Mathieu-Daudé tcg_debug_assert(o < def->nb_oargs); 20888940ea0dSPhilippe Mathieu-Daudé tcg_debug_assert(def->args_ct[o].regs != 0); 20898940ea0dSPhilippe Mathieu-Daudé tcg_debug_assert(!def->args_ct[o].oalias); 20908940ea0dSPhilippe Mathieu-Daudé def->args_ct[i] = def->args_ct[o]; 2091bc2b17e6SRichard Henderson /* The output sets oalias. 
*/ 20928940ea0dSPhilippe Mathieu-Daudé def->args_ct[o].oalias = 1; 20938940ea0dSPhilippe Mathieu-Daudé def->args_ct[o].alias_index = i; 2094bc2b17e6SRichard Henderson /* The input sets ialias. */ 20958940ea0dSPhilippe Mathieu-Daudé def->args_ct[i].ialias = 1; 20968940ea0dSPhilippe Mathieu-Daudé def->args_ct[i].alias_index = o; 209729f5e925SRichard Henderson if (def->args_ct[i].pair) { 209829f5e925SRichard Henderson saw_alias_pair = true; 209929f5e925SRichard Henderson } 21008940ea0dSPhilippe Mathieu-Daudé tcg_debug_assert(ct_str[1] == '\0'); 21018940ea0dSPhilippe Mathieu-Daudé continue; 21028940ea0dSPhilippe Mathieu-Daudé 210382790a87SRichard Henderson case '&': 21048940ea0dSPhilippe Mathieu-Daudé tcg_debug_assert(!input_p); 2105bc2b17e6SRichard Henderson def->args_ct[i].newreg = true; 210682790a87SRichard Henderson ct_str++; 210782790a87SRichard Henderson break; 210829f5e925SRichard Henderson 210929f5e925SRichard Henderson case 'p': /* plus */ 211029f5e925SRichard Henderson /* Allocate to the register after the previous. */ 211129f5e925SRichard Henderson tcg_debug_assert(i > (input_p ? def->nb_oargs : 0)); 211229f5e925SRichard Henderson o = i - 1; 211329f5e925SRichard Henderson tcg_debug_assert(!def->args_ct[o].pair); 211429f5e925SRichard Henderson tcg_debug_assert(!def->args_ct[o].ct); 211529f5e925SRichard Henderson def->args_ct[i] = (TCGArgConstraint){ 211629f5e925SRichard Henderson .pair = 2, 211729f5e925SRichard Henderson .pair_index = o, 211829f5e925SRichard Henderson .regs = def->args_ct[o].regs << 1, 211929f5e925SRichard Henderson }; 212029f5e925SRichard Henderson def->args_ct[o].pair = 1; 212129f5e925SRichard Henderson def->args_ct[o].pair_index = i; 212229f5e925SRichard Henderson tcg_debug_assert(ct_str[1] == '\0'); 212329f5e925SRichard Henderson continue; 212429f5e925SRichard Henderson 212529f5e925SRichard Henderson case 'm': /* minus */ 212629f5e925SRichard Henderson /* Allocate to the register before the previous. 
*/ 212729f5e925SRichard Henderson tcg_debug_assert(i > (input_p ? def->nb_oargs : 0)); 212829f5e925SRichard Henderson o = i - 1; 212929f5e925SRichard Henderson tcg_debug_assert(!def->args_ct[o].pair); 213029f5e925SRichard Henderson tcg_debug_assert(!def->args_ct[o].ct); 213129f5e925SRichard Henderson def->args_ct[i] = (TCGArgConstraint){ 213229f5e925SRichard Henderson .pair = 1, 213329f5e925SRichard Henderson .pair_index = o, 213429f5e925SRichard Henderson .regs = def->args_ct[o].regs >> 1, 213529f5e925SRichard Henderson }; 213629f5e925SRichard Henderson def->args_ct[o].pair = 2; 213729f5e925SRichard Henderson def->args_ct[o].pair_index = i; 213829f5e925SRichard Henderson tcg_debug_assert(ct_str[1] == '\0'); 213929f5e925SRichard Henderson continue; 21408940ea0dSPhilippe Mathieu-Daudé } 21418940ea0dSPhilippe Mathieu-Daudé 21428940ea0dSPhilippe Mathieu-Daudé do { 21438940ea0dSPhilippe Mathieu-Daudé switch (*ct_str) { 2144c896fe29Sbellard case 'i': 2145c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 2146c896fe29Sbellard break; 2147358b4923SRichard Henderson 2148358b4923SRichard Henderson /* Include all of the target-specific constraints. */ 2149358b4923SRichard Henderson 2150358b4923SRichard Henderson #undef CONST 2151358b4923SRichard Henderson #define CONST(CASE, MASK) \ 21528940ea0dSPhilippe Mathieu-Daudé case CASE: def->args_ct[i].ct |= MASK; break; 2153358b4923SRichard Henderson #define REGS(CASE, MASK) \ 21548940ea0dSPhilippe Mathieu-Daudé case CASE: def->args_ct[i].regs |= MASK; break; 2155358b4923SRichard Henderson 2156358b4923SRichard Henderson #include "tcg-target-con-str.h" 2157358b4923SRichard Henderson 2158358b4923SRichard Henderson #undef REGS 2159358b4923SRichard Henderson #undef CONST 2160c896fe29Sbellard default: 21618940ea0dSPhilippe Mathieu-Daudé case '0' ... 
'9': 21628940ea0dSPhilippe Mathieu-Daudé case '&': 216329f5e925SRichard Henderson case 'p': 216429f5e925SRichard Henderson case 'm': 2165358b4923SRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 2166358b4923SRichard Henderson g_assert_not_reached(); 2167358b4923SRichard Henderson } 21688940ea0dSPhilippe Mathieu-Daudé } while (*++ct_str != '\0'); 2169c896fe29Sbellard } 2170c896fe29Sbellard 2171c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? */ 2172eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 2173c68aaa18SStefan Weil 217429f5e925SRichard Henderson /* 217529f5e925SRichard Henderson * Fix up output pairs that are aliased with inputs. 217629f5e925SRichard Henderson * When we created the alias, we copied pair from the output. 217729f5e925SRichard Henderson * There are three cases: 217829f5e925SRichard Henderson * (1a) Pairs of inputs alias pairs of outputs. 217929f5e925SRichard Henderson * (1b) One input aliases the first of a pair of outputs. 218029f5e925SRichard Henderson * (2) One input aliases the second of a pair of outputs. 218129f5e925SRichard Henderson * 218229f5e925SRichard Henderson * Case 1a is handled by making sure that the pair_index'es are 218329f5e925SRichard Henderson * properly updated so that they appear the same as a pair of inputs. 218429f5e925SRichard Henderson * 218529f5e925SRichard Henderson * Case 1b is handled by setting the pair_index of the input to 218629f5e925SRichard Henderson * itself, simply so it doesn't point to an unrelated argument. 218729f5e925SRichard Henderson * Since we don't encounter the "second" during the input allocation 218829f5e925SRichard Henderson * phase, nothing happens with the second half of the input pair. 218929f5e925SRichard Henderson * 219029f5e925SRichard Henderson * Case 2 is handled by setting the second input to pair=3, the 219129f5e925SRichard Henderson * first output to pair=3, and the pair_index'es to match. 
219229f5e925SRichard Henderson */ 219329f5e925SRichard Henderson if (saw_alias_pair) { 219429f5e925SRichard Henderson for (i = def->nb_oargs; i < nb_args; i++) { 219529f5e925SRichard Henderson /* 219629f5e925SRichard Henderson * Since [0-9pm] must be alone in the constraint string, 219729f5e925SRichard Henderson * the only way they can both be set is if the pair comes 219829f5e925SRichard Henderson * from the output alias. 219929f5e925SRichard Henderson */ 220029f5e925SRichard Henderson if (!def->args_ct[i].ialias) { 220129f5e925SRichard Henderson continue; 220229f5e925SRichard Henderson } 220329f5e925SRichard Henderson switch (def->args_ct[i].pair) { 220429f5e925SRichard Henderson case 0: 220529f5e925SRichard Henderson break; 220629f5e925SRichard Henderson case 1: 220729f5e925SRichard Henderson o = def->args_ct[i].alias_index; 220829f5e925SRichard Henderson o2 = def->args_ct[o].pair_index; 220929f5e925SRichard Henderson tcg_debug_assert(def->args_ct[o].pair == 1); 221029f5e925SRichard Henderson tcg_debug_assert(def->args_ct[o2].pair == 2); 221129f5e925SRichard Henderson if (def->args_ct[o2].oalias) { 221229f5e925SRichard Henderson /* Case 1a */ 221329f5e925SRichard Henderson i2 = def->args_ct[o2].alias_index; 221429f5e925SRichard Henderson tcg_debug_assert(def->args_ct[i2].pair == 2); 221529f5e925SRichard Henderson def->args_ct[i2].pair_index = i; 221629f5e925SRichard Henderson def->args_ct[i].pair_index = i2; 221729f5e925SRichard Henderson } else { 221829f5e925SRichard Henderson /* Case 1b */ 221929f5e925SRichard Henderson def->args_ct[i].pair_index = i; 222029f5e925SRichard Henderson } 222129f5e925SRichard Henderson break; 222229f5e925SRichard Henderson case 2: 222329f5e925SRichard Henderson o = def->args_ct[i].alias_index; 222429f5e925SRichard Henderson o2 = def->args_ct[o].pair_index; 222529f5e925SRichard Henderson tcg_debug_assert(def->args_ct[o].pair == 2); 222629f5e925SRichard Henderson tcg_debug_assert(def->args_ct[o2].pair == 1); 222729f5e925SRichard 
Henderson if (def->args_ct[o2].oalias) { 222829f5e925SRichard Henderson /* Case 1a */ 222929f5e925SRichard Henderson i2 = def->args_ct[o2].alias_index; 223029f5e925SRichard Henderson tcg_debug_assert(def->args_ct[i2].pair == 1); 223129f5e925SRichard Henderson def->args_ct[i2].pair_index = i; 223229f5e925SRichard Henderson def->args_ct[i].pair_index = i2; 223329f5e925SRichard Henderson } else { 223429f5e925SRichard Henderson /* Case 2 */ 223529f5e925SRichard Henderson def->args_ct[i].pair = 3; 223629f5e925SRichard Henderson def->args_ct[o2].pair = 3; 223729f5e925SRichard Henderson def->args_ct[i].pair_index = o2; 223829f5e925SRichard Henderson def->args_ct[o2].pair_index = i; 223929f5e925SRichard Henderson } 224029f5e925SRichard Henderson break; 224129f5e925SRichard Henderson default: 224229f5e925SRichard Henderson g_assert_not_reached(); 224329f5e925SRichard Henderson } 224429f5e925SRichard Henderson } 224529f5e925SRichard Henderson } 224629f5e925SRichard Henderson 2247c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 2248c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 2249c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 2250c896fe29Sbellard } 2251c896fe29Sbellard } 2252c896fe29Sbellard 22530c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 22540c627cdcSRichard Henderson { 2255d88a117eSRichard Henderson TCGLabel *label; 2256d88a117eSRichard Henderson 2257d88a117eSRichard Henderson switch (op->opc) { 2258d88a117eSRichard Henderson case INDEX_op_br: 2259d88a117eSRichard Henderson label = arg_label(op->args[0]); 2260d88a117eSRichard Henderson label->refs--; 2261d88a117eSRichard Henderson break; 2262d88a117eSRichard Henderson case INDEX_op_brcond_i32: 2263d88a117eSRichard Henderson case INDEX_op_brcond_i64: 2264d88a117eSRichard Henderson label = arg_label(op->args[3]); 2265d88a117eSRichard Henderson label->refs--; 2266d88a117eSRichard Henderson break; 2267d88a117eSRichard Henderson case 
INDEX_op_brcond2_i32: 2268d88a117eSRichard Henderson label = arg_label(op->args[5]); 2269d88a117eSRichard Henderson label->refs--; 2270d88a117eSRichard Henderson break; 2271d88a117eSRichard Henderson default: 2272d88a117eSRichard Henderson break; 2273d88a117eSRichard Henderson } 2274d88a117eSRichard Henderson 227515fa08f8SRichard Henderson QTAILQ_REMOVE(&s->ops, op, link); 227615fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&s->free_ops, op, link); 2277abebf925SRichard Henderson s->nb_ops--; 22780c627cdcSRichard Henderson 22790c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 2280d73415a3SStefan Hajnoczi qatomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1); 22810c627cdcSRichard Henderson #endif 22820c627cdcSRichard Henderson } 22830c627cdcSRichard Henderson 2284a80cdd31SRichard Henderson void tcg_remove_ops_after(TCGOp *op) 2285a80cdd31SRichard Henderson { 2286a80cdd31SRichard Henderson TCGContext *s = tcg_ctx; 2287a80cdd31SRichard Henderson 2288a80cdd31SRichard Henderson while (true) { 2289a80cdd31SRichard Henderson TCGOp *last = tcg_last_op(); 2290a80cdd31SRichard Henderson if (last == op) { 2291a80cdd31SRichard Henderson return; 2292a80cdd31SRichard Henderson } 2293a80cdd31SRichard Henderson tcg_op_remove(s, last); 2294a80cdd31SRichard Henderson } 2295a80cdd31SRichard Henderson } 2296a80cdd31SRichard Henderson 229715fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc) 229815fa08f8SRichard Henderson { 229915fa08f8SRichard Henderson TCGContext *s = tcg_ctx; 230015fa08f8SRichard Henderson TCGOp *op; 230115fa08f8SRichard Henderson 230215fa08f8SRichard Henderson if (likely(QTAILQ_EMPTY(&s->free_ops))) { 230315fa08f8SRichard Henderson op = tcg_malloc(sizeof(TCGOp)); 230415fa08f8SRichard Henderson } else { 230515fa08f8SRichard Henderson op = QTAILQ_FIRST(&s->free_ops); 230615fa08f8SRichard Henderson QTAILQ_REMOVE(&s->free_ops, op, link); 230715fa08f8SRichard Henderson } 230815fa08f8SRichard Henderson memset(op, 0, offsetof(TCGOp, link)); 
230915fa08f8SRichard Henderson op->opc = opc; 2310abebf925SRichard Henderson s->nb_ops++; 231115fa08f8SRichard Henderson 231215fa08f8SRichard Henderson return op; 231315fa08f8SRichard Henderson } 231415fa08f8SRichard Henderson 231515fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc) 231615fa08f8SRichard Henderson { 231715fa08f8SRichard Henderson TCGOp *op = tcg_op_alloc(opc); 231815fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link); 231915fa08f8SRichard Henderson return op; 232015fa08f8SRichard Henderson } 232115fa08f8SRichard Henderson 2322ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 23235a18407fSRichard Henderson { 232415fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 232515fa08f8SRichard Henderson QTAILQ_INSERT_BEFORE(old_op, new_op, link); 23265a18407fSRichard Henderson return new_op; 23275a18407fSRichard Henderson } 23285a18407fSRichard Henderson 2329ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 23305a18407fSRichard Henderson { 233115fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 233215fa08f8SRichard Henderson QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link); 23335a18407fSRichard Henderson return new_op; 23345a18407fSRichard Henderson } 23355a18407fSRichard Henderson 2336b4fc67c7SRichard Henderson /* Reachable analysis : remove unreachable code. 
*/ 2337b4fc67c7SRichard Henderson static void reachable_code_pass(TCGContext *s) 2338b4fc67c7SRichard Henderson { 2339b4fc67c7SRichard Henderson TCGOp *op, *op_next; 2340b4fc67c7SRichard Henderson bool dead = false; 2341b4fc67c7SRichard Henderson 2342b4fc67c7SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 2343b4fc67c7SRichard Henderson bool remove = dead; 2344b4fc67c7SRichard Henderson TCGLabel *label; 2345b4fc67c7SRichard Henderson 2346b4fc67c7SRichard Henderson switch (op->opc) { 2347b4fc67c7SRichard Henderson case INDEX_op_set_label: 2348b4fc67c7SRichard Henderson label = arg_label(op->args[0]); 2349b4fc67c7SRichard Henderson if (label->refs == 0) { 2350b4fc67c7SRichard Henderson /* 2351b4fc67c7SRichard Henderson * While there is an occasional backward branch, virtually 2352b4fc67c7SRichard Henderson * all branches generated by the translators are forward. 2353b4fc67c7SRichard Henderson * Which means that generally we will have already removed 2354b4fc67c7SRichard Henderson * all references to the label that will be, and there is 2355b4fc67c7SRichard Henderson * little to be gained by iterating. 2356b4fc67c7SRichard Henderson */ 2357b4fc67c7SRichard Henderson remove = true; 2358b4fc67c7SRichard Henderson } else { 2359b4fc67c7SRichard Henderson /* Once we see a label, insns become live again. */ 2360b4fc67c7SRichard Henderson dead = false; 2361b4fc67c7SRichard Henderson remove = false; 2362b4fc67c7SRichard Henderson 2363b4fc67c7SRichard Henderson /* 2364b4fc67c7SRichard Henderson * Optimization can fold conditional branches to unconditional. 2365b4fc67c7SRichard Henderson * If we find a label with one reference which is preceded by 2366b4fc67c7SRichard Henderson * an unconditional branch to it, remove both. This needed to 2367b4fc67c7SRichard Henderson * wait until the dead code in between them was removed. 
2368b4fc67c7SRichard Henderson */ 2369b4fc67c7SRichard Henderson if (label->refs == 1) { 2370eae3eb3eSPaolo Bonzini TCGOp *op_prev = QTAILQ_PREV(op, link); 2371b4fc67c7SRichard Henderson if (op_prev->opc == INDEX_op_br && 2372b4fc67c7SRichard Henderson label == arg_label(op_prev->args[0])) { 2373b4fc67c7SRichard Henderson tcg_op_remove(s, op_prev); 2374b4fc67c7SRichard Henderson remove = true; 2375b4fc67c7SRichard Henderson } 2376b4fc67c7SRichard Henderson } 2377b4fc67c7SRichard Henderson } 2378b4fc67c7SRichard Henderson break; 2379b4fc67c7SRichard Henderson 2380b4fc67c7SRichard Henderson case INDEX_op_br: 2381b4fc67c7SRichard Henderson case INDEX_op_exit_tb: 2382b4fc67c7SRichard Henderson case INDEX_op_goto_ptr: 2383b4fc67c7SRichard Henderson /* Unconditional branches; everything following is dead. */ 2384b4fc67c7SRichard Henderson dead = true; 2385b4fc67c7SRichard Henderson break; 2386b4fc67c7SRichard Henderson 2387b4fc67c7SRichard Henderson case INDEX_op_call: 2388b4fc67c7SRichard Henderson /* Notice noreturn helper calls, raising exceptions. */ 238990163900SRichard Henderson if (tcg_call_flags(op) & TCG_CALL_NO_RETURN) { 2390b4fc67c7SRichard Henderson dead = true; 2391b4fc67c7SRichard Henderson } 2392b4fc67c7SRichard Henderson break; 2393b4fc67c7SRichard Henderson 2394b4fc67c7SRichard Henderson case INDEX_op_insn_start: 2395b4fc67c7SRichard Henderson /* Never remove -- we need to keep these for unwind. 
*/ 2396b4fc67c7SRichard Henderson remove = false; 2397b4fc67c7SRichard Henderson break; 2398b4fc67c7SRichard Henderson 2399b4fc67c7SRichard Henderson default: 2400b4fc67c7SRichard Henderson break; 2401b4fc67c7SRichard Henderson } 2402b4fc67c7SRichard Henderson 2403b4fc67c7SRichard Henderson if (remove) { 2404b4fc67c7SRichard Henderson tcg_op_remove(s, op); 2405b4fc67c7SRichard Henderson } 2406b4fc67c7SRichard Henderson } 2407b4fc67c7SRichard Henderson } 2408b4fc67c7SRichard Henderson 2409c70fbf0aSRichard Henderson #define TS_DEAD 1 2410c70fbf0aSRichard Henderson #define TS_MEM 2 2411c70fbf0aSRichard Henderson 24125a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 24135a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 24145a18407fSRichard Henderson 241525f49c5fSRichard Henderson /* For liveness_pass_1, the register preferences for a given temp. */ 241625f49c5fSRichard Henderson static inline TCGRegSet *la_temp_pref(TCGTemp *ts) 241725f49c5fSRichard Henderson { 241825f49c5fSRichard Henderson return ts->state_ptr; 241925f49c5fSRichard Henderson } 242025f49c5fSRichard Henderson 242125f49c5fSRichard Henderson /* For liveness_pass_1, reset the preferences for a given temp to the 242225f49c5fSRichard Henderson * maximal regset for its type. 242325f49c5fSRichard Henderson */ 242425f49c5fSRichard Henderson static inline void la_reset_pref(TCGTemp *ts) 242525f49c5fSRichard Henderson { 242625f49c5fSRichard Henderson *la_temp_pref(ts) 242725f49c5fSRichard Henderson = (ts->state == TS_DEAD ? 0 : tcg_target_available_regs[ts->type]); 242825f49c5fSRichard Henderson } 242925f49c5fSRichard Henderson 24309c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 24319c43b68dSAurelien Jarno should be in memory. 
*/ 24322616c808SRichard Henderson static void la_func_end(TCGContext *s, int ng, int nt) 2433c896fe29Sbellard { 2434b83eabeaSRichard Henderson int i; 2435b83eabeaSRichard Henderson 2436b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2437b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 243825f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 2439b83eabeaSRichard Henderson } 2440b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2441b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD; 244225f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 2443b83eabeaSRichard Henderson } 2444c896fe29Sbellard } 2445c896fe29Sbellard 24469c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 24479c43b68dSAurelien Jarno and local temps should be in memory. */ 24482616c808SRichard Henderson static void la_bb_end(TCGContext *s, int ng, int nt) 2449641d5fbeSbellard { 2450b83eabeaSRichard Henderson int i; 2451641d5fbeSbellard 2452ee17db83SRichard Henderson for (i = 0; i < nt; ++i) { 2453ee17db83SRichard Henderson TCGTemp *ts = &s->temps[i]; 2454ee17db83SRichard Henderson int state; 2455ee17db83SRichard Henderson 2456ee17db83SRichard Henderson switch (ts->kind) { 2457ee17db83SRichard Henderson case TEMP_FIXED: 2458ee17db83SRichard Henderson case TEMP_GLOBAL: 2459ee17db83SRichard Henderson case TEMP_LOCAL: 2460ee17db83SRichard Henderson state = TS_DEAD | TS_MEM; 2461ee17db83SRichard Henderson break; 2462ee17db83SRichard Henderson case TEMP_NORMAL: 2463c7482438SRichard Henderson case TEMP_EBB: 2464c0522136SRichard Henderson case TEMP_CONST: 2465ee17db83SRichard Henderson state = TS_DEAD; 2466ee17db83SRichard Henderson break; 2467ee17db83SRichard Henderson default: 2468ee17db83SRichard Henderson g_assert_not_reached(); 2469c70fbf0aSRichard Henderson } 2470ee17db83SRichard Henderson ts->state = state; 2471ee17db83SRichard Henderson la_reset_pref(ts); 2472641d5fbeSbellard } 2473641d5fbeSbellard } 2474641d5fbeSbellard 
2475f65a061cSRichard Henderson /* liveness analysis: sync globals back to memory. */ 2476f65a061cSRichard Henderson static void la_global_sync(TCGContext *s, int ng) 2477f65a061cSRichard Henderson { 2478f65a061cSRichard Henderson int i; 2479f65a061cSRichard Henderson 2480f65a061cSRichard Henderson for (i = 0; i < ng; ++i) { 248125f49c5fSRichard Henderson int state = s->temps[i].state; 248225f49c5fSRichard Henderson s->temps[i].state = state | TS_MEM; 248325f49c5fSRichard Henderson if (state == TS_DEAD) { 248425f49c5fSRichard Henderson /* If the global was previously dead, reset prefs. */ 248525f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 248625f49c5fSRichard Henderson } 2487f65a061cSRichard Henderson } 2488f65a061cSRichard Henderson } 2489f65a061cSRichard Henderson 2490b4cb76e6SRichard Henderson /* 2491c7482438SRichard Henderson * liveness analysis: conditional branch: all temps are dead unless 2492c7482438SRichard Henderson * explicitly live-across-conditional-branch, globals and local temps 2493c7482438SRichard Henderson * should be synced. 
2494b4cb76e6SRichard Henderson */ 2495b4cb76e6SRichard Henderson static void la_bb_sync(TCGContext *s, int ng, int nt) 2496b4cb76e6SRichard Henderson { 2497b4cb76e6SRichard Henderson la_global_sync(s, ng); 2498b4cb76e6SRichard Henderson 2499b4cb76e6SRichard Henderson for (int i = ng; i < nt; ++i) { 2500c0522136SRichard Henderson TCGTemp *ts = &s->temps[i]; 2501c0522136SRichard Henderson int state; 2502c0522136SRichard Henderson 2503c0522136SRichard Henderson switch (ts->kind) { 2504c0522136SRichard Henderson case TEMP_LOCAL: 2505c0522136SRichard Henderson state = ts->state; 2506c0522136SRichard Henderson ts->state = state | TS_MEM; 2507b4cb76e6SRichard Henderson if (state != TS_DEAD) { 2508b4cb76e6SRichard Henderson continue; 2509b4cb76e6SRichard Henderson } 2510c0522136SRichard Henderson break; 2511c0522136SRichard Henderson case TEMP_NORMAL: 2512b4cb76e6SRichard Henderson s->temps[i].state = TS_DEAD; 2513c0522136SRichard Henderson break; 2514c7482438SRichard Henderson case TEMP_EBB: 2515c0522136SRichard Henderson case TEMP_CONST: 2516c0522136SRichard Henderson continue; 2517c0522136SRichard Henderson default: 2518c0522136SRichard Henderson g_assert_not_reached(); 2519b4cb76e6SRichard Henderson } 2520b4cb76e6SRichard Henderson la_reset_pref(&s->temps[i]); 2521b4cb76e6SRichard Henderson } 2522b4cb76e6SRichard Henderson } 2523b4cb76e6SRichard Henderson 2524f65a061cSRichard Henderson /* liveness analysis: sync globals back to memory and kill. 
*/ 2525f65a061cSRichard Henderson static void la_global_kill(TCGContext *s, int ng) 2526f65a061cSRichard Henderson { 2527f65a061cSRichard Henderson int i; 2528f65a061cSRichard Henderson 2529f65a061cSRichard Henderson for (i = 0; i < ng; i++) { 2530f65a061cSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 253125f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 253225f49c5fSRichard Henderson } 253325f49c5fSRichard Henderson } 253425f49c5fSRichard Henderson 253525f49c5fSRichard Henderson /* liveness analysis: note live globals crossing calls. */ 253625f49c5fSRichard Henderson static void la_cross_call(TCGContext *s, int nt) 253725f49c5fSRichard Henderson { 253825f49c5fSRichard Henderson TCGRegSet mask = ~tcg_target_call_clobber_regs; 253925f49c5fSRichard Henderson int i; 254025f49c5fSRichard Henderson 254125f49c5fSRichard Henderson for (i = 0; i < nt; i++) { 254225f49c5fSRichard Henderson TCGTemp *ts = &s->temps[i]; 254325f49c5fSRichard Henderson if (!(ts->state & TS_DEAD)) { 254425f49c5fSRichard Henderson TCGRegSet *pset = la_temp_pref(ts); 254525f49c5fSRichard Henderson TCGRegSet set = *pset; 254625f49c5fSRichard Henderson 254725f49c5fSRichard Henderson set &= mask; 254825f49c5fSRichard Henderson /* If the combination is not possible, restart. */ 254925f49c5fSRichard Henderson if (set == 0) { 255025f49c5fSRichard Henderson set = tcg_target_available_regs[ts->type] & mask; 255125f49c5fSRichard Henderson } 255225f49c5fSRichard Henderson *pset = set; 255325f49c5fSRichard Henderson } 2554f65a061cSRichard Henderson } 2555f65a061cSRichard Henderson } 2556f65a061cSRichard Henderson 2557a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 2558c896fe29Sbellard given input arguments is dead. Instructions updating dead 2559c896fe29Sbellard temporaries are removed. 
*/ 2560b83eabeaSRichard Henderson static void liveness_pass_1(TCGContext *s) 2561c896fe29Sbellard { 2562c70fbf0aSRichard Henderson int nb_globals = s->nb_globals; 25632616c808SRichard Henderson int nb_temps = s->nb_temps; 256415fa08f8SRichard Henderson TCGOp *op, *op_prev; 256525f49c5fSRichard Henderson TCGRegSet *prefs; 256625f49c5fSRichard Henderson int i; 256725f49c5fSRichard Henderson 256825f49c5fSRichard Henderson prefs = tcg_malloc(sizeof(TCGRegSet) * nb_temps); 256925f49c5fSRichard Henderson for (i = 0; i < nb_temps; ++i) { 257025f49c5fSRichard Henderson s->temps[i].state_ptr = prefs + i; 257125f49c5fSRichard Henderson } 2572c896fe29Sbellard 2573ae36a246SRichard Henderson /* ??? Should be redundant with the exit_tb that ends the TB. */ 25742616c808SRichard Henderson la_func_end(s, nb_globals, nb_temps); 2575c896fe29Sbellard 2576eae3eb3eSPaolo Bonzini QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, link, op_prev) { 257725f49c5fSRichard Henderson int nb_iargs, nb_oargs; 2578c45cb8bbSRichard Henderson TCGOpcode opc_new, opc_new2; 2579c45cb8bbSRichard Henderson bool have_opc_new2; 2580a1b3c48dSRichard Henderson TCGLifeData arg_life = 0; 258125f49c5fSRichard Henderson TCGTemp *ts; 2582c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 2583c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 2584c45cb8bbSRichard Henderson 2585c45cb8bbSRichard Henderson switch (opc) { 2586c896fe29Sbellard case INDEX_op_call: 2587c6e113f5Sbellard { 2588c6e113f5Sbellard int call_flags; 258925f49c5fSRichard Henderson int nb_call_regs; 2590c6e113f5Sbellard 2591cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2592cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 259390163900SRichard Henderson call_flags = tcg_call_flags(op); 2594c6e113f5Sbellard 2595c45cb8bbSRichard Henderson /* pure functions can be removed if their result is unused */ 259678505279SAurelien Jarno if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) { 2597c6e113f5Sbellard for (i = 0; i < nb_oargs; i++) { 
259825f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 259925f49c5fSRichard Henderson if (ts->state != TS_DEAD) { 2600c6e113f5Sbellard goto do_not_remove_call; 2601c6e113f5Sbellard } 26029c43b68dSAurelien Jarno } 2603c45cb8bbSRichard Henderson goto do_remove; 2604152c35aaSRichard Henderson } 2605c6e113f5Sbellard do_not_remove_call: 2606c896fe29Sbellard 260725f49c5fSRichard Henderson /* Output args are dead. */ 2608c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 260925f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 261025f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2611a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 26126b64b624SAurelien Jarno } 261325f49c5fSRichard Henderson if (ts->state & TS_MEM) { 2614a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 26159c43b68dSAurelien Jarno } 261625f49c5fSRichard Henderson ts->state = TS_DEAD; 261725f49c5fSRichard Henderson la_reset_pref(ts); 261825f49c5fSRichard Henderson 261925f49c5fSRichard Henderson /* Not used -- it will be tcg_target_call_oarg_regs[i]. */ 262025f49c5fSRichard Henderson op->output_pref[i] = 0; 2621c896fe29Sbellard } 2622c896fe29Sbellard 262378505279SAurelien Jarno if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS | 262478505279SAurelien Jarno TCG_CALL_NO_READ_GLOBALS))) { 2625f65a061cSRichard Henderson la_global_kill(s, nb_globals); 2626c70fbf0aSRichard Henderson } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) { 2627f65a061cSRichard Henderson la_global_sync(s, nb_globals); 2628b9c18f56Saurel32 } 2629c896fe29Sbellard 263025f49c5fSRichard Henderson /* Record arguments that die in this helper. 
*/ 2631866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 263225f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 263325f49c5fSRichard Henderson if (ts && ts->state & TS_DEAD) { 2634a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2635c896fe29Sbellard } 2636c896fe29Sbellard } 263725f49c5fSRichard Henderson 263825f49c5fSRichard Henderson /* For all live registers, remove call-clobbered prefs. */ 263925f49c5fSRichard Henderson la_cross_call(s, nb_temps); 264025f49c5fSRichard Henderson 264125f49c5fSRichard Henderson nb_call_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 264225f49c5fSRichard Henderson 264325f49c5fSRichard Henderson /* Input arguments are live for preceding opcodes. */ 264425f49c5fSRichard Henderson for (i = 0; i < nb_iargs; i++) { 264525f49c5fSRichard Henderson ts = arg_temp(op->args[i + nb_oargs]); 264625f49c5fSRichard Henderson if (ts && ts->state & TS_DEAD) { 264725f49c5fSRichard Henderson /* For those arguments that die, and will be allocated 264825f49c5fSRichard Henderson * in registers, clear the register set for that arg, 264925f49c5fSRichard Henderson * to be filled in below. For args that will be on 265025f49c5fSRichard Henderson * the stack, reset to any available reg. 265125f49c5fSRichard Henderson */ 265225f49c5fSRichard Henderson *la_temp_pref(ts) 265325f49c5fSRichard Henderson = (i < nb_call_regs ? 0 : 265425f49c5fSRichard Henderson tcg_target_available_regs[ts->type]); 265525f49c5fSRichard Henderson ts->state &= ~TS_DEAD; 265625f49c5fSRichard Henderson } 265725f49c5fSRichard Henderson } 265825f49c5fSRichard Henderson 265925f49c5fSRichard Henderson /* For each input argument, add its input register to prefs. 266025f49c5fSRichard Henderson If a temp is used once, this produces a single set bit. 
*/ 266125f49c5fSRichard Henderson for (i = 0; i < MIN(nb_call_regs, nb_iargs); i++) { 266225f49c5fSRichard Henderson ts = arg_temp(op->args[i + nb_oargs]); 266325f49c5fSRichard Henderson if (ts) { 266425f49c5fSRichard Henderson tcg_regset_set_reg(*la_temp_pref(ts), 266525f49c5fSRichard Henderson tcg_target_call_iarg_regs[i]); 2666c70fbf0aSRichard Henderson } 2667c19f47bfSAurelien Jarno } 2668c6e113f5Sbellard } 2669c896fe29Sbellard break; 2670765b842aSRichard Henderson case INDEX_op_insn_start: 2671c896fe29Sbellard break; 26725ff9d6a4Sbellard case INDEX_op_discard: 26735ff9d6a4Sbellard /* mark the temporary as dead */ 267425f49c5fSRichard Henderson ts = arg_temp(op->args[0]); 267525f49c5fSRichard Henderson ts->state = TS_DEAD; 267625f49c5fSRichard Henderson la_reset_pref(ts); 26775ff9d6a4Sbellard break; 26781305c451SRichard Henderson 26791305c451SRichard Henderson case INDEX_op_add2_i32: 2680c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i32; 2681f1fae40cSRichard Henderson goto do_addsub2; 26821305c451SRichard Henderson case INDEX_op_sub2_i32: 2683c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i32; 2684f1fae40cSRichard Henderson goto do_addsub2; 2685f1fae40cSRichard Henderson case INDEX_op_add2_i64: 2686c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i64; 2687f1fae40cSRichard Henderson goto do_addsub2; 2688f1fae40cSRichard Henderson case INDEX_op_sub2_i64: 2689c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i64; 2690f1fae40cSRichard Henderson do_addsub2: 26911305c451SRichard Henderson nb_iargs = 4; 26921305c451SRichard Henderson nb_oargs = 2; 26931305c451SRichard Henderson /* Test if the high part of the operation is dead, but not 26941305c451SRichard Henderson the low part. The result can be optimized to a simple 26951305c451SRichard Henderson add or sub. This happens often for x86_64 guest when the 26961305c451SRichard Henderson cpu mode is set to 32 bit. 
*/ 2697b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2698b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 26991305c451SRichard Henderson goto do_remove; 27001305c451SRichard Henderson } 2701c45cb8bbSRichard Henderson /* Replace the opcode and adjust the args in place, 2702c45cb8bbSRichard Henderson leaving 3 unused args at the end. */ 2703c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2704efee3746SRichard Henderson op->args[1] = op->args[2]; 2705efee3746SRichard Henderson op->args[2] = op->args[4]; 27061305c451SRichard Henderson /* Fall through and mark the single-word operation live. */ 27071305c451SRichard Henderson nb_iargs = 2; 27081305c451SRichard Henderson nb_oargs = 1; 27091305c451SRichard Henderson } 27101305c451SRichard Henderson goto do_not_remove; 27111305c451SRichard Henderson 27121414968aSRichard Henderson case INDEX_op_mulu2_i32: 2713c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2714c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i32; 2715c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i32; 271603271524SRichard Henderson goto do_mul2; 2717f1fae40cSRichard Henderson case INDEX_op_muls2_i32: 2718c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2719c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i32; 2720c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i32; 2721f1fae40cSRichard Henderson goto do_mul2; 2722f1fae40cSRichard Henderson case INDEX_op_mulu2_i64: 2723c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2724c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i64; 2725c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i64; 272603271524SRichard Henderson goto do_mul2; 2727f1fae40cSRichard Henderson case INDEX_op_muls2_i64: 2728c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2729c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i64; 2730c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i64; 
273103271524SRichard Henderson goto do_mul2; 2732f1fae40cSRichard Henderson do_mul2: 27331414968aSRichard Henderson nb_iargs = 2; 27341414968aSRichard Henderson nb_oargs = 2; 2735b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2736b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 273703271524SRichard Henderson /* Both parts of the operation are dead. */ 27381414968aSRichard Henderson goto do_remove; 27391414968aSRichard Henderson } 274003271524SRichard Henderson /* The high part of the operation is dead; generate the low. */ 2741c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2742efee3746SRichard Henderson op->args[1] = op->args[2]; 2743efee3746SRichard Henderson op->args[2] = op->args[3]; 2744b83eabeaSRichard Henderson } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) { 274503271524SRichard Henderson /* The low part of the operation is dead; generate the high. */ 2746c45cb8bbSRichard Henderson op->opc = opc = opc_new2; 2747efee3746SRichard Henderson op->args[0] = op->args[1]; 2748efee3746SRichard Henderson op->args[1] = op->args[2]; 2749efee3746SRichard Henderson op->args[2] = op->args[3]; 275003271524SRichard Henderson } else { 275103271524SRichard Henderson goto do_not_remove; 275203271524SRichard Henderson } 275303271524SRichard Henderson /* Mark the single-word operation live. */ 27541414968aSRichard Henderson nb_oargs = 1; 27551414968aSRichard Henderson goto do_not_remove; 27561414968aSRichard Henderson 2757c896fe29Sbellard default: 27581305c451SRichard Henderson /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */ 2759c896fe29Sbellard nb_iargs = def->nb_iargs; 2760c896fe29Sbellard nb_oargs = def->nb_oargs; 2761c896fe29Sbellard 2762c896fe29Sbellard /* Test if the operation can be removed because all 27635ff9d6a4Sbellard its outputs are dead. 
We assume that nb_oargs == 0 27645ff9d6a4Sbellard implies side effects */ 27655ff9d6a4Sbellard if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) { 2766c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2767b83eabeaSRichard Henderson if (arg_temp(op->args[i])->state != TS_DEAD) { 2768c896fe29Sbellard goto do_not_remove; 2769c896fe29Sbellard } 27709c43b68dSAurelien Jarno } 2771152c35aaSRichard Henderson goto do_remove; 2772152c35aaSRichard Henderson } 2773152c35aaSRichard Henderson goto do_not_remove; 2774152c35aaSRichard Henderson 27751305c451SRichard Henderson do_remove: 27760c627cdcSRichard Henderson tcg_op_remove(s, op); 2777152c35aaSRichard Henderson break; 2778152c35aaSRichard Henderson 2779c896fe29Sbellard do_not_remove: 2780c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 278125f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 278225f49c5fSRichard Henderson 278325f49c5fSRichard Henderson /* Remember the preference of the uses that followed. */ 278425f49c5fSRichard Henderson op->output_pref[i] = *la_temp_pref(ts); 278525f49c5fSRichard Henderson 278625f49c5fSRichard Henderson /* Output args are dead. */ 278725f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2788a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 27896b64b624SAurelien Jarno } 279025f49c5fSRichard Henderson if (ts->state & TS_MEM) { 2791a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 27929c43b68dSAurelien Jarno } 279325f49c5fSRichard Henderson ts->state = TS_DEAD; 279425f49c5fSRichard Henderson la_reset_pref(ts); 2795c896fe29Sbellard } 2796c896fe29Sbellard 279725f49c5fSRichard Henderson /* If end of basic block, update. 
*/ 2798ae36a246SRichard Henderson if (def->flags & TCG_OPF_BB_EXIT) { 2799ae36a246SRichard Henderson la_func_end(s, nb_globals, nb_temps); 2800b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_COND_BRANCH) { 2801b4cb76e6SRichard Henderson la_bb_sync(s, nb_globals, nb_temps); 2802ae36a246SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 28032616c808SRichard Henderson la_bb_end(s, nb_globals, nb_temps); 28043d5c5f87SAurelien Jarno } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 2805f65a061cSRichard Henderson la_global_sync(s, nb_globals); 280625f49c5fSRichard Henderson if (def->flags & TCG_OPF_CALL_CLOBBER) { 280725f49c5fSRichard Henderson la_cross_call(s, nb_temps); 280825f49c5fSRichard Henderson } 2809c896fe29Sbellard } 2810c896fe29Sbellard 281125f49c5fSRichard Henderson /* Record arguments that die in this opcode. */ 2812866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 281325f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 281425f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2815a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2816c896fe29Sbellard } 2817c19f47bfSAurelien Jarno } 281825f49c5fSRichard Henderson 281925f49c5fSRichard Henderson /* Input arguments are live for preceding opcodes. */ 2820c19f47bfSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 282125f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 282225f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 282325f49c5fSRichard Henderson /* For operands that were dead, initially allow 282425f49c5fSRichard Henderson all regs for the type. */ 282525f49c5fSRichard Henderson *la_temp_pref(ts) = tcg_target_available_regs[ts->type]; 282625f49c5fSRichard Henderson ts->state &= ~TS_DEAD; 282725f49c5fSRichard Henderson } 282825f49c5fSRichard Henderson } 282925f49c5fSRichard Henderson 283025f49c5fSRichard Henderson /* Incorporate constraints for this operand. 
*/ 283125f49c5fSRichard Henderson switch (opc) { 283225f49c5fSRichard Henderson case INDEX_op_mov_i32: 283325f49c5fSRichard Henderson case INDEX_op_mov_i64: 283425f49c5fSRichard Henderson /* Note that these are TCG_OPF_NOT_PRESENT and do not 283525f49c5fSRichard Henderson have proper constraints. That said, special case 283625f49c5fSRichard Henderson moves to propagate preferences backward. */ 283725f49c5fSRichard Henderson if (IS_DEAD_ARG(1)) { 283825f49c5fSRichard Henderson *la_temp_pref(arg_temp(op->args[0])) 283925f49c5fSRichard Henderson = *la_temp_pref(arg_temp(op->args[1])); 284025f49c5fSRichard Henderson } 284125f49c5fSRichard Henderson break; 284225f49c5fSRichard Henderson 284325f49c5fSRichard Henderson default: 284425f49c5fSRichard Henderson for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 284525f49c5fSRichard Henderson const TCGArgConstraint *ct = &def->args_ct[i]; 284625f49c5fSRichard Henderson TCGRegSet set, *pset; 284725f49c5fSRichard Henderson 284825f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 284925f49c5fSRichard Henderson pset = la_temp_pref(ts); 285025f49c5fSRichard Henderson set = *pset; 285125f49c5fSRichard Henderson 28529be0d080SRichard Henderson set &= ct->regs; 2853bc2b17e6SRichard Henderson if (ct->ialias) { 285425f49c5fSRichard Henderson set &= op->output_pref[ct->alias_index]; 285525f49c5fSRichard Henderson } 285625f49c5fSRichard Henderson /* If the combination is not possible, restart. */ 285725f49c5fSRichard Henderson if (set == 0) { 28589be0d080SRichard Henderson set = ct->regs; 285925f49c5fSRichard Henderson } 286025f49c5fSRichard Henderson *pset = set; 286125f49c5fSRichard Henderson } 286225f49c5fSRichard Henderson break; 2863c896fe29Sbellard } 2864c896fe29Sbellard break; 2865c896fe29Sbellard } 2866bee158cbSRichard Henderson op->life = arg_life; 2867c896fe29Sbellard } 28681ff0a2c5SEvgeny Voevodin } 2869c896fe29Sbellard 28705a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries. 
*/ 2871b83eabeaSRichard Henderson static bool liveness_pass_2(TCGContext *s) 28725a18407fSRichard Henderson { 28735a18407fSRichard Henderson int nb_globals = s->nb_globals; 287415fa08f8SRichard Henderson int nb_temps, i; 28755a18407fSRichard Henderson bool changes = false; 287615fa08f8SRichard Henderson TCGOp *op, *op_next; 28775a18407fSRichard Henderson 28785a18407fSRichard Henderson /* Create a temporary for each indirect global. */ 28795a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 28805a18407fSRichard Henderson TCGTemp *its = &s->temps[i]; 28815a18407fSRichard Henderson if (its->indirect_reg) { 28825a18407fSRichard Henderson TCGTemp *dts = tcg_temp_alloc(s); 28835a18407fSRichard Henderson dts->type = its->type; 28845a18407fSRichard Henderson dts->base_type = its->base_type; 2885c7482438SRichard Henderson dts->kind = TEMP_EBB; 2886b83eabeaSRichard Henderson its->state_ptr = dts; 2887b83eabeaSRichard Henderson } else { 2888b83eabeaSRichard Henderson its->state_ptr = NULL; 28895a18407fSRichard Henderson } 2890b83eabeaSRichard Henderson /* All globals begin dead. 
*/ 2891b83eabeaSRichard Henderson its->state = TS_DEAD; 28925a18407fSRichard Henderson } 2893b83eabeaSRichard Henderson for (nb_temps = s->nb_temps; i < nb_temps; ++i) { 2894b83eabeaSRichard Henderson TCGTemp *its = &s->temps[i]; 2895b83eabeaSRichard Henderson its->state_ptr = NULL; 2896b83eabeaSRichard Henderson its->state = TS_DEAD; 2897b83eabeaSRichard Henderson } 28985a18407fSRichard Henderson 289915fa08f8SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 29005a18407fSRichard Henderson TCGOpcode opc = op->opc; 29015a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 29025a18407fSRichard Henderson TCGLifeData arg_life = op->life; 29035a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 2904b83eabeaSRichard Henderson TCGTemp *arg_ts, *dir_ts; 29055a18407fSRichard Henderson 29065a18407fSRichard Henderson if (opc == INDEX_op_call) { 2907cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2908cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 290990163900SRichard Henderson call_flags = tcg_call_flags(op); 29105a18407fSRichard Henderson } else { 29115a18407fSRichard Henderson nb_iargs = def->nb_iargs; 29125a18407fSRichard Henderson nb_oargs = def->nb_oargs; 29135a18407fSRichard Henderson 29145a18407fSRichard Henderson /* Set flags similar to how calls require. 
*/ 2915b4cb76e6SRichard Henderson if (def->flags & TCG_OPF_COND_BRANCH) { 2916b4cb76e6SRichard Henderson /* Like reading globals: sync_globals */ 2917b4cb76e6SRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 2918b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 29195a18407fSRichard Henderson /* Like writing globals: save_globals */ 29205a18407fSRichard Henderson call_flags = 0; 29215a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 29225a18407fSRichard Henderson /* Like reading globals: sync_globals */ 29235a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 29245a18407fSRichard Henderson } else { 29255a18407fSRichard Henderson /* No effect on globals. */ 29265a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 29275a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 29285a18407fSRichard Henderson } 29295a18407fSRichard Henderson } 29305a18407fSRichard Henderson 29315a18407fSRichard Henderson /* Make sure that input arguments are available. */ 29325a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2933b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2934b83eabeaSRichard Henderson if (arg_ts) { 2935b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2936b83eabeaSRichard Henderson if (dir_ts && arg_ts->state == TS_DEAD) { 2937b83eabeaSRichard Henderson TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32 29385a18407fSRichard Henderson ? INDEX_op_ld_i32 29395a18407fSRichard Henderson : INDEX_op_ld_i64); 2940ac1043f6SEmilio G. Cota TCGOp *lop = tcg_op_insert_before(s, op, lopc); 29415a18407fSRichard Henderson 2942b83eabeaSRichard Henderson lop->args[0] = temp_arg(dir_ts); 2943b83eabeaSRichard Henderson lop->args[1] = temp_arg(arg_ts->mem_base); 2944b83eabeaSRichard Henderson lop->args[2] = arg_ts->mem_offset; 29455a18407fSRichard Henderson 29465a18407fSRichard Henderson /* Loaded, but synced with memory. 
*/ 2947b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 29485a18407fSRichard Henderson } 29495a18407fSRichard Henderson } 29505a18407fSRichard Henderson } 29515a18407fSRichard Henderson 29525a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 29535a18407fSRichard Henderson No action is required except keeping temp_state up to date 29545a18407fSRichard Henderson so that we reload when needed. */ 29555a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2956b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2957b83eabeaSRichard Henderson if (arg_ts) { 2958b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2959b83eabeaSRichard Henderson if (dir_ts) { 2960b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 29615a18407fSRichard Henderson changes = true; 29625a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2963b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 29645a18407fSRichard Henderson } 29655a18407fSRichard Henderson } 29665a18407fSRichard Henderson } 29675a18407fSRichard Henderson } 29685a18407fSRichard Henderson 29695a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 29705a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 29715a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 29725a18407fSRichard Henderson /* Nothing to do */ 29735a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 29745a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 29755a18407fSRichard Henderson /* Liveness should see that globals are synced back, 29765a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. 
*/ 2977b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2978b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2979b83eabeaSRichard Henderson || arg_ts->state != 0); 29805a18407fSRichard Henderson } 29815a18407fSRichard Henderson } else { 29825a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 29835a18407fSRichard Henderson /* Liveness should see that globals are saved back, 29845a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. */ 2985b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2986b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2987b83eabeaSRichard Henderson || arg_ts->state == TS_DEAD); 29885a18407fSRichard Henderson } 29895a18407fSRichard Henderson } 29905a18407fSRichard Henderson 29915a18407fSRichard Henderson /* Outputs become available. */ 299261f15c48SRichard Henderson if (opc == INDEX_op_mov_i32 || opc == INDEX_op_mov_i64) { 299361f15c48SRichard Henderson arg_ts = arg_temp(op->args[0]); 299461f15c48SRichard Henderson dir_ts = arg_ts->state_ptr; 299561f15c48SRichard Henderson if (dir_ts) { 299661f15c48SRichard Henderson op->args[0] = temp_arg(dir_ts); 299761f15c48SRichard Henderson changes = true; 299861f15c48SRichard Henderson 299961f15c48SRichard Henderson /* The output is now live and modified. */ 300061f15c48SRichard Henderson arg_ts->state = 0; 300161f15c48SRichard Henderson 300261f15c48SRichard Henderson if (NEED_SYNC_ARG(0)) { 300361f15c48SRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 300461f15c48SRichard Henderson ? 
INDEX_op_st_i32 300561f15c48SRichard Henderson : INDEX_op_st_i64); 300661f15c48SRichard Henderson TCGOp *sop = tcg_op_insert_after(s, op, sopc); 300761f15c48SRichard Henderson TCGTemp *out_ts = dir_ts; 300861f15c48SRichard Henderson 300961f15c48SRichard Henderson if (IS_DEAD_ARG(0)) { 301061f15c48SRichard Henderson out_ts = arg_temp(op->args[1]); 301161f15c48SRichard Henderson arg_ts->state = TS_DEAD; 301261f15c48SRichard Henderson tcg_op_remove(s, op); 301361f15c48SRichard Henderson } else { 301461f15c48SRichard Henderson arg_ts->state = TS_MEM; 301561f15c48SRichard Henderson } 301661f15c48SRichard Henderson 301761f15c48SRichard Henderson sop->args[0] = temp_arg(out_ts); 301861f15c48SRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 301961f15c48SRichard Henderson sop->args[2] = arg_ts->mem_offset; 302061f15c48SRichard Henderson } else { 302161f15c48SRichard Henderson tcg_debug_assert(!IS_DEAD_ARG(0)); 302261f15c48SRichard Henderson } 302361f15c48SRichard Henderson } 302461f15c48SRichard Henderson } else { 30255a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 3026b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 3027b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 3028b83eabeaSRichard Henderson if (!dir_ts) { 30295a18407fSRichard Henderson continue; 30305a18407fSRichard Henderson } 3031b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 30325a18407fSRichard Henderson changes = true; 30335a18407fSRichard Henderson 30345a18407fSRichard Henderson /* The output is now live and modified. */ 3035b83eabeaSRichard Henderson arg_ts->state = 0; 30365a18407fSRichard Henderson 30375a18407fSRichard Henderson /* Sync outputs upon their last write. */ 30385a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 3039b83eabeaSRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 30405a18407fSRichard Henderson ? INDEX_op_st_i32 30415a18407fSRichard Henderson : INDEX_op_st_i64); 3042ac1043f6SEmilio G. 
Cota TCGOp *sop = tcg_op_insert_after(s, op, sopc); 30435a18407fSRichard Henderson 3044b83eabeaSRichard Henderson sop->args[0] = temp_arg(dir_ts); 3045b83eabeaSRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 3046b83eabeaSRichard Henderson sop->args[2] = arg_ts->mem_offset; 30475a18407fSRichard Henderson 3048b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 30495a18407fSRichard Henderson } 30505a18407fSRichard Henderson /* Drop outputs that are dead. */ 30515a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 3052b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 30535a18407fSRichard Henderson } 30545a18407fSRichard Henderson } 30555a18407fSRichard Henderson } 305661f15c48SRichard Henderson } 30575a18407fSRichard Henderson 30585a18407fSRichard Henderson return changes; 30595a18407fSRichard Henderson } 30605a18407fSRichard Henderson 30612272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts) 3062c896fe29Sbellard { 306331c96417SRichard Henderson int size = tcg_type_size(ts->type); 306431c96417SRichard Henderson int align; 306531c96417SRichard Henderson intptr_t off; 3066c1c09194SRichard Henderson 3067c1c09194SRichard Henderson switch (ts->type) { 3068c1c09194SRichard Henderson case TCG_TYPE_I32: 306931c96417SRichard Henderson align = 4; 3070c1c09194SRichard Henderson break; 3071c1c09194SRichard Henderson case TCG_TYPE_I64: 3072c1c09194SRichard Henderson case TCG_TYPE_V64: 307331c96417SRichard Henderson align = 8; 3074c1c09194SRichard Henderson break; 3075c1c09194SRichard Henderson case TCG_TYPE_V128: 3076c1c09194SRichard Henderson case TCG_TYPE_V256: 3077c1c09194SRichard Henderson /* Note that we do not require aligned storage for V256. 
*/ 307831c96417SRichard Henderson align = 16; 3079c1c09194SRichard Henderson break; 3080c1c09194SRichard Henderson default: 3081c1c09194SRichard Henderson g_assert_not_reached(); 3082b591dc59SBlue Swirl } 3083c1c09194SRichard Henderson 3084b9537d59SRichard Henderson /* 3085b9537d59SRichard Henderson * Assume the stack is sufficiently aligned. 3086b9537d59SRichard Henderson * This affects e.g. ARM NEON, where we have 8 byte stack alignment 3087b9537d59SRichard Henderson * and do not require 16 byte vector alignment. This seems slightly 3088b9537d59SRichard Henderson * easier than fully parameterizing the above switch statement. 3089b9537d59SRichard Henderson */ 3090b9537d59SRichard Henderson align = MIN(TCG_TARGET_STACK_ALIGN, align); 3091c1c09194SRichard Henderson off = ROUND_UP(s->current_frame_offset, align); 3092732d5897SRichard Henderson 3093732d5897SRichard Henderson /* If we've exhausted the stack frame, restart with a smaller TB. */ 3094732d5897SRichard Henderson if (off + size > s->frame_end) { 3095732d5897SRichard Henderson tcg_raise_tb_overflow(s); 3096732d5897SRichard Henderson } 3097c1c09194SRichard Henderson s->current_frame_offset = off + size; 3098c1c09194SRichard Henderson 3099c1c09194SRichard Henderson ts->mem_offset = off; 31009defd1bdSRichard Henderson #if defined(__sparc__) 31019defd1bdSRichard Henderson ts->mem_offset += TCG_TARGET_STACK_BIAS; 31029defd1bdSRichard Henderson #endif 3103b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 3104c896fe29Sbellard ts->mem_allocated = 1; 3105c896fe29Sbellard } 3106c896fe29Sbellard 3107098859f1SRichard Henderson /* Assign @reg to @ts, and update reg_to_temp[]. 
*/ 3108098859f1SRichard Henderson static void set_temp_val_reg(TCGContext *s, TCGTemp *ts, TCGReg reg) 3109098859f1SRichard Henderson { 3110098859f1SRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 3111098859f1SRichard Henderson TCGReg old = ts->reg; 3112098859f1SRichard Henderson tcg_debug_assert(s->reg_to_temp[old] == ts); 3113098859f1SRichard Henderson if (old == reg) { 3114098859f1SRichard Henderson return; 3115098859f1SRichard Henderson } 3116098859f1SRichard Henderson s->reg_to_temp[old] = NULL; 3117098859f1SRichard Henderson } 3118098859f1SRichard Henderson tcg_debug_assert(s->reg_to_temp[reg] == NULL); 3119098859f1SRichard Henderson s->reg_to_temp[reg] = ts; 3120098859f1SRichard Henderson ts->val_type = TEMP_VAL_REG; 3121098859f1SRichard Henderson ts->reg = reg; 3122098859f1SRichard Henderson } 3123098859f1SRichard Henderson 3124098859f1SRichard Henderson /* Assign a non-register value type to @ts, and update reg_to_temp[]. */ 3125098859f1SRichard Henderson static void set_temp_val_nonreg(TCGContext *s, TCGTemp *ts, TCGTempVal type) 3126098859f1SRichard Henderson { 3127098859f1SRichard Henderson tcg_debug_assert(type != TEMP_VAL_REG); 3128098859f1SRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 3129098859f1SRichard Henderson TCGReg reg = ts->reg; 3130098859f1SRichard Henderson tcg_debug_assert(s->reg_to_temp[reg] == ts); 3131098859f1SRichard Henderson s->reg_to_temp[reg] = NULL; 3132098859f1SRichard Henderson } 3133098859f1SRichard Henderson ts->val_type = type; 3134098859f1SRichard Henderson } 3135098859f1SRichard Henderson 3136b722452aSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet, TCGRegSet); 3137b3915dbbSRichard Henderson 313859d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 313959d7c14eSRichard Henderson mark it free; otherwise mark it dead. 
*/ 314059d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 3141c896fe29Sbellard { 3142c0522136SRichard Henderson TCGTempVal new_type; 3143c0522136SRichard Henderson 3144c0522136SRichard Henderson switch (ts->kind) { 3145c0522136SRichard Henderson case TEMP_FIXED: 314659d7c14eSRichard Henderson return; 3147c0522136SRichard Henderson case TEMP_GLOBAL: 3148c0522136SRichard Henderson case TEMP_LOCAL: 3149c0522136SRichard Henderson new_type = TEMP_VAL_MEM; 3150c0522136SRichard Henderson break; 3151c0522136SRichard Henderson case TEMP_NORMAL: 3152c7482438SRichard Henderson case TEMP_EBB: 3153c0522136SRichard Henderson new_type = free_or_dead < 0 ? TEMP_VAL_MEM : TEMP_VAL_DEAD; 3154c0522136SRichard Henderson break; 3155c0522136SRichard Henderson case TEMP_CONST: 3156c0522136SRichard Henderson new_type = TEMP_VAL_CONST; 3157c0522136SRichard Henderson break; 3158c0522136SRichard Henderson default: 3159c0522136SRichard Henderson g_assert_not_reached(); 316059d7c14eSRichard Henderson } 3161098859f1SRichard Henderson set_temp_val_nonreg(s, ts, new_type); 316259d7c14eSRichard Henderson } 3163c896fe29Sbellard 316459d7c14eSRichard Henderson /* Mark a temporary as dead. */ 316559d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 316659d7c14eSRichard Henderson { 316759d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 316859d7c14eSRichard Henderson } 316959d7c14eSRichard Henderson 317059d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 317159d7c14eSRichard Henderson registers needs to be allocated to store a constant. If 'free_or_dead' 317259d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 317359d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. 
*/ 317498b4e186SRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs, 317598b4e186SRichard Henderson TCGRegSet preferred_regs, int free_or_dead) 317659d7c14eSRichard Henderson { 3177c0522136SRichard Henderson if (!temp_readonly(ts) && !ts->mem_coherent) { 31787f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 31792272e4a7SRichard Henderson temp_allocate_frame(s, ts); 318059d7c14eSRichard Henderson } 318159d7c14eSRichard Henderson switch (ts->val_type) { 318259d7c14eSRichard Henderson case TEMP_VAL_CONST: 318359d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 318459d7c14eSRichard Henderson require it later in a register, so attempt to store the 318559d7c14eSRichard Henderson constant to memory directly. */ 318659d7c14eSRichard Henderson if (free_or_dead 318759d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 318859d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 318959d7c14eSRichard Henderson break; 319059d7c14eSRichard Henderson } 319159d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 319298b4e186SRichard Henderson allocated_regs, preferred_regs); 319359d7c14eSRichard Henderson /* fallthrough */ 319459d7c14eSRichard Henderson 319559d7c14eSRichard Henderson case TEMP_VAL_REG: 319659d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 319759d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 319859d7c14eSRichard Henderson break; 319959d7c14eSRichard Henderson 320059d7c14eSRichard Henderson case TEMP_VAL_MEM: 320159d7c14eSRichard Henderson break; 320259d7c14eSRichard Henderson 320359d7c14eSRichard Henderson case TEMP_VAL_DEAD: 320459d7c14eSRichard Henderson default: 320559d7c14eSRichard Henderson tcg_abort(); 3206c896fe29Sbellard } 32077f6ceedfSAurelien Jarno ts->mem_coherent = 1; 32087f6ceedfSAurelien Jarno } 320959d7c14eSRichard Henderson if (free_or_dead) { 321059d7c14eSRichard Henderson temp_free_or_dead(s, ts, 
free_or_dead); 321159d7c14eSRichard Henderson } 321259d7c14eSRichard Henderson } 32137f6ceedfSAurelien Jarno 32147f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 3215b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 32167f6ceedfSAurelien Jarno { 3217f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 3218f8b2f202SRichard Henderson if (ts != NULL) { 321998b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, -1); 3220c896fe29Sbellard } 3221c896fe29Sbellard } 3222c896fe29Sbellard 3223b016486eSRichard Henderson /** 3224b016486eSRichard Henderson * tcg_reg_alloc: 3225b016486eSRichard Henderson * @required_regs: Set of registers in which we must allocate. 3226b016486eSRichard Henderson * @allocated_regs: Set of registers which must be avoided. 3227b016486eSRichard Henderson * @preferred_regs: Set of registers we should prefer. 3228b016486eSRichard Henderson * @rev: True if we search the registers in "indirect" order. 3229b016486eSRichard Henderson * 3230b016486eSRichard Henderson * The allocated register must be in @required_regs & ~@allocated_regs, 3231b016486eSRichard Henderson * but if we can put it in @preferred_regs we may save a move later. 
3232b016486eSRichard Henderson */ 3233b016486eSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet required_regs, 3234b016486eSRichard Henderson TCGRegSet allocated_regs, 3235b016486eSRichard Henderson TCGRegSet preferred_regs, bool rev) 3236c896fe29Sbellard { 3237b016486eSRichard Henderson int i, j, f, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 3238b016486eSRichard Henderson TCGRegSet reg_ct[2]; 323991478cefSRichard Henderson const int *order; 3240c896fe29Sbellard 3241b016486eSRichard Henderson reg_ct[1] = required_regs & ~allocated_regs; 3242b016486eSRichard Henderson tcg_debug_assert(reg_ct[1] != 0); 3243b016486eSRichard Henderson reg_ct[0] = reg_ct[1] & preferred_regs; 3244b016486eSRichard Henderson 3245b016486eSRichard Henderson /* Skip the preferred_regs option if it cannot be satisfied, 3246b016486eSRichard Henderson or if the preference made no difference. */ 3247b016486eSRichard Henderson f = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1]; 3248b016486eSRichard Henderson 324991478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 3250c896fe29Sbellard 3251b016486eSRichard Henderson /* Try free registers, preferences first. */ 3252b016486eSRichard Henderson for (j = f; j < 2; j++) { 3253b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 3254b016486eSRichard Henderson 3255b016486eSRichard Henderson if (tcg_regset_single(set)) { 3256b016486eSRichard Henderson /* One register in the set. 
*/ 3257b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 3258b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL) { 3259c896fe29Sbellard return reg; 3260c896fe29Sbellard } 3261b016486eSRichard Henderson } else { 326291478cefSRichard Henderson for (i = 0; i < n; i++) { 3263b016486eSRichard Henderson TCGReg reg = order[i]; 3264b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL && 3265b016486eSRichard Henderson tcg_regset_test_reg(set, reg)) { 3266b016486eSRichard Henderson return reg; 3267b016486eSRichard Henderson } 3268b016486eSRichard Henderson } 3269b016486eSRichard Henderson } 3270b016486eSRichard Henderson } 3271b016486eSRichard Henderson 3272b016486eSRichard Henderson /* We must spill something. */ 3273b016486eSRichard Henderson for (j = f; j < 2; j++) { 3274b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 3275b016486eSRichard Henderson 3276b016486eSRichard Henderson if (tcg_regset_single(set)) { 3277b016486eSRichard Henderson /* One register in the set. 
*/ 3278b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 3279b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3280c896fe29Sbellard return reg; 3281b016486eSRichard Henderson } else { 3282b016486eSRichard Henderson for (i = 0; i < n; i++) { 3283b016486eSRichard Henderson TCGReg reg = order[i]; 3284b016486eSRichard Henderson if (tcg_regset_test_reg(set, reg)) { 3285b016486eSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3286b016486eSRichard Henderson return reg; 3287b016486eSRichard Henderson } 3288b016486eSRichard Henderson } 3289c896fe29Sbellard } 3290c896fe29Sbellard } 3291c896fe29Sbellard 3292c896fe29Sbellard tcg_abort(); 3293c896fe29Sbellard } 3294c896fe29Sbellard 329529f5e925SRichard Henderson static TCGReg tcg_reg_alloc_pair(TCGContext *s, TCGRegSet required_regs, 329629f5e925SRichard Henderson TCGRegSet allocated_regs, 329729f5e925SRichard Henderson TCGRegSet preferred_regs, bool rev) 329829f5e925SRichard Henderson { 329929f5e925SRichard Henderson int i, j, k, fmin, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 330029f5e925SRichard Henderson TCGRegSet reg_ct[2]; 330129f5e925SRichard Henderson const int *order; 330229f5e925SRichard Henderson 330329f5e925SRichard Henderson /* Ensure that if I is not in allocated_regs, I+1 is not either. */ 330429f5e925SRichard Henderson reg_ct[1] = required_regs & ~(allocated_regs | (allocated_regs >> 1)); 330529f5e925SRichard Henderson tcg_debug_assert(reg_ct[1] != 0); 330629f5e925SRichard Henderson reg_ct[0] = reg_ct[1] & preferred_regs; 330729f5e925SRichard Henderson 330829f5e925SRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 330929f5e925SRichard Henderson 331029f5e925SRichard Henderson /* 331129f5e925SRichard Henderson * Skip the preferred_regs option if it cannot be satisfied, 331229f5e925SRichard Henderson * or if the preference made no difference. 
331329f5e925SRichard Henderson */ 331429f5e925SRichard Henderson k = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1]; 331529f5e925SRichard Henderson 331629f5e925SRichard Henderson /* 331729f5e925SRichard Henderson * Minimize the number of flushes by looking for 2 free registers first, 331829f5e925SRichard Henderson * then a single flush, then two flushes. 331929f5e925SRichard Henderson */ 332029f5e925SRichard Henderson for (fmin = 2; fmin >= 0; fmin--) { 332129f5e925SRichard Henderson for (j = k; j < 2; j++) { 332229f5e925SRichard Henderson TCGRegSet set = reg_ct[j]; 332329f5e925SRichard Henderson 332429f5e925SRichard Henderson for (i = 0; i < n; i++) { 332529f5e925SRichard Henderson TCGReg reg = order[i]; 332629f5e925SRichard Henderson 332729f5e925SRichard Henderson if (tcg_regset_test_reg(set, reg)) { 332829f5e925SRichard Henderson int f = !s->reg_to_temp[reg] + !s->reg_to_temp[reg + 1]; 332929f5e925SRichard Henderson if (f >= fmin) { 333029f5e925SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 333129f5e925SRichard Henderson tcg_reg_free(s, reg + 1, allocated_regs); 333229f5e925SRichard Henderson return reg; 333329f5e925SRichard Henderson } 333429f5e925SRichard Henderson } 333529f5e925SRichard Henderson } 333629f5e925SRichard Henderson } 333729f5e925SRichard Henderson } 333829f5e925SRichard Henderson tcg_abort(); 333929f5e925SRichard Henderson } 334029f5e925SRichard Henderson 334140ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 334240ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. 
*/ 334340ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 3344b722452aSRichard Henderson TCGRegSet allocated_regs, TCGRegSet preferred_regs) 334540ae5c62SRichard Henderson { 334640ae5c62SRichard Henderson TCGReg reg; 334740ae5c62SRichard Henderson 334840ae5c62SRichard Henderson switch (ts->val_type) { 334940ae5c62SRichard Henderson case TEMP_VAL_REG: 335040ae5c62SRichard Henderson return; 335140ae5c62SRichard Henderson case TEMP_VAL_CONST: 3352b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3353b722452aSRichard Henderson preferred_regs, ts->indirect_base); 33540a6a8bc8SRichard Henderson if (ts->type <= TCG_TYPE_I64) { 335540ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 33560a6a8bc8SRichard Henderson } else { 33574e186175SRichard Henderson uint64_t val = ts->val; 33584e186175SRichard Henderson MemOp vece = MO_64; 33594e186175SRichard Henderson 33604e186175SRichard Henderson /* 33614e186175SRichard Henderson * Find the minimal vector element that matches the constant. 33624e186175SRichard Henderson * The targets will, in general, have to do this search anyway, 33634e186175SRichard Henderson * do this generically. 
33644e186175SRichard Henderson */ 33654e186175SRichard Henderson if (val == dup_const(MO_8, val)) { 33664e186175SRichard Henderson vece = MO_8; 33674e186175SRichard Henderson } else if (val == dup_const(MO_16, val)) { 33684e186175SRichard Henderson vece = MO_16; 33690b4286ddSRichard Henderson } else if (val == dup_const(MO_32, val)) { 33704e186175SRichard Henderson vece = MO_32; 33714e186175SRichard Henderson } 33724e186175SRichard Henderson 33734e186175SRichard Henderson tcg_out_dupi_vec(s, ts->type, vece, reg, ts->val); 33740a6a8bc8SRichard Henderson } 337540ae5c62SRichard Henderson ts->mem_coherent = 0; 337640ae5c62SRichard Henderson break; 337740ae5c62SRichard Henderson case TEMP_VAL_MEM: 3378b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3379b722452aSRichard Henderson preferred_regs, ts->indirect_base); 338040ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 338140ae5c62SRichard Henderson ts->mem_coherent = 1; 338240ae5c62SRichard Henderson break; 338340ae5c62SRichard Henderson case TEMP_VAL_DEAD: 338440ae5c62SRichard Henderson default: 338540ae5c62SRichard Henderson tcg_abort(); 338640ae5c62SRichard Henderson } 3387098859f1SRichard Henderson set_temp_val_reg(s, ts, reg); 338840ae5c62SRichard Henderson } 338940ae5c62SRichard Henderson 339059d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 3391e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 339259d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 33931ad80729SAurelien Jarno { 33942c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 3395eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. 
*/ 3396e01fa97dSRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || temp_readonly(ts)); 33971ad80729SAurelien Jarno } 33981ad80729SAurelien Jarno 33999814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 3400641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 3401641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 3402641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 3403641d5fbeSbellard { 3404ac3b8891SRichard Henderson int i, n; 3405641d5fbeSbellard 3406ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 3407b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 3408641d5fbeSbellard } 3409e5097dc8Sbellard } 3410e5097dc8Sbellard 34113d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 34123d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 34133d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 34143d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 34153d5c5f87SAurelien Jarno { 3416ac3b8891SRichard Henderson int i, n; 34173d5c5f87SAurelien Jarno 3418ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 341912b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 342012b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 3421ee17db83SRichard Henderson || ts->kind == TEMP_FIXED 342212b9b11aSRichard Henderson || ts->mem_coherent); 34233d5c5f87SAurelien Jarno } 34243d5c5f87SAurelien Jarno } 34253d5c5f87SAurelien Jarno 3426e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 3427e8996ee0Sbellard all globals are stored at their canonical location. 
*/ 3428e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 3429e5097dc8Sbellard { 3430e5097dc8Sbellard int i; 3431e5097dc8Sbellard 3432c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 3433b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 3434c0522136SRichard Henderson 3435c0522136SRichard Henderson switch (ts->kind) { 3436c0522136SRichard Henderson case TEMP_LOCAL: 3437b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 3438c0522136SRichard Henderson break; 3439c0522136SRichard Henderson case TEMP_NORMAL: 3440c7482438SRichard Henderson case TEMP_EBB: 34412c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 3442eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 3443eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3444c0522136SRichard Henderson break; 3445c0522136SRichard Henderson case TEMP_CONST: 3446c0522136SRichard Henderson /* Similarly, we should have freed any allocated register. */ 3447c0522136SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_CONST); 3448c0522136SRichard Henderson break; 3449c0522136SRichard Henderson default: 3450c0522136SRichard Henderson g_assert_not_reached(); 3451c896fe29Sbellard } 3452641d5fbeSbellard } 3453e8996ee0Sbellard 3454e8996ee0Sbellard save_globals(s, allocated_regs); 3455c896fe29Sbellard } 3456c896fe29Sbellard 3457bab1671fSRichard Henderson /* 3458c7482438SRichard Henderson * At a conditional branch, we assume all temporaries are dead unless 3459c7482438SRichard Henderson * explicitly live-across-conditional-branch; all globals and local 3460c7482438SRichard Henderson * temps are synced to their location. 
3461b4cb76e6SRichard Henderson */ 3462b4cb76e6SRichard Henderson static void tcg_reg_alloc_cbranch(TCGContext *s, TCGRegSet allocated_regs) 3463b4cb76e6SRichard Henderson { 3464b4cb76e6SRichard Henderson sync_globals(s, allocated_regs); 3465b4cb76e6SRichard Henderson 3466b4cb76e6SRichard Henderson for (int i = s->nb_globals; i < s->nb_temps; i++) { 3467b4cb76e6SRichard Henderson TCGTemp *ts = &s->temps[i]; 3468b4cb76e6SRichard Henderson /* 3469b4cb76e6SRichard Henderson * The liveness analysis already ensures that temps are dead. 3470b4cb76e6SRichard Henderson * Keep tcg_debug_asserts for safety. 3471b4cb76e6SRichard Henderson */ 3472c0522136SRichard Henderson switch (ts->kind) { 3473c0522136SRichard Henderson case TEMP_LOCAL: 3474b4cb76e6SRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG || ts->mem_coherent); 3475c0522136SRichard Henderson break; 3476c0522136SRichard Henderson case TEMP_NORMAL: 3477b4cb76e6SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3478c0522136SRichard Henderson break; 3479c7482438SRichard Henderson case TEMP_EBB: 3480c0522136SRichard Henderson case TEMP_CONST: 3481c0522136SRichard Henderson break; 3482c0522136SRichard Henderson default: 3483c0522136SRichard Henderson g_assert_not_reached(); 3484b4cb76e6SRichard Henderson } 3485b4cb76e6SRichard Henderson } 3486b4cb76e6SRichard Henderson } 3487b4cb76e6SRichard Henderson 3488b4cb76e6SRichard Henderson /* 3489c58f4c97SRichard Henderson * Specialized code generation for INDEX_op_mov_* with a constant. 3490bab1671fSRichard Henderson */ 34910fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 3492ba87719cSRichard Henderson tcg_target_ulong val, TCGLifeData arg_life, 3493ba87719cSRichard Henderson TCGRegSet preferred_regs) 3494e8996ee0Sbellard { 3495d63e3b6eSRichard Henderson /* ENV should not be modified. 
*/ 3496e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 349759d7c14eSRichard Henderson 349859d7c14eSRichard Henderson /* The movi is not explicitly generated here. */ 3499098859f1SRichard Henderson set_temp_val_nonreg(s, ots, TEMP_VAL_CONST); 3500e8996ee0Sbellard ots->val = val; 350159d7c14eSRichard Henderson ots->mem_coherent = 0; 3502ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 3503ba87719cSRichard Henderson temp_sync(s, ots, s->reserved_regs, preferred_regs, IS_DEAD_ARG(0)); 350459d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 3505f8bf00f1SRichard Henderson temp_dead(s, ots); 35064c4e1ab2SAurelien Jarno } 3507e8996ee0Sbellard } 3508e8996ee0Sbellard 3509bab1671fSRichard Henderson /* 3510bab1671fSRichard Henderson * Specialized code generation for INDEX_op_mov_*. 3511bab1671fSRichard Henderson */ 3512dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op) 3513c896fe29Sbellard { 3514dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 351569e3706dSRichard Henderson TCGRegSet allocated_regs, preferred_regs; 3516c896fe29Sbellard TCGTemp *ts, *ots; 3517450445d5SRichard Henderson TCGType otype, itype; 3518098859f1SRichard Henderson TCGReg oreg, ireg; 3519c896fe29Sbellard 3520d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 352169e3706dSRichard Henderson preferred_regs = op->output_pref[0]; 352243439139SRichard Henderson ots = arg_temp(op->args[0]); 352343439139SRichard Henderson ts = arg_temp(op->args[1]); 3524450445d5SRichard Henderson 3525d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3526e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 3527d63e3b6eSRichard Henderson 3528450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. 
*/ 3529450445d5SRichard Henderson otype = ots->type; 3530450445d5SRichard Henderson itype = ts->type; 3531c896fe29Sbellard 35320fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 35330fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 35340fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 35350fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 35360fe4fca4SPaolo Bonzini temp_dead(s, ts); 35370fe4fca4SPaolo Bonzini } 353869e3706dSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, arg_life, preferred_regs); 35390fe4fca4SPaolo Bonzini return; 35400fe4fca4SPaolo Bonzini } 35410fe4fca4SPaolo Bonzini 35420fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 35430fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 35440fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 35450fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 35460fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 354769e3706dSRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], 354869e3706dSRichard Henderson allocated_regs, preferred_regs); 3549c29c1d7eSAurelien Jarno } 35500fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 3551098859f1SRichard Henderson ireg = ts->reg; 3552098859f1SRichard Henderson 3553d63e3b6eSRichard Henderson if (IS_DEAD_ARG(0)) { 3554c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 3555c29c1d7eSAurelien Jarno liveness analysis disabled). 
*/ 3556eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 3557c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 35582272e4a7SRichard Henderson temp_allocate_frame(s, ots); 3559c29c1d7eSAurelien Jarno } 3560098859f1SRichard Henderson tcg_out_st(s, otype, ireg, ots->mem_base->reg, ots->mem_offset); 3561c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 3562f8bf00f1SRichard Henderson temp_dead(s, ts); 3563c29c1d7eSAurelien Jarno } 3564f8bf00f1SRichard Henderson temp_dead(s, ots); 3565098859f1SRichard Henderson return; 3566098859f1SRichard Henderson } 3567098859f1SRichard Henderson 3568ee17db83SRichard Henderson if (IS_DEAD_ARG(1) && ts->kind != TEMP_FIXED) { 3569098859f1SRichard Henderson /* 3570098859f1SRichard Henderson * The mov can be suppressed. Kill input first, so that it 3571098859f1SRichard Henderson * is unlinked from reg_to_temp, then set the output to the 3572098859f1SRichard Henderson * reg that we saved from the input. 3573098859f1SRichard Henderson */ 3574f8bf00f1SRichard Henderson temp_dead(s, ts); 3575098859f1SRichard Henderson oreg = ireg; 3576c29c1d7eSAurelien Jarno } else { 3577098859f1SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 3578098859f1SRichard Henderson oreg = ots->reg; 3579098859f1SRichard Henderson } else { 3580098859f1SRichard Henderson /* Make sure to not spill the input register during allocation. */ 3581098859f1SRichard Henderson oreg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 3582098859f1SRichard Henderson allocated_regs | ((TCGRegSet)1 << ireg), 3583098859f1SRichard Henderson preferred_regs, ots->indirect_base); 3584c29c1d7eSAurelien Jarno } 3585098859f1SRichard Henderson if (!tcg_out_mov(s, otype, oreg, ireg)) { 3586240c08d0SRichard Henderson /* 3587240c08d0SRichard Henderson * Cross register class move not supported. 3588240c08d0SRichard Henderson * Store the source register into the destination slot 3589240c08d0SRichard Henderson * and leave the destination temp as TEMP_VAL_MEM. 
3590240c08d0SRichard Henderson */ 3591e01fa97dSRichard Henderson assert(!temp_readonly(ots)); 3592240c08d0SRichard Henderson if (!ts->mem_allocated) { 3593240c08d0SRichard Henderson temp_allocate_frame(s, ots); 3594240c08d0SRichard Henderson } 3595098859f1SRichard Henderson tcg_out_st(s, ts->type, ireg, ots->mem_base->reg, ots->mem_offset); 3596098859f1SRichard Henderson set_temp_val_nonreg(s, ts, TEMP_VAL_MEM); 3597240c08d0SRichard Henderson ots->mem_coherent = 1; 3598240c08d0SRichard Henderson return; 359978113e83SRichard Henderson } 3600c29c1d7eSAurelien Jarno } 3601098859f1SRichard Henderson set_temp_val_reg(s, ots, oreg); 3602c896fe29Sbellard ots->mem_coherent = 0; 3603098859f1SRichard Henderson 3604ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 360598b4e186SRichard Henderson temp_sync(s, ots, allocated_regs, 0, 0); 3606c29c1d7eSAurelien Jarno } 3607ec7a869dSAurelien Jarno } 3608c896fe29Sbellard 3609bab1671fSRichard Henderson /* 3610bab1671fSRichard Henderson * Specialized code generation for INDEX_op_dup_vec. 3611bab1671fSRichard Henderson */ 3612bab1671fSRichard Henderson static void tcg_reg_alloc_dup(TCGContext *s, const TCGOp *op) 3613bab1671fSRichard Henderson { 3614bab1671fSRichard Henderson const TCGLifeData arg_life = op->life; 3615bab1671fSRichard Henderson TCGRegSet dup_out_regs, dup_in_regs; 3616bab1671fSRichard Henderson TCGTemp *its, *ots; 3617bab1671fSRichard Henderson TCGType itype, vtype; 3618bab1671fSRichard Henderson unsigned vece; 361931c96417SRichard Henderson int lowpart_ofs; 3620bab1671fSRichard Henderson bool ok; 3621bab1671fSRichard Henderson 3622bab1671fSRichard Henderson ots = arg_temp(op->args[0]); 3623bab1671fSRichard Henderson its = arg_temp(op->args[1]); 3624bab1671fSRichard Henderson 3625bab1671fSRichard Henderson /* ENV should not be modified. 
*/ 3626e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 3627bab1671fSRichard Henderson 3628bab1671fSRichard Henderson itype = its->type; 3629bab1671fSRichard Henderson vece = TCGOP_VECE(op); 3630bab1671fSRichard Henderson vtype = TCGOP_VECL(op) + TCG_TYPE_V64; 3631bab1671fSRichard Henderson 3632bab1671fSRichard Henderson if (its->val_type == TEMP_VAL_CONST) { 3633bab1671fSRichard Henderson /* Propagate constant via movi -> dupi. */ 3634bab1671fSRichard Henderson tcg_target_ulong val = its->val; 3635bab1671fSRichard Henderson if (IS_DEAD_ARG(1)) { 3636bab1671fSRichard Henderson temp_dead(s, its); 3637bab1671fSRichard Henderson } 3638bab1671fSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, arg_life, op->output_pref[0]); 3639bab1671fSRichard Henderson return; 3640bab1671fSRichard Henderson } 3641bab1671fSRichard Henderson 36429be0d080SRichard Henderson dup_out_regs = tcg_op_defs[INDEX_op_dup_vec].args_ct[0].regs; 36439be0d080SRichard Henderson dup_in_regs = tcg_op_defs[INDEX_op_dup_vec].args_ct[1].regs; 3644bab1671fSRichard Henderson 3645bab1671fSRichard Henderson /* Allocate the output register now. */ 3646bab1671fSRichard Henderson if (ots->val_type != TEMP_VAL_REG) { 3647bab1671fSRichard Henderson TCGRegSet allocated_regs = s->reserved_regs; 3648098859f1SRichard Henderson TCGReg oreg; 3649bab1671fSRichard Henderson 3650bab1671fSRichard Henderson if (!IS_DEAD_ARG(1) && its->val_type == TEMP_VAL_REG) { 3651bab1671fSRichard Henderson /* Make sure to not spill the input register. 
*/ 3652bab1671fSRichard Henderson tcg_regset_set_reg(allocated_regs, its->reg); 3653bab1671fSRichard Henderson } 3654098859f1SRichard Henderson oreg = tcg_reg_alloc(s, dup_out_regs, allocated_regs, 3655bab1671fSRichard Henderson op->output_pref[0], ots->indirect_base); 3656098859f1SRichard Henderson set_temp_val_reg(s, ots, oreg); 3657bab1671fSRichard Henderson } 3658bab1671fSRichard Henderson 3659bab1671fSRichard Henderson switch (its->val_type) { 3660bab1671fSRichard Henderson case TEMP_VAL_REG: 3661bab1671fSRichard Henderson /* 3662bab1671fSRichard Henderson * The dup constriaints must be broad, covering all possible VECE. 3663bab1671fSRichard Henderson * However, tcg_op_dup_vec() gets to see the VECE and we allow it 3664bab1671fSRichard Henderson * to fail, indicating that extra moves are required for that case. 3665bab1671fSRichard Henderson */ 3666bab1671fSRichard Henderson if (tcg_regset_test_reg(dup_in_regs, its->reg)) { 3667bab1671fSRichard Henderson if (tcg_out_dup_vec(s, vtype, vece, ots->reg, its->reg)) { 3668bab1671fSRichard Henderson goto done; 3669bab1671fSRichard Henderson } 3670bab1671fSRichard Henderson /* Try again from memory or a vector input register. */ 3671bab1671fSRichard Henderson } 3672bab1671fSRichard Henderson if (!its->mem_coherent) { 3673bab1671fSRichard Henderson /* 3674bab1671fSRichard Henderson * The input register is not synced, and so an extra store 3675bab1671fSRichard Henderson * would be required to use memory. Attempt an integer-vector 3676bab1671fSRichard Henderson * register move first. We do not have a TCGRegSet for this. 3677bab1671fSRichard Henderson */ 3678bab1671fSRichard Henderson if (tcg_out_mov(s, itype, ots->reg, its->reg)) { 3679bab1671fSRichard Henderson break; 3680bab1671fSRichard Henderson } 3681bab1671fSRichard Henderson /* Sync the temp back to its slot and load from there. 
*/ 3682bab1671fSRichard Henderson temp_sync(s, its, s->reserved_regs, 0, 0); 3683bab1671fSRichard Henderson } 3684bab1671fSRichard Henderson /* fall through */ 3685bab1671fSRichard Henderson 3686bab1671fSRichard Henderson case TEMP_VAL_MEM: 368731c96417SRichard Henderson lowpart_ofs = 0; 368831c96417SRichard Henderson if (HOST_BIG_ENDIAN) { 368931c96417SRichard Henderson lowpart_ofs = tcg_type_size(itype) - (1 << vece); 369031c96417SRichard Henderson } 3691d6ecb4a9SRichard Henderson if (tcg_out_dupm_vec(s, vtype, vece, ots->reg, its->mem_base->reg, 369231c96417SRichard Henderson its->mem_offset + lowpart_ofs)) { 3693d6ecb4a9SRichard Henderson goto done; 3694d6ecb4a9SRichard Henderson } 3695098859f1SRichard Henderson /* Load the input into the destination vector register. */ 3696bab1671fSRichard Henderson tcg_out_ld(s, itype, ots->reg, its->mem_base->reg, its->mem_offset); 3697bab1671fSRichard Henderson break; 3698bab1671fSRichard Henderson 3699bab1671fSRichard Henderson default: 3700bab1671fSRichard Henderson g_assert_not_reached(); 3701bab1671fSRichard Henderson } 3702bab1671fSRichard Henderson 3703bab1671fSRichard Henderson /* We now have a vector input register, so dup must succeed. 
*/ 3704bab1671fSRichard Henderson ok = tcg_out_dup_vec(s, vtype, vece, ots->reg, ots->reg); 3705bab1671fSRichard Henderson tcg_debug_assert(ok); 3706bab1671fSRichard Henderson 3707bab1671fSRichard Henderson done: 370836f5539cSRichard Henderson ots->mem_coherent = 0; 3709bab1671fSRichard Henderson if (IS_DEAD_ARG(1)) { 3710bab1671fSRichard Henderson temp_dead(s, its); 3711bab1671fSRichard Henderson } 3712bab1671fSRichard Henderson if (NEED_SYNC_ARG(0)) { 3713bab1671fSRichard Henderson temp_sync(s, ots, s->reserved_regs, 0, 0); 3714bab1671fSRichard Henderson } 3715bab1671fSRichard Henderson if (IS_DEAD_ARG(0)) { 3716bab1671fSRichard Henderson temp_dead(s, ots); 3717bab1671fSRichard Henderson } 3718bab1671fSRichard Henderson } 3719bab1671fSRichard Henderson 3720dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op) 3721c896fe29Sbellard { 3722dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3723dd186292SRichard Henderson const TCGOpDef * const def = &tcg_op_defs[op->opc]; 372482790a87SRichard Henderson TCGRegSet i_allocated_regs; 372582790a87SRichard Henderson TCGRegSet o_allocated_regs; 3726b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 3727b6638662SRichard Henderson TCGReg reg; 3728c896fe29Sbellard TCGArg arg; 3729c896fe29Sbellard const TCGArgConstraint *arg_ct; 3730c896fe29Sbellard TCGTemp *ts; 3731c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 3732c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 3733c896fe29Sbellard 3734c896fe29Sbellard nb_oargs = def->nb_oargs; 3735c896fe29Sbellard nb_iargs = def->nb_iargs; 3736c896fe29Sbellard 3737c896fe29Sbellard /* copy constants */ 3738c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 3739dd186292SRichard Henderson op->args + nb_oargs + nb_iargs, 3740c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 3741c896fe29Sbellard 3742d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 3743d21369f5SRichard Henderson o_allocated_regs = s->reserved_regs; 
374482790a87SRichard Henderson 3745c896fe29Sbellard /* satisfy input constraints */ 3746c896fe29Sbellard for (k = 0; k < nb_iargs; k++) { 374729f5e925SRichard Henderson TCGRegSet i_preferred_regs, i_required_regs; 374829f5e925SRichard Henderson bool allocate_new_reg, copyto_new_reg; 374929f5e925SRichard Henderson TCGTemp *ts2; 375029f5e925SRichard Henderson int i1, i2; 3751d62816f2SRichard Henderson 375266792f90SRichard Henderson i = def->args_ct[nb_oargs + k].sort_index; 3753dd186292SRichard Henderson arg = op->args[i]; 3754c896fe29Sbellard arg_ct = &def->args_ct[i]; 375543439139SRichard Henderson ts = arg_temp(arg); 375640ae5c62SRichard Henderson 375740ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 3758a4fbbd77SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct->ct)) { 3759c896fe29Sbellard /* constant is OK for instruction */ 3760c896fe29Sbellard const_args[i] = 1; 3761c896fe29Sbellard new_args[i] = ts->val; 3762d62816f2SRichard Henderson continue; 3763c896fe29Sbellard } 376440ae5c62SRichard Henderson 37651c1824dcSRichard Henderson reg = ts->reg; 37661c1824dcSRichard Henderson i_preferred_regs = 0; 376729f5e925SRichard Henderson i_required_regs = arg_ct->regs; 37681c1824dcSRichard Henderson allocate_new_reg = false; 376929f5e925SRichard Henderson copyto_new_reg = false; 37701c1824dcSRichard Henderson 377129f5e925SRichard Henderson switch (arg_ct->pair) { 377229f5e925SRichard Henderson case 0: /* not paired */ 3773bc2b17e6SRichard Henderson if (arg_ct->ialias) { 37741c1824dcSRichard Henderson i_preferred_regs = op->output_pref[arg_ct->alias_index]; 3775c0522136SRichard Henderson 3776c0522136SRichard Henderson /* 3777c0522136SRichard Henderson * If the input is readonly, then it cannot also be an 3778c0522136SRichard Henderson * output and aliased to itself. If the input is not 3779c0522136SRichard Henderson * dead after the instruction, we must allocate a new 3780c0522136SRichard Henderson * register and move it. 
3781c0522136SRichard Henderson */ 3782c0522136SRichard Henderson if (temp_readonly(ts) || !IS_DEAD_ARG(i)) { 37831c1824dcSRichard Henderson allocate_new_reg = true; 37841c1824dcSRichard Henderson } else if (ts->val_type == TEMP_VAL_REG) { 3785c0522136SRichard Henderson /* 37861c1824dcSRichard Henderson * Check if the current register has already been 37871c1824dcSRichard Henderson * allocated for another input. 3788c0522136SRichard Henderson */ 378929f5e925SRichard Henderson allocate_new_reg = 379029f5e925SRichard Henderson tcg_regset_test_reg(i_allocated_regs, reg); 37917e1df267SAurelien Jarno } 37927e1df267SAurelien Jarno } 37931c1824dcSRichard Henderson if (!allocate_new_reg) { 379429f5e925SRichard Henderson temp_load(s, ts, i_required_regs, i_allocated_regs, 379529f5e925SRichard Henderson i_preferred_regs); 3796c896fe29Sbellard reg = ts->reg; 379729f5e925SRichard Henderson allocate_new_reg = !tcg_regset_test_reg(i_required_regs, reg); 37981c1824dcSRichard Henderson } 37991c1824dcSRichard Henderson if (allocate_new_reg) { 3800c0522136SRichard Henderson /* 3801c0522136SRichard Henderson * Allocate a new register matching the constraint 3802c0522136SRichard Henderson * and move the temporary register into it. 3803c0522136SRichard Henderson */ 3804d62816f2SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 3805d62816f2SRichard Henderson i_allocated_regs, 0); 380629f5e925SRichard Henderson reg = tcg_reg_alloc(s, i_required_regs, i_allocated_regs, 38071c1824dcSRichard Henderson i_preferred_regs, ts->indirect_base); 380829f5e925SRichard Henderson copyto_new_reg = true; 380929f5e925SRichard Henderson } 381029f5e925SRichard Henderson break; 381129f5e925SRichard Henderson 381229f5e925SRichard Henderson case 1: 381329f5e925SRichard Henderson /* First of an input pair; if i1 == i2, the second is an output. */ 381429f5e925SRichard Henderson i1 = i; 381529f5e925SRichard Henderson i2 = arg_ct->pair_index; 381629f5e925SRichard Henderson ts2 = i1 != i2 ? 
arg_temp(op->args[i2]) : NULL; 381729f5e925SRichard Henderson 381829f5e925SRichard Henderson /* 381929f5e925SRichard Henderson * It is easier to default to allocating a new pair 382029f5e925SRichard Henderson * and to identify a few cases where it's not required. 382129f5e925SRichard Henderson */ 382229f5e925SRichard Henderson if (arg_ct->ialias) { 382329f5e925SRichard Henderson i_preferred_regs = op->output_pref[arg_ct->alias_index]; 382429f5e925SRichard Henderson if (IS_DEAD_ARG(i1) && 382529f5e925SRichard Henderson IS_DEAD_ARG(i2) && 382629f5e925SRichard Henderson !temp_readonly(ts) && 382729f5e925SRichard Henderson ts->val_type == TEMP_VAL_REG && 382829f5e925SRichard Henderson ts->reg < TCG_TARGET_NB_REGS - 1 && 382929f5e925SRichard Henderson tcg_regset_test_reg(i_required_regs, reg) && 383029f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg) && 383129f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg + 1) && 383229f5e925SRichard Henderson (ts2 383329f5e925SRichard Henderson ? ts2->val_type == TEMP_VAL_REG && 383429f5e925SRichard Henderson ts2->reg == reg + 1 && 383529f5e925SRichard Henderson !temp_readonly(ts2) 383629f5e925SRichard Henderson : s->reg_to_temp[reg + 1] == NULL)) { 383729f5e925SRichard Henderson break; 383829f5e925SRichard Henderson } 383929f5e925SRichard Henderson } else { 384029f5e925SRichard Henderson /* Without aliasing, the pair must also be an input. 
*/ 384129f5e925SRichard Henderson tcg_debug_assert(ts2); 384229f5e925SRichard Henderson if (ts->val_type == TEMP_VAL_REG && 384329f5e925SRichard Henderson ts2->val_type == TEMP_VAL_REG && 384429f5e925SRichard Henderson ts2->reg == reg + 1 && 384529f5e925SRichard Henderson tcg_regset_test_reg(i_required_regs, reg)) { 384629f5e925SRichard Henderson break; 384729f5e925SRichard Henderson } 384829f5e925SRichard Henderson } 384929f5e925SRichard Henderson reg = tcg_reg_alloc_pair(s, i_required_regs, i_allocated_regs, 385029f5e925SRichard Henderson 0, ts->indirect_base); 385129f5e925SRichard Henderson goto do_pair; 385229f5e925SRichard Henderson 385329f5e925SRichard Henderson case 2: /* pair second */ 385429f5e925SRichard Henderson reg = new_args[arg_ct->pair_index] + 1; 385529f5e925SRichard Henderson goto do_pair; 385629f5e925SRichard Henderson 385729f5e925SRichard Henderson case 3: /* ialias with second output, no first input */ 385829f5e925SRichard Henderson tcg_debug_assert(arg_ct->ialias); 385929f5e925SRichard Henderson i_preferred_regs = op->output_pref[arg_ct->alias_index]; 386029f5e925SRichard Henderson 386129f5e925SRichard Henderson if (IS_DEAD_ARG(i) && 386229f5e925SRichard Henderson !temp_readonly(ts) && 386329f5e925SRichard Henderson ts->val_type == TEMP_VAL_REG && 386429f5e925SRichard Henderson reg > 0 && 386529f5e925SRichard Henderson s->reg_to_temp[reg - 1] == NULL && 386629f5e925SRichard Henderson tcg_regset_test_reg(i_required_regs, reg) && 386729f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg) && 386829f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg - 1)) { 386929f5e925SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg - 1); 387029f5e925SRichard Henderson break; 387129f5e925SRichard Henderson } 387229f5e925SRichard Henderson reg = tcg_reg_alloc_pair(s, i_required_regs >> 1, 387329f5e925SRichard Henderson i_allocated_regs, 0, 387429f5e925SRichard Henderson ts->indirect_base); 387529f5e925SRichard Henderson 
tcg_regset_set_reg(i_allocated_regs, reg); 387629f5e925SRichard Henderson reg += 1; 387729f5e925SRichard Henderson goto do_pair; 387829f5e925SRichard Henderson 387929f5e925SRichard Henderson do_pair: 388029f5e925SRichard Henderson /* 388129f5e925SRichard Henderson * If an aliased input is not dead after the instruction, 388229f5e925SRichard Henderson * we must allocate a new register and move it. 388329f5e925SRichard Henderson */ 388429f5e925SRichard Henderson if (arg_ct->ialias && (!IS_DEAD_ARG(i) || temp_readonly(ts))) { 388529f5e925SRichard Henderson TCGRegSet t_allocated_regs = i_allocated_regs; 388629f5e925SRichard Henderson 388729f5e925SRichard Henderson /* 388829f5e925SRichard Henderson * Because of the alias, and the continued life, make sure 388929f5e925SRichard Henderson * that the temp is somewhere *other* than the reg pair, 389029f5e925SRichard Henderson * and we get a copy in reg. 389129f5e925SRichard Henderson */ 389229f5e925SRichard Henderson tcg_regset_set_reg(t_allocated_regs, reg); 389329f5e925SRichard Henderson tcg_regset_set_reg(t_allocated_regs, reg + 1); 389429f5e925SRichard Henderson if (ts->val_type == TEMP_VAL_REG && ts->reg == reg) { 389529f5e925SRichard Henderson /* If ts was already in reg, copy it somewhere else. 
*/ 389629f5e925SRichard Henderson TCGReg nr; 389729f5e925SRichard Henderson bool ok; 389829f5e925SRichard Henderson 389929f5e925SRichard Henderson tcg_debug_assert(ts->kind != TEMP_FIXED); 390029f5e925SRichard Henderson nr = tcg_reg_alloc(s, tcg_target_available_regs[ts->type], 390129f5e925SRichard Henderson t_allocated_regs, 0, ts->indirect_base); 390229f5e925SRichard Henderson ok = tcg_out_mov(s, ts->type, nr, reg); 390329f5e925SRichard Henderson tcg_debug_assert(ok); 390429f5e925SRichard Henderson 390529f5e925SRichard Henderson set_temp_val_reg(s, ts, nr); 390629f5e925SRichard Henderson } else { 390729f5e925SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 390829f5e925SRichard Henderson t_allocated_regs, 0); 390929f5e925SRichard Henderson copyto_new_reg = true; 391029f5e925SRichard Henderson } 391129f5e925SRichard Henderson } else { 391229f5e925SRichard Henderson /* Preferably allocate to reg, otherwise copy. */ 391329f5e925SRichard Henderson i_required_regs = (TCGRegSet)1 << reg; 391429f5e925SRichard Henderson temp_load(s, ts, i_required_regs, i_allocated_regs, 391529f5e925SRichard Henderson i_preferred_regs); 391629f5e925SRichard Henderson copyto_new_reg = ts->reg != reg; 391729f5e925SRichard Henderson } 391829f5e925SRichard Henderson break; 391929f5e925SRichard Henderson 392029f5e925SRichard Henderson default: 392129f5e925SRichard Henderson g_assert_not_reached(); 392229f5e925SRichard Henderson } 392329f5e925SRichard Henderson 392429f5e925SRichard Henderson if (copyto_new_reg) { 392578113e83SRichard Henderson if (!tcg_out_mov(s, ts->type, reg, ts->reg)) { 3926240c08d0SRichard Henderson /* 3927240c08d0SRichard Henderson * Cross register class move not supported. Sync the 3928240c08d0SRichard Henderson * temp back to its slot and load from there. 
3929240c08d0SRichard Henderson */ 3930240c08d0SRichard Henderson temp_sync(s, ts, i_allocated_regs, 0, 0); 3931240c08d0SRichard Henderson tcg_out_ld(s, ts->type, reg, 3932240c08d0SRichard Henderson ts->mem_base->reg, ts->mem_offset); 393378113e83SRichard Henderson } 3934c896fe29Sbellard } 3935c896fe29Sbellard new_args[i] = reg; 3936c896fe29Sbellard const_args[i] = 0; 393782790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 3938c896fe29Sbellard } 3939c896fe29Sbellard 3940c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3941866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 3942866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 394343439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3944c896fe29Sbellard } 3945c896fe29Sbellard } 3946c896fe29Sbellard 3947b4cb76e6SRichard Henderson if (def->flags & TCG_OPF_COND_BRANCH) { 3948b4cb76e6SRichard Henderson tcg_reg_alloc_cbranch(s, i_allocated_regs); 3949b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 395082790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 3951a52ad07eSAurelien Jarno } else { 3952c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 3953b03cce8eSbellard /* XXX: permit generic clobber register list ? */ 3954c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3955c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 395682790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 3957c896fe29Sbellard } 3958c896fe29Sbellard } 39593d5c5f87SAurelien Jarno } 39603d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 39613d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 39623d5c5f87SAurelien Jarno an exception. 
*/ 396382790a87SRichard Henderson sync_globals(s, i_allocated_regs); 3964c896fe29Sbellard } 3965c896fe29Sbellard 3966c896fe29Sbellard /* satisfy the output constraints */ 3967c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 396866792f90SRichard Henderson i = def->args_ct[k].sort_index; 3969dd186292SRichard Henderson arg = op->args[i]; 3970c896fe29Sbellard arg_ct = &def->args_ct[i]; 397143439139SRichard Henderson ts = arg_temp(arg); 3972d63e3b6eSRichard Henderson 3973d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3974e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 3975d63e3b6eSRichard Henderson 397629f5e925SRichard Henderson switch (arg_ct->pair) { 397729f5e925SRichard Henderson case 0: /* not paired */ 3978bc2b17e6SRichard Henderson if (arg_ct->oalias && !const_args[arg_ct->alias_index]) { 39795ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 3980bc2b17e6SRichard Henderson } else if (arg_ct->newreg) { 39819be0d080SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->regs, 398282790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 398369e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3984c896fe29Sbellard } else { 39859be0d080SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->regs, o_allocated_regs, 398669e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3987c896fe29Sbellard } 398829f5e925SRichard Henderson break; 398929f5e925SRichard Henderson 399029f5e925SRichard Henderson case 1: /* first of pair */ 399129f5e925SRichard Henderson tcg_debug_assert(!arg_ct->newreg); 399229f5e925SRichard Henderson if (arg_ct->oalias) { 399329f5e925SRichard Henderson reg = new_args[arg_ct->alias_index]; 399429f5e925SRichard Henderson break; 399529f5e925SRichard Henderson } 399629f5e925SRichard Henderson reg = tcg_reg_alloc_pair(s, arg_ct->regs, o_allocated_regs, 399729f5e925SRichard Henderson op->output_pref[k], ts->indirect_base); 399829f5e925SRichard Henderson break; 399929f5e925SRichard Henderson 
400029f5e925SRichard Henderson case 2: /* second of pair */ 400129f5e925SRichard Henderson tcg_debug_assert(!arg_ct->newreg); 400229f5e925SRichard Henderson if (arg_ct->oalias) { 400329f5e925SRichard Henderson reg = new_args[arg_ct->alias_index]; 400429f5e925SRichard Henderson } else { 400529f5e925SRichard Henderson reg = new_args[arg_ct->pair_index] + 1; 400629f5e925SRichard Henderson } 400729f5e925SRichard Henderson break; 400829f5e925SRichard Henderson 400929f5e925SRichard Henderson case 3: /* first of pair, aliasing with a second input */ 401029f5e925SRichard Henderson tcg_debug_assert(!arg_ct->newreg); 401129f5e925SRichard Henderson reg = new_args[arg_ct->pair_index] - 1; 401229f5e925SRichard Henderson break; 401329f5e925SRichard Henderson 401429f5e925SRichard Henderson default: 401529f5e925SRichard Henderson g_assert_not_reached(); 401629f5e925SRichard Henderson } 401782790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 4018098859f1SRichard Henderson set_temp_val_reg(s, ts, reg); 4019c896fe29Sbellard ts->mem_coherent = 0; 4020c896fe29Sbellard new_args[i] = reg; 4021c896fe29Sbellard } 4022e8996ee0Sbellard } 4023c896fe29Sbellard 4024c896fe29Sbellard /* emit instruction */ 4025d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 4026d2fd745fSRichard Henderson tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op), 4027d2fd745fSRichard Henderson new_args, const_args); 4028d2fd745fSRichard Henderson } else { 4029dd186292SRichard Henderson tcg_out_op(s, op->opc, new_args, const_args); 4030d2fd745fSRichard Henderson } 4031c896fe29Sbellard 4032c896fe29Sbellard /* move the outputs in the correct register if needed */ 4033c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 403443439139SRichard Henderson ts = arg_temp(op->args[i]); 4035d63e3b6eSRichard Henderson 4036d63e3b6eSRichard Henderson /* ENV should not be modified. 
*/ 4037e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 4038d63e3b6eSRichard Henderson 4039ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 404098b4e186SRichard Henderson temp_sync(s, ts, o_allocated_regs, 0, IS_DEAD_ARG(i)); 404159d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 4042f8bf00f1SRichard Henderson temp_dead(s, ts); 4043ec7a869dSAurelien Jarno } 4044c896fe29Sbellard } 4045c896fe29Sbellard } 4046c896fe29Sbellard 4047efe86b21SRichard Henderson static bool tcg_reg_alloc_dup2(TCGContext *s, const TCGOp *op) 4048efe86b21SRichard Henderson { 4049efe86b21SRichard Henderson const TCGLifeData arg_life = op->life; 4050efe86b21SRichard Henderson TCGTemp *ots, *itsl, *itsh; 4051efe86b21SRichard Henderson TCGType vtype = TCGOP_VECL(op) + TCG_TYPE_V64; 4052efe86b21SRichard Henderson 4053efe86b21SRichard Henderson /* This opcode is only valid for 32-bit hosts, for 64-bit elements. */ 4054efe86b21SRichard Henderson tcg_debug_assert(TCG_TARGET_REG_BITS == 32); 4055efe86b21SRichard Henderson tcg_debug_assert(TCGOP_VECE(op) == MO_64); 4056efe86b21SRichard Henderson 4057efe86b21SRichard Henderson ots = arg_temp(op->args[0]); 4058efe86b21SRichard Henderson itsl = arg_temp(op->args[1]); 4059efe86b21SRichard Henderson itsh = arg_temp(op->args[2]); 4060efe86b21SRichard Henderson 4061efe86b21SRichard Henderson /* ENV should not be modified. */ 4062efe86b21SRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 4063efe86b21SRichard Henderson 4064efe86b21SRichard Henderson /* Allocate the output register now. */ 4065efe86b21SRichard Henderson if (ots->val_type != TEMP_VAL_REG) { 4066efe86b21SRichard Henderson TCGRegSet allocated_regs = s->reserved_regs; 4067efe86b21SRichard Henderson TCGRegSet dup_out_regs = 4068efe86b21SRichard Henderson tcg_op_defs[INDEX_op_dup_vec].args_ct[0].regs; 4069098859f1SRichard Henderson TCGReg oreg; 4070efe86b21SRichard Henderson 4071efe86b21SRichard Henderson /* Make sure to not spill the input registers. 
*/ 4072efe86b21SRichard Henderson if (!IS_DEAD_ARG(1) && itsl->val_type == TEMP_VAL_REG) { 4073efe86b21SRichard Henderson tcg_regset_set_reg(allocated_regs, itsl->reg); 4074efe86b21SRichard Henderson } 4075efe86b21SRichard Henderson if (!IS_DEAD_ARG(2) && itsh->val_type == TEMP_VAL_REG) { 4076efe86b21SRichard Henderson tcg_regset_set_reg(allocated_regs, itsh->reg); 4077efe86b21SRichard Henderson } 4078efe86b21SRichard Henderson 4079098859f1SRichard Henderson oreg = tcg_reg_alloc(s, dup_out_regs, allocated_regs, 4080efe86b21SRichard Henderson op->output_pref[0], ots->indirect_base); 4081098859f1SRichard Henderson set_temp_val_reg(s, ots, oreg); 4082efe86b21SRichard Henderson } 4083efe86b21SRichard Henderson 4084efe86b21SRichard Henderson /* Promote dup2 of immediates to dupi_vec. */ 4085efe86b21SRichard Henderson if (itsl->val_type == TEMP_VAL_CONST && itsh->val_type == TEMP_VAL_CONST) { 4086efe86b21SRichard Henderson uint64_t val = deposit64(itsl->val, 32, 32, itsh->val); 4087efe86b21SRichard Henderson MemOp vece = MO_64; 4088efe86b21SRichard Henderson 4089efe86b21SRichard Henderson if (val == dup_const(MO_8, val)) { 4090efe86b21SRichard Henderson vece = MO_8; 4091efe86b21SRichard Henderson } else if (val == dup_const(MO_16, val)) { 4092efe86b21SRichard Henderson vece = MO_16; 4093efe86b21SRichard Henderson } else if (val == dup_const(MO_32, val)) { 4094efe86b21SRichard Henderson vece = MO_32; 4095efe86b21SRichard Henderson } 4096efe86b21SRichard Henderson 4097efe86b21SRichard Henderson tcg_out_dupi_vec(s, vtype, vece, ots->reg, val); 4098efe86b21SRichard Henderson goto done; 4099efe86b21SRichard Henderson } 4100efe86b21SRichard Henderson 4101efe86b21SRichard Henderson /* If the two inputs form one 64-bit value, try dupm_vec. */ 4102aef85402SRichard Henderson if (itsl->temp_subindex == HOST_BIG_ENDIAN && 4103aef85402SRichard Henderson itsh->temp_subindex == !HOST_BIG_ENDIAN && 4104aef85402SRichard Henderson itsl == itsh + (HOST_BIG_ENDIAN ? 
1 : -1)) { 4105aef85402SRichard Henderson TCGTemp *its = itsl - HOST_BIG_ENDIAN; 4106aef85402SRichard Henderson 4107aef85402SRichard Henderson temp_sync(s, its + 0, s->reserved_regs, 0, 0); 4108aef85402SRichard Henderson temp_sync(s, its + 1, s->reserved_regs, 0, 0); 4109aef85402SRichard Henderson 4110efe86b21SRichard Henderson if (tcg_out_dupm_vec(s, vtype, MO_64, ots->reg, 4111efe86b21SRichard Henderson its->mem_base->reg, its->mem_offset)) { 4112efe86b21SRichard Henderson goto done; 4113efe86b21SRichard Henderson } 4114efe86b21SRichard Henderson } 4115efe86b21SRichard Henderson 4116efe86b21SRichard Henderson /* Fall back to generic expansion. */ 4117efe86b21SRichard Henderson return false; 4118efe86b21SRichard Henderson 4119efe86b21SRichard Henderson done: 412036f5539cSRichard Henderson ots->mem_coherent = 0; 4121efe86b21SRichard Henderson if (IS_DEAD_ARG(1)) { 4122efe86b21SRichard Henderson temp_dead(s, itsl); 4123efe86b21SRichard Henderson } 4124efe86b21SRichard Henderson if (IS_DEAD_ARG(2)) { 4125efe86b21SRichard Henderson temp_dead(s, itsh); 4126efe86b21SRichard Henderson } 4127efe86b21SRichard Henderson if (NEED_SYNC_ARG(0)) { 4128efe86b21SRichard Henderson temp_sync(s, ots, s->reserved_regs, 0, IS_DEAD_ARG(0)); 4129efe86b21SRichard Henderson } else if (IS_DEAD_ARG(0)) { 4130efe86b21SRichard Henderson temp_dead(s, ots); 4131efe86b21SRichard Henderson } 4132efe86b21SRichard Henderson return true; 4133efe86b21SRichard Henderson } 4134efe86b21SRichard Henderson 4135dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op) 4136c896fe29Sbellard { 4137cd9090aaSRichard Henderson const int nb_oargs = TCGOP_CALLO(op); 4138cd9090aaSRichard Henderson const int nb_iargs = TCGOP_CALLI(op); 4139dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 41407b7d8b2dSRichard Henderson const TCGHelperInfo *info; 4141b6638662SRichard Henderson int flags, nb_regs, i; 4142b6638662SRichard Henderson TCGReg reg; 4143cf066674SRichard Henderson 
TCGArg arg; 4144c896fe29Sbellard TCGTemp *ts; 4145d3452f1fSRichard Henderson intptr_t stack_offset; 4146d3452f1fSRichard Henderson size_t call_stack_size; 4147cf066674SRichard Henderson tcg_insn_unit *func_addr; 4148cf066674SRichard Henderson int allocate_args; 4149c896fe29Sbellard TCGRegSet allocated_regs; 4150c896fe29Sbellard 4151fa52e660SRichard Henderson func_addr = tcg_call_func(op); 41527b7d8b2dSRichard Henderson info = tcg_call_info(op); 41537b7d8b2dSRichard Henderson flags = info->flags; 4154c896fe29Sbellard 41556e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 4156c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 4157c45cb8bbSRichard Henderson nb_regs = nb_iargs; 4158cf066674SRichard Henderson } 4159c896fe29Sbellard 4160c896fe29Sbellard /* assign stack slots first */ 4161c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 4162c896fe29Sbellard call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) & 4163c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 4164b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 4165b03cce8eSbellard if (allocate_args) { 4166345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 4167345649c0SBlue Swirl preallocate call stack */ 4168345649c0SBlue Swirl tcg_abort(); 4169b03cce8eSbellard } 417039cf05d3Sbellard 417139cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 4172c45cb8bbSRichard Henderson for (i = nb_regs; i < nb_iargs; i++) { 4173dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 417439cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 417543439139SRichard Henderson ts = arg_temp(arg); 417640ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 4177b722452aSRichard Henderson s->reserved_regs, 0); 4178e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 417939cf05d3Sbellard } 418039cf05d3Sbellard stack_offset += 
sizeof(tcg_target_long); 4181c896fe29Sbellard } 4182c896fe29Sbellard 4183c896fe29Sbellard /* assign input registers */ 4184d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 4185c896fe29Sbellard for (i = 0; i < nb_regs; i++) { 4186dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 418739cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 418843439139SRichard Henderson ts = arg_temp(arg); 4189c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 419040ae5c62SRichard Henderson 4191c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 4192c896fe29Sbellard if (ts->reg != reg) { 41934250da10SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 419478113e83SRichard Henderson if (!tcg_out_mov(s, ts->type, reg, ts->reg)) { 4195240c08d0SRichard Henderson /* 4196240c08d0SRichard Henderson * Cross register class move not supported. Sync the 4197240c08d0SRichard Henderson * temp back to its slot and load from there. 4198240c08d0SRichard Henderson */ 4199240c08d0SRichard Henderson temp_sync(s, ts, allocated_regs, 0, 0); 4200240c08d0SRichard Henderson tcg_out_ld(s, ts->type, reg, 4201240c08d0SRichard Henderson ts->mem_base->reg, ts->mem_offset); 420278113e83SRichard Henderson } 4203c896fe29Sbellard } 4204c896fe29Sbellard } else { 4205ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 420640ae5c62SRichard Henderson 42074250da10SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 420840ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 4209b722452aSRichard Henderson temp_load(s, ts, arg_set, allocated_regs, 0); 4210c896fe29Sbellard } 421140ae5c62SRichard Henderson 4212c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 4213c896fe29Sbellard } 421439cf05d3Sbellard } 4215c896fe29Sbellard 4216c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 4217866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 4218866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 421943439139SRichard Henderson temp_dead(s, 
arg_temp(op->args[i])); 4220c896fe29Sbellard } 4221c896fe29Sbellard } 4222c896fe29Sbellard 4223c896fe29Sbellard /* clobber call registers */ 4224c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 4225c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 4226b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 4227c896fe29Sbellard } 4228c896fe29Sbellard } 4229c896fe29Sbellard 423078505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 423178505279SAurelien Jarno they might be read. */ 423278505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 423378505279SAurelien Jarno /* Nothing to do */ 423478505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 423578505279SAurelien Jarno sync_globals(s, allocated_regs); 423678505279SAurelien Jarno } else { 4237e8996ee0Sbellard save_globals(s, allocated_regs); 4238b9c18f56Saurel32 } 4239c896fe29Sbellard 42407b7d8b2dSRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 42417b7d8b2dSRichard Henderson { 42427b7d8b2dSRichard Henderson gpointer hash = (gpointer)(uintptr_t)info->typemask; 42437b7d8b2dSRichard Henderson ffi_cif *cif = g_hash_table_lookup(ffi_table, hash); 42447b7d8b2dSRichard Henderson assert(cif != NULL); 42457b7d8b2dSRichard Henderson tcg_out_call(s, func_addr, cif); 42467b7d8b2dSRichard Henderson } 42477b7d8b2dSRichard Henderson #else 4248cf066674SRichard Henderson tcg_out_call(s, func_addr); 42497b7d8b2dSRichard Henderson #endif 4250c896fe29Sbellard 4251c896fe29Sbellard /* assign output registers and emit moves if needed */ 4252c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 4253dd186292SRichard Henderson arg = op->args[i]; 425443439139SRichard Henderson ts = arg_temp(arg); 4255d63e3b6eSRichard Henderson 4256d63e3b6eSRichard Henderson /* ENV should not be modified. 
*/ 4257e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 4258d63e3b6eSRichard Henderson 4259c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 4260098859f1SRichard Henderson set_temp_val_reg(s, ts, reg); 4261c896fe29Sbellard ts->mem_coherent = 0; 4262ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 426398b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, IS_DEAD_ARG(i)); 426459d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 4265f8bf00f1SRichard Henderson temp_dead(s, ts); 4266c896fe29Sbellard } 4267c896fe29Sbellard } 42688c11ad25SAurelien Jarno } 4269c896fe29Sbellard 4270c896fe29Sbellard #ifdef CONFIG_PROFILER 4271c896fe29Sbellard 4272c3fac113SEmilio G. Cota /* avoid copy/paste errors */ 4273c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field) \ 4274c3fac113SEmilio G. Cota do { \ 4275d73415a3SStefan Hajnoczi (to)->field += qatomic_read(&((from)->field)); \ 4276c3fac113SEmilio G. Cota } while (0) 4277c896fe29Sbellard 4278c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field) \ 4279c3fac113SEmilio G. Cota do { \ 4280d73415a3SStefan Hajnoczi typeof((from)->field) val__ = qatomic_read(&((from)->field)); \ 4281c3fac113SEmilio G. Cota if (val__ > (to)->field) { \ 4282c3fac113SEmilio G. Cota (to)->field = val__; \ 4283c3fac113SEmilio G. Cota } \ 4284c3fac113SEmilio G. Cota } while (0) 4285c3fac113SEmilio G. Cota 4286c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */ 4287c3fac113SEmilio G. Cota static inline 4288c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table) 4289c896fe29Sbellard { 42900e2d61cfSRichard Henderson unsigned int n_ctxs = qatomic_read(&tcg_cur_ctxs); 4291c3fac113SEmilio G. Cota unsigned int i; 4292c3fac113SEmilio G. Cota 42933468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 4294d73415a3SStefan Hajnoczi TCGContext *s = qatomic_read(&tcg_ctxs[i]); 42953468b59eSEmilio G. Cota const TCGProfile *orig = &s->prof; 4296c3fac113SEmilio G. Cota 4297c3fac113SEmilio G. 
Cota if (counters) { 429872fd2efbSEmilio G. Cota PROF_ADD(prof, orig, cpu_exec_time); 4299c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count1); 4300c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count); 4301c3fac113SEmilio G. Cota PROF_ADD(prof, orig, op_count); 4302c3fac113SEmilio G. Cota PROF_MAX(prof, orig, op_count_max); 4303c3fac113SEmilio G. Cota PROF_ADD(prof, orig, temp_count); 4304c3fac113SEmilio G. Cota PROF_MAX(prof, orig, temp_count_max); 4305c3fac113SEmilio G. Cota PROF_ADD(prof, orig, del_op_count); 4306c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_in_len); 4307c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_out_len); 4308c3fac113SEmilio G. Cota PROF_ADD(prof, orig, search_out_len); 4309c3fac113SEmilio G. Cota PROF_ADD(prof, orig, interm_time); 4310c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_time); 4311c3fac113SEmilio G. Cota PROF_ADD(prof, orig, la_time); 4312c3fac113SEmilio G. Cota PROF_ADD(prof, orig, opt_time); 4313c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_count); 4314c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_time); 4315c3fac113SEmilio G. Cota } 4316c3fac113SEmilio G. Cota if (table) { 4317c896fe29Sbellard int i; 4318d70724ceSzhanghailiang 431915fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 4320c3fac113SEmilio G. Cota PROF_ADD(prof, orig, table_op_count[i]); 4321c3fac113SEmilio G. Cota } 4322c3fac113SEmilio G. Cota } 4323c3fac113SEmilio G. Cota } 4324c3fac113SEmilio G. Cota } 4325c3fac113SEmilio G. Cota 4326c3fac113SEmilio G. Cota #undef PROF_ADD 4327c3fac113SEmilio G. Cota #undef PROF_MAX 4328c3fac113SEmilio G. Cota 4329c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof) 4330c3fac113SEmilio G. Cota { 4331c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, true, false); 4332c3fac113SEmilio G. Cota } 4333c3fac113SEmilio G. Cota 4334c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof) 4335c3fac113SEmilio G. Cota { 4336c3fac113SEmilio G. 
Cota tcg_profile_snapshot(prof, false, true); 4337c3fac113SEmilio G. Cota } 4338c3fac113SEmilio G. Cota 4339b6a7f3e0SDaniel P. Berrangé void tcg_dump_op_count(GString *buf) 4340c3fac113SEmilio G. Cota { 4341c3fac113SEmilio G. Cota TCGProfile prof = {}; 4342c3fac113SEmilio G. Cota int i; 4343c3fac113SEmilio G. Cota 4344c3fac113SEmilio G. Cota tcg_profile_snapshot_table(&prof); 4345c3fac113SEmilio G. Cota for (i = 0; i < NB_OPS; i++) { 4346b6a7f3e0SDaniel P. Berrangé g_string_append_printf(buf, "%s %" PRId64 "\n", tcg_op_defs[i].name, 4347c3fac113SEmilio G. Cota prof.table_op_count[i]); 4348c896fe29Sbellard } 4349c896fe29Sbellard } 435072fd2efbSEmilio G. Cota 435172fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 435272fd2efbSEmilio G. Cota { 43530e2d61cfSRichard Henderson unsigned int n_ctxs = qatomic_read(&tcg_cur_ctxs); 435472fd2efbSEmilio G. Cota unsigned int i; 435572fd2efbSEmilio G. Cota int64_t ret = 0; 435672fd2efbSEmilio G. Cota 435772fd2efbSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 4358d73415a3SStefan Hajnoczi const TCGContext *s = qatomic_read(&tcg_ctxs[i]); 435972fd2efbSEmilio G. Cota const TCGProfile *prof = &s->prof; 436072fd2efbSEmilio G. Cota 4361d73415a3SStefan Hajnoczi ret += qatomic_read(&prof->cpu_exec_time); 436272fd2efbSEmilio G. Cota } 436372fd2efbSEmilio G. Cota return ret; 436472fd2efbSEmilio G. Cota } 4365246ae24dSMax Filippov #else 4366b6a7f3e0SDaniel P. Berrangé void tcg_dump_op_count(GString *buf) 4367246ae24dSMax Filippov { 4368b6a7f3e0SDaniel P. Berrangé g_string_append_printf(buf, "[TCG profiler not compiled]\n"); 4369246ae24dSMax Filippov } 437072fd2efbSEmilio G. Cota 437172fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 437272fd2efbSEmilio G. Cota { 437372fd2efbSEmilio G. Cota error_report("%s: TCG profiler not compiled", __func__); 437472fd2efbSEmilio G. Cota exit(EXIT_FAILURE); 437572fd2efbSEmilio G. 
Cota } 4376c896fe29Sbellard #endif 4377c896fe29Sbellard 4378c896fe29Sbellard 4379fbf59aadSRichard Henderson int tcg_gen_code(TCGContext *s, TranslationBlock *tb, target_ulong pc_start) 4380c896fe29Sbellard { 4381c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER 4382c3fac113SEmilio G. Cota TCGProfile *prof = &s->prof; 4383c3fac113SEmilio G. Cota #endif 438415fa08f8SRichard Henderson int i, num_insns; 438515fa08f8SRichard Henderson TCGOp *op; 4386c896fe29Sbellard 438704fe6400SRichard Henderson #ifdef CONFIG_PROFILER 438804fe6400SRichard Henderson { 4389c1f543b7SEmilio G. Cota int n = 0; 439004fe6400SRichard Henderson 439115fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 439215fa08f8SRichard Henderson n++; 439315fa08f8SRichard Henderson } 4394d73415a3SStefan Hajnoczi qatomic_set(&prof->op_count, prof->op_count + n); 4395c3fac113SEmilio G. Cota if (n > prof->op_count_max) { 4396d73415a3SStefan Hajnoczi qatomic_set(&prof->op_count_max, n); 439704fe6400SRichard Henderson } 439804fe6400SRichard Henderson 439904fe6400SRichard Henderson n = s->nb_temps; 4400d73415a3SStefan Hajnoczi qatomic_set(&prof->temp_count, prof->temp_count + n); 4401c3fac113SEmilio G. 
Cota if (n > prof->temp_count_max) { 4402d73415a3SStefan Hajnoczi qatomic_set(&prof->temp_count_max, n); 440304fe6400SRichard Henderson } 440404fe6400SRichard Henderson } 440504fe6400SRichard Henderson #endif 440604fe6400SRichard Henderson 4407c896fe29Sbellard #ifdef DEBUG_DISAS 4408d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 4409fbf59aadSRichard Henderson && qemu_log_in_addr_range(pc_start))) { 4410c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 441178b54858SRichard Henderson if (logfile) { 441278b54858SRichard Henderson fprintf(logfile, "OP:\n"); 4413b7a83ff8SRichard Henderson tcg_dump_ops(s, logfile, false); 441478b54858SRichard Henderson fprintf(logfile, "\n"); 4415fc59d2d8SRobert Foley qemu_log_unlock(logfile); 4416c896fe29Sbellard } 441778b54858SRichard Henderson } 4418c896fe29Sbellard #endif 4419c896fe29Sbellard 4420bef16ab4SRichard Henderson #ifdef CONFIG_DEBUG_TCG 4421bef16ab4SRichard Henderson /* Ensure all labels referenced have been emitted. 
*/ 4422bef16ab4SRichard Henderson { 4423bef16ab4SRichard Henderson TCGLabel *l; 4424bef16ab4SRichard Henderson bool error = false; 4425bef16ab4SRichard Henderson 4426bef16ab4SRichard Henderson QSIMPLEQ_FOREACH(l, &s->labels, next) { 4427bef16ab4SRichard Henderson if (unlikely(!l->present) && l->refs) { 4428bef16ab4SRichard Henderson qemu_log_mask(CPU_LOG_TB_OP, 4429bef16ab4SRichard Henderson "$L%d referenced but not present.\n", l->id); 4430bef16ab4SRichard Henderson error = true; 4431bef16ab4SRichard Henderson } 4432bef16ab4SRichard Henderson } 4433bef16ab4SRichard Henderson assert(!error); 4434bef16ab4SRichard Henderson } 4435bef16ab4SRichard Henderson #endif 4436bef16ab4SRichard Henderson 4437c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 4438d73415a3SStefan Hajnoczi qatomic_set(&prof->opt_time, prof->opt_time - profile_getclock()); 4439c5cc28ffSAurelien Jarno #endif 4440c5cc28ffSAurelien Jarno 44418f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 4442c45cb8bbSRichard Henderson tcg_optimize(s); 44438f2e8c07SKirill Batuzov #endif 44448f2e8c07SKirill Batuzov 4445a23a9ec6Sbellard #ifdef CONFIG_PROFILER 4446d73415a3SStefan Hajnoczi qatomic_set(&prof->opt_time, prof->opt_time + profile_getclock()); 4447d73415a3SStefan Hajnoczi qatomic_set(&prof->la_time, prof->la_time - profile_getclock()); 4448a23a9ec6Sbellard #endif 4449c5cc28ffSAurelien Jarno 4450b4fc67c7SRichard Henderson reachable_code_pass(s); 4451b83eabeaSRichard Henderson liveness_pass_1(s); 44525a18407fSRichard Henderson 44535a18407fSRichard Henderson if (s->nb_indirects > 0) { 44545a18407fSRichard Henderson #ifdef DEBUG_DISAS 44555a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 4456fbf59aadSRichard Henderson && qemu_log_in_addr_range(pc_start))) { 4457c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 445878b54858SRichard Henderson if (logfile) { 445978b54858SRichard Henderson fprintf(logfile, "OP before indirect lowering:\n"); 4460b7a83ff8SRichard Henderson 
tcg_dump_ops(s, logfile, false); 446178b54858SRichard Henderson fprintf(logfile, "\n"); 4462fc59d2d8SRobert Foley qemu_log_unlock(logfile); 44635a18407fSRichard Henderson } 446478b54858SRichard Henderson } 44655a18407fSRichard Henderson #endif 44665a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 4467b83eabeaSRichard Henderson if (liveness_pass_2(s)) { 44685a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 4469b83eabeaSRichard Henderson liveness_pass_1(s); 44705a18407fSRichard Henderson } 44715a18407fSRichard Henderson } 4472c5cc28ffSAurelien Jarno 4473a23a9ec6Sbellard #ifdef CONFIG_PROFILER 4474d73415a3SStefan Hajnoczi qatomic_set(&prof->la_time, prof->la_time + profile_getclock()); 4475a23a9ec6Sbellard #endif 4476c896fe29Sbellard 4477c896fe29Sbellard #ifdef DEBUG_DISAS 4478d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 4479fbf59aadSRichard Henderson && qemu_log_in_addr_range(pc_start))) { 4480c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 448178b54858SRichard Henderson if (logfile) { 448278b54858SRichard Henderson fprintf(logfile, "OP after optimization and liveness analysis:\n"); 4483b7a83ff8SRichard Henderson tcg_dump_ops(s, logfile, true); 448478b54858SRichard Henderson fprintf(logfile, "\n"); 4485fc59d2d8SRobert Foley qemu_log_unlock(logfile); 4486c896fe29Sbellard } 448778b54858SRichard Henderson } 4488c896fe29Sbellard #endif 4489c896fe29Sbellard 449035abb009SRichard Henderson /* Initialize goto_tb jump offsets. 
*/ 449135abb009SRichard Henderson tb->jmp_reset_offset[0] = TB_JMP_RESET_OFFSET_INVALID; 449235abb009SRichard Henderson tb->jmp_reset_offset[1] = TB_JMP_RESET_OFFSET_INVALID; 449335abb009SRichard Henderson tcg_ctx->tb_jmp_reset_offset = tb->jmp_reset_offset; 449435abb009SRichard Henderson if (TCG_TARGET_HAS_direct_jump) { 449535abb009SRichard Henderson tcg_ctx->tb_jmp_insn_offset = tb->jmp_target_arg; 449635abb009SRichard Henderson tcg_ctx->tb_jmp_target_addr = NULL; 449735abb009SRichard Henderson } else { 449835abb009SRichard Henderson tcg_ctx->tb_jmp_insn_offset = NULL; 449935abb009SRichard Henderson tcg_ctx->tb_jmp_target_addr = tb->jmp_target_arg; 450035abb009SRichard Henderson } 450135abb009SRichard Henderson 4502c896fe29Sbellard tcg_reg_alloc_start(s); 4503c896fe29Sbellard 4504db0c51a3SRichard Henderson /* 4505db0c51a3SRichard Henderson * Reset the buffer pointers when restarting after overflow. 4506db0c51a3SRichard Henderson * TODO: Move this into translate-all.c with the rest of the 4507db0c51a3SRichard Henderson * buffer management. Having only this done here is confusing. 
4508db0c51a3SRichard Henderson */ 4509db0c51a3SRichard Henderson s->code_buf = tcg_splitwx_to_rw(tb->tc.ptr); 4510db0c51a3SRichard Henderson s->code_ptr = s->code_buf; 4511c896fe29Sbellard 4512659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 45136001f772SLaurent Vivier QSIMPLEQ_INIT(&s->ldst_labels); 4514659ef5cbSRichard Henderson #endif 451557a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 451657a26946SRichard Henderson s->pool_labels = NULL; 451757a26946SRichard Henderson #endif 45189ecefc84SRichard Henderson 4519fca8a500SRichard Henderson num_insns = -1; 452015fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 4521c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 4522b3db8758Sblueswir1 4523c896fe29Sbellard #ifdef CONFIG_PROFILER 4524d73415a3SStefan Hajnoczi qatomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1); 4525c896fe29Sbellard #endif 4526c45cb8bbSRichard Henderson 4527c896fe29Sbellard switch (opc) { 4528c896fe29Sbellard case INDEX_op_mov_i32: 4529c896fe29Sbellard case INDEX_op_mov_i64: 4530d2fd745fSRichard Henderson case INDEX_op_mov_vec: 4531dd186292SRichard Henderson tcg_reg_alloc_mov(s, op); 4532c896fe29Sbellard break; 4533bab1671fSRichard Henderson case INDEX_op_dup_vec: 4534bab1671fSRichard Henderson tcg_reg_alloc_dup(s, op); 4535bab1671fSRichard Henderson break; 4536765b842aSRichard Henderson case INDEX_op_insn_start: 4537fca8a500SRichard Henderson if (num_insns >= 0) { 45389f754620SRichard Henderson size_t off = tcg_current_code_size(s); 45399f754620SRichard Henderson s->gen_insn_end_off[num_insns] = off; 45409f754620SRichard Henderson /* Assert that we do not overflow our stored offset. 
*/ 45419f754620SRichard Henderson assert(s->gen_insn_end_off[num_insns] == off); 4542fca8a500SRichard Henderson } 4543fca8a500SRichard Henderson num_insns++; 4544bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 4545bad729e2SRichard Henderson target_ulong a; 4546bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 4547efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 4548bad729e2SRichard Henderson #else 4549efee3746SRichard Henderson a = op->args[i]; 4550bad729e2SRichard Henderson #endif 4551fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 4552bad729e2SRichard Henderson } 4553c896fe29Sbellard break; 45545ff9d6a4Sbellard case INDEX_op_discard: 455543439139SRichard Henderson temp_dead(s, arg_temp(op->args[0])); 45565ff9d6a4Sbellard break; 4557c896fe29Sbellard case INDEX_op_set_label: 4558e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 455992ab8e7dSRichard Henderson tcg_out_label(s, arg_label(op->args[0])); 4560c896fe29Sbellard break; 4561c896fe29Sbellard case INDEX_op_call: 4562dd186292SRichard Henderson tcg_reg_alloc_call(s, op); 4563c45cb8bbSRichard Henderson break; 4564efe86b21SRichard Henderson case INDEX_op_dup2_vec: 4565efe86b21SRichard Henderson if (tcg_reg_alloc_dup2(s, op)) { 4566efe86b21SRichard Henderson break; 4567efe86b21SRichard Henderson } 4568efe86b21SRichard Henderson /* fall through */ 4569c896fe29Sbellard default: 457025c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. 
*/ 4571be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 4572c896fe29Sbellard /* Note: in order to speed up the code, it would be much 4573c896fe29Sbellard faster to have specialized register allocator functions for 4574c896fe29Sbellard some common argument patterns */ 4575dd186292SRichard Henderson tcg_reg_alloc_op(s, op); 4576c896fe29Sbellard break; 4577c896fe29Sbellard } 4578b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. The assumption is that any 4579b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 4580b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 4581b125f9dcSRichard Henderson generating code without having to check during generation. */ 4582644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 4583b125f9dcSRichard Henderson return -1; 4584b125f9dcSRichard Henderson } 45856e6c4efeSRichard Henderson /* Test for TB overflow, as seen by gen_insn_end_off. 
*/ 45866e6c4efeSRichard Henderson if (unlikely(tcg_current_code_size(s) > UINT16_MAX)) { 45876e6c4efeSRichard Henderson return -2; 45886e6c4efeSRichard Henderson } 4589c896fe29Sbellard } 4590fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 4591fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 4592c45cb8bbSRichard Henderson 4593b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 4594659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 4595aeee05f5SRichard Henderson i = tcg_out_ldst_finalize(s); 4596aeee05f5SRichard Henderson if (i < 0) { 4597aeee05f5SRichard Henderson return i; 459823dceda6SRichard Henderson } 4599659ef5cbSRichard Henderson #endif 460057a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 46011768987bSRichard Henderson i = tcg_out_pool_finalize(s); 46021768987bSRichard Henderson if (i < 0) { 46031768987bSRichard Henderson return i; 460457a26946SRichard Henderson } 460557a26946SRichard Henderson #endif 46067ecd02a0SRichard Henderson if (!tcg_resolve_relocs(s)) { 46077ecd02a0SRichard Henderson return -2; 46087ecd02a0SRichard Henderson } 4609c896fe29Sbellard 4610df5d2b16SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 4611c896fe29Sbellard /* flush instruction cache */ 4612db0c51a3SRichard Henderson flush_idcache_range((uintptr_t)tcg_splitwx_to_rx(s->code_buf), 4613db0c51a3SRichard Henderson (uintptr_t)s->code_buf, 46141da8de39SRichard Henderson tcg_ptr_byte_diff(s->code_ptr, s->code_buf)); 4615df5d2b16SRichard Henderson #endif 46162aeabc08SStefan Weil 46171813e175SRichard Henderson return tcg_current_code_size(s); 4618c896fe29Sbellard } 4619c896fe29Sbellard 4620a23a9ec6Sbellard #ifdef CONFIG_PROFILER 46213a841ab5SDaniel P. Berrangé void tcg_dump_info(GString *buf) 4622a23a9ec6Sbellard { 4623c3fac113SEmilio G. Cota TCGProfile prof = {}; 4624c3fac113SEmilio G. Cota const TCGProfile *s; 4625c3fac113SEmilio G. Cota int64_t tb_count; 4626c3fac113SEmilio G. 
Cota int64_t tb_div_count; 4627c3fac113SEmilio G. Cota int64_t tot; 4628c3fac113SEmilio G. Cota 4629c3fac113SEmilio G. Cota tcg_profile_snapshot_counters(&prof); 4630c3fac113SEmilio G. Cota s = &prof; 4631c3fac113SEmilio G. Cota tb_count = s->tb_count; 4632c3fac113SEmilio G. Cota tb_div_count = tb_count ? tb_count : 1; 4633c3fac113SEmilio G. Cota tot = s->interm_time + s->code_time; 4634a23a9ec6Sbellard 46353a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "JIT cycles %" PRId64 46363a841ab5SDaniel P. Berrangé " (%0.3f s at 2.4 GHz)\n", 4637a23a9ec6Sbellard tot, tot / 2.4e9); 46383a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "translated TBs %" PRId64 46393a841ab5SDaniel P. Berrangé " (aborted=%" PRId64 " %0.1f%%)\n", 4640fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 4641fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 4642fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 46433a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg ops/TB %0.1f max=%d\n", 4644fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 46453a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "deleted ops/TB %0.2f\n", 4646fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 46473a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg temps/TB %0.2f max=%d\n", 46483a841ab5SDaniel P. Berrangé (double)s->temp_count / tb_div_count, 46493a841ab5SDaniel P. Berrangé s->temp_count_max); 46503a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg host code/TB %0.1f\n", 4651fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 46523a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg search data/TB %0.1f\n", 4653fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 4654a23a9ec6Sbellard 46553a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/op %0.1f\n", 4656a23a9ec6Sbellard s->op_count ? 
(double)tot / s->op_count : 0); 46573a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/in byte %0.1f\n", 4658a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 46593a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/out byte %0.1f\n", 4660a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 46613a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/search byte %0.1f\n", 46623a841ab5SDaniel P. Berrangé s->search_out_len ? 46633a841ab5SDaniel P. Berrangé (double)tot / s->search_out_len : 0); 4664fca8a500SRichard Henderson if (tot == 0) { 4665a23a9ec6Sbellard tot = 1; 4666fca8a500SRichard Henderson } 46673a841ab5SDaniel P. Berrangé g_string_append_printf(buf, " gen_interm time %0.1f%%\n", 4668a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 46693a841ab5SDaniel P. Berrangé g_string_append_printf(buf, " gen_code time %0.1f%%\n", 4670a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 46713a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "optim./code time %0.1f%%\n", 46723a841ab5SDaniel P. Berrangé (double)s->opt_time / (s->code_time ? 46733a841ab5SDaniel P. Berrangé s->code_time : 1) 4674c5cc28ffSAurelien Jarno * 100.0); 46753a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "liveness/code time %0.1f%%\n", 46763a841ab5SDaniel P. Berrangé (double)s->la_time / (s->code_time ? 46773a841ab5SDaniel P. Berrangé s->code_time : 1) * 100.0); 46783a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cpu_restore count %" PRId64 "\n", 4679a23a9ec6Sbellard s->restore_count); 46803a841ab5SDaniel P. Berrangé g_string_append_printf(buf, " avg cycles %0.1f\n", 46813a841ab5SDaniel P. Berrangé s->restore_count ? 46823a841ab5SDaniel P. Berrangé (double)s->restore_time / s->restore_count : 0); 4683a23a9ec6Sbellard } 4684a23a9ec6Sbellard #else 46853a841ab5SDaniel P. Berrangé void tcg_dump_info(GString *buf) 4686a23a9ec6Sbellard { 46873a841ab5SDaniel P. 
Berrangé g_string_append_printf(buf, "[TCG profiler not compiled]\n"); 4688a23a9ec6Sbellard } 4689a23a9ec6Sbellard #endif 4690813da627SRichard Henderson 4691813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 46925872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 46935872bbf2SRichard Henderson 46945872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 46955872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 46965872bbf2SRichard Henderson 46975872bbf2SRichard Henderson (2) Define tcg_register_jit. This should create a buffer containing 46985872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 46995872bbf2SRichard Henderson prologue unwind info for the tcg machine. 47005872bbf2SRichard Henderson 47015872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 47025872bbf2SRichard Henderson */ 4703813da627SRichard Henderson 4704813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. 
*/ 4705813da627SRichard Henderson typedef enum { 4706813da627SRichard Henderson JIT_NOACTION = 0, 4707813da627SRichard Henderson JIT_REGISTER_FN, 4708813da627SRichard Henderson JIT_UNREGISTER_FN 4709813da627SRichard Henderson } jit_actions_t; 4710813da627SRichard Henderson 4711813da627SRichard Henderson struct jit_code_entry { 4712813da627SRichard Henderson struct jit_code_entry *next_entry; 4713813da627SRichard Henderson struct jit_code_entry *prev_entry; 4714813da627SRichard Henderson const void *symfile_addr; 4715813da627SRichard Henderson uint64_t symfile_size; 4716813da627SRichard Henderson }; 4717813da627SRichard Henderson 4718813da627SRichard Henderson struct jit_descriptor { 4719813da627SRichard Henderson uint32_t version; 4720813da627SRichard Henderson uint32_t action_flag; 4721813da627SRichard Henderson struct jit_code_entry *relevant_entry; 4722813da627SRichard Henderson struct jit_code_entry *first_entry; 4723813da627SRichard Henderson }; 4724813da627SRichard Henderson 4725813da627SRichard Henderson void __jit_debug_register_code(void) __attribute__((noinline)); 4726813da627SRichard Henderson void __jit_debug_register_code(void) 4727813da627SRichard Henderson { 4728813da627SRichard Henderson asm(""); 4729813da627SRichard Henderson } 4730813da627SRichard Henderson 4731813da627SRichard Henderson /* Must statically initialize the version, because GDB may check 4732813da627SRichard Henderson the version before we can set it. */ 4733813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 }; 4734813da627SRichard Henderson 4735813da627SRichard Henderson /* End GDB interface. 
*/ 4736813da627SRichard Henderson 4737813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 4738813da627SRichard Henderson { 4739813da627SRichard Henderson const char *p = strtab + 1; 4740813da627SRichard Henderson 4741813da627SRichard Henderson while (1) { 4742813da627SRichard Henderson if (strcmp(p, str) == 0) { 4743813da627SRichard Henderson return p - strtab; 4744813da627SRichard Henderson } 4745813da627SRichard Henderson p += strlen(p) + 1; 4746813da627SRichard Henderson } 4747813da627SRichard Henderson } 4748813da627SRichard Henderson 4749755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf_ptr, size_t buf_size, 47502c90784aSRichard Henderson const void *debug_frame, 47512c90784aSRichard Henderson size_t debug_frame_size) 4752813da627SRichard Henderson { 47535872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 47545872bbf2SRichard Henderson uint32_t len; 47555872bbf2SRichard Henderson uint16_t version; 47565872bbf2SRichard Henderson uint32_t abbrev; 47575872bbf2SRichard Henderson uint8_t ptr_size; 47585872bbf2SRichard Henderson uint8_t cu_die; 47595872bbf2SRichard Henderson uint16_t cu_lang; 47605872bbf2SRichard Henderson uintptr_t cu_low_pc; 47615872bbf2SRichard Henderson uintptr_t cu_high_pc; 47625872bbf2SRichard Henderson uint8_t fn_die; 47635872bbf2SRichard Henderson char fn_name[16]; 47645872bbf2SRichard Henderson uintptr_t fn_low_pc; 47655872bbf2SRichard Henderson uintptr_t fn_high_pc; 47665872bbf2SRichard Henderson uint8_t cu_eoc; 47675872bbf2SRichard Henderson }; 4768813da627SRichard Henderson 4769813da627SRichard Henderson struct ElfImage { 4770813da627SRichard Henderson ElfW(Ehdr) ehdr; 4771813da627SRichard Henderson ElfW(Phdr) phdr; 47725872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 47735872bbf2SRichard Henderson ElfW(Sym) sym[2]; 47745872bbf2SRichard Henderson struct DebugInfo di; 47755872bbf2SRichard Henderson uint8_t da[24]; 47765872bbf2SRichard Henderson char str[80]; 
47775872bbf2SRichard Henderson }; 47785872bbf2SRichard Henderson 47795872bbf2SRichard Henderson struct ElfImage *img; 47805872bbf2SRichard Henderson 47815872bbf2SRichard Henderson static const struct ElfImage img_template = { 47825872bbf2SRichard Henderson .ehdr = { 47835872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 47845872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 47855872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 47865872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 47875872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 47885872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 47895872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 47905872bbf2SRichard Henderson .e_type = ET_EXEC, 47915872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 47925872bbf2SRichard Henderson .e_version = EV_CURRENT, 47935872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 47945872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 47955872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 47965872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 47975872bbf2SRichard Henderson .e_phnum = 1, 47985872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 47995872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 48005872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 4801abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 4802abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 4803abbb3eaeSRichard Henderson #endif 4804abbb3eaeSRichard Henderson #ifdef ELF_OSABI 4805abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 4806abbb3eaeSRichard Henderson #endif 48075872bbf2SRichard Henderson }, 48085872bbf2SRichard Henderson .phdr = { 48095872bbf2SRichard Henderson .p_type = PT_LOAD, 48105872bbf2SRichard Henderson .p_flags = PF_X, 48115872bbf2SRichard Henderson }, 48125872bbf2SRichard Henderson .shdr = { 48135872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 
48145872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 48155872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 48165872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 48175872bbf2SRichard Henderson will not look for contents. We can record any address. */ 48185872bbf2SRichard Henderson [1] = { /* .text */ 48195872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 48205872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 48215872bbf2SRichard Henderson }, 48225872bbf2SRichard Henderson [2] = { /* .debug_info */ 48235872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 48245872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 48255872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 48265872bbf2SRichard Henderson }, 48275872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 48285872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 48295872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 48305872bbf2SRichard Henderson .sh_size = sizeof(img->da), 48315872bbf2SRichard Henderson }, 48325872bbf2SRichard Henderson [4] = { /* .debug_frame */ 48335872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 48345872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 48355872bbf2SRichard Henderson }, 48365872bbf2SRichard Henderson [5] = { /* .symtab */ 48375872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 48385872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 48395872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 48405872bbf2SRichard Henderson .sh_info = 1, 48415872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 48425872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 48435872bbf2SRichard Henderson }, 48445872bbf2SRichard Henderson [6] = { /* .strtab */ 48455872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 48465872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, 
str), 48475872bbf2SRichard Henderson .sh_size = sizeof(img->str), 48485872bbf2SRichard Henderson } 48495872bbf2SRichard Henderson }, 48505872bbf2SRichard Henderson .sym = { 48515872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 48525872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 48535872bbf2SRichard Henderson .st_shndx = 1, 48545872bbf2SRichard Henderson } 48555872bbf2SRichard Henderson }, 48565872bbf2SRichard Henderson .di = { 48575872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 48585872bbf2SRichard Henderson .version = 2, 48595872bbf2SRichard Henderson .ptr_size = sizeof(void *), 48605872bbf2SRichard Henderson .cu_die = 1, 48615872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 48625872bbf2SRichard Henderson .fn_die = 2, 48635872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 48645872bbf2SRichard Henderson }, 48655872bbf2SRichard Henderson .da = { 48665872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 48675872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 48685872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 48695872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 48705872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 48715872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 48725872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 48735872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 48745872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 48755872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 48765872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 48775872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 48785872bbf2SRichard Henderson 0 /* no more abbrev */ 48795872bbf2SRichard Henderson }, 48805872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 48815872bbf2SRichard Henderson 
".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 4882813da627SRichard Henderson }; 4883813da627SRichard Henderson 4884813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 4885813da627SRichard Henderson static struct jit_code_entry one_entry; 4886813da627SRichard Henderson 48875872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 4888813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 48892c90784aSRichard Henderson DebugFrameHeader *dfh; 4890813da627SRichard Henderson 48915872bbf2SRichard Henderson img = g_malloc(img_size); 48925872bbf2SRichard Henderson *img = img_template; 4893813da627SRichard Henderson 48945872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 48955872bbf2SRichard Henderson img->phdr.p_paddr = buf; 48965872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 4897813da627SRichard Henderson 48985872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 48995872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 49005872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 4901813da627SRichard Henderson 49025872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 49035872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 49045872bbf2SRichard Henderson 49055872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 49065872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 49075872bbf2SRichard Henderson 49085872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 49095872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 49105872bbf2SRichard Henderson 49115872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 49125872bbf2SRichard Henderson img->sym[1].st_value = buf; 49135872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 
49145872bbf2SRichard Henderson 49155872bbf2SRichard Henderson img->di.cu_low_pc = buf; 491645aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 49175872bbf2SRichard Henderson img->di.fn_low_pc = buf; 491845aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 4919813da627SRichard Henderson 49202c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 49212c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 49222c90784aSRichard Henderson dfh->fde.func_start = buf; 49232c90784aSRichard Henderson dfh->fde.func_len = buf_size; 49242c90784aSRichard Henderson 4925813da627SRichard Henderson #ifdef DEBUG_JIT 4926813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 4927813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 4928813da627SRichard Henderson { 4929eb6b2edfSBin Meng g_autofree char *jit = g_strdup_printf("%s/qemu.jit", g_get_tmp_dir()); 4930eb6b2edfSBin Meng FILE *f = fopen(jit, "w+b"); 4931813da627SRichard Henderson if (f) { 49325872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 4933813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. 
*/
4934813da627SRichard Henderson }
4935813da627SRichard Henderson fclose(f);
4936813da627SRichard Henderson }
4937813da627SRichard Henderson }
4938813da627SRichard Henderson #endif
4939813da627SRichard Henderson
4940813da627SRichard Henderson one_entry.symfile_addr = img;
4941813da627SRichard Henderson one_entry.symfile_size = img_size;
4942813da627SRichard Henderson
4943813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN;
4944813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry;
4945813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry;
4946813da627SRichard Henderson __jit_debug_register_code();
4947813da627SRichard Henderson }
4948813da627SRichard Henderson #else
49495872bbf2SRichard Henderson /* No support for the feature in this configuration: this is the #else
   arm of the conditional that the "ELF_HOST_MACHINE" #endif below closes.
   Provide the entry point expected by exec.c, and implement the internal
   function we declared earlier.  Both definitions have empty bodies. */
4951813da627SRichard Henderson
/* Empty stand-in for the internal registration routine: all four
   arguments (buf, size, debug_frame, debug_frame_size) are ignored. */
4952755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf, size_t size,
49532c90784aSRichard Henderson const void *debug_frame,
49542c90784aSRichard Henderson size_t debug_frame_size)
4955813da627SRichard Henderson {
4956813da627SRichard Henderson }
4957813da627SRichard Henderson
/* Empty public entry point: buf and buf_size are ignored and nothing is
   registered. */
4958755bf9e5SRichard Henderson void tcg_register_jit(const void *buf, size_t buf_size)
4959813da627SRichard Henderson {
4960813da627SRichard Henderson }
4961813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */
4962db432672SRichard Henderson
/* Fallback definition of tcg_expand_vec_op(), compiled only when
   TCG_TARGET_MAYBE_vec evaluates to zero.  The body is solely
   g_assert_not_reached(), so every argument (including the variadic
   ones) is ignored and any call is treated as a bug.
   NOTE(review): presumably hosts without vector support never emit an
   opcode that needs expansion -- confirm against tcg-target.c.inc. */
4963db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec
4964db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...)
4965db432672SRichard Henderson {
4966db432672SRichard Henderson g_assert_not_reached();
4967db432672SRichard Henderson }
4968db432672SRichard Henderson #endif
4969