1c896fe29Sbellard /* 2c896fe29Sbellard * Tiny Code Generator for QEMU 3c896fe29Sbellard * 4c896fe29Sbellard * Copyright (c) 2008 Fabrice Bellard 5c896fe29Sbellard * 6c896fe29Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7c896fe29Sbellard * of this software and associated documentation files (the "Software"), to deal 8c896fe29Sbellard * in the Software without restriction, including without limitation the rights 9c896fe29Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10c896fe29Sbellard * copies of the Software, and to permit persons to whom the Software is 11c896fe29Sbellard * furnished to do so, subject to the following conditions: 12c896fe29Sbellard * 13c896fe29Sbellard * The above copyright notice and this permission notice shall be included in 14c896fe29Sbellard * all copies or substantial portions of the Software. 15c896fe29Sbellard * 16c896fe29Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17c896fe29Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18c896fe29Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19c896fe29Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20c896fe29Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21c896fe29Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22c896fe29Sbellard * THE SOFTWARE. 23c896fe29Sbellard */ 24c896fe29Sbellard 25c896fe29Sbellard /* define it to use liveness analysis (better code) */ 268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS 27c896fe29Sbellard 28757e725bSPeter Maydell #include "qemu/osdep.h" 29cca82982Saurel32 30813da627SRichard Henderson /* Define to dump the ELF file used to communicate with GDB. */ 31813da627SRichard Henderson #undef DEBUG_JIT 32813da627SRichard Henderson 3372fd2efbSEmilio G.
Cota #include "qemu/error-report.h" 34f348b6d1SVeronia Bahaa #include "qemu/cutils.h" 351de7afc9SPaolo Bonzini #include "qemu/host-utils.h" 36d4c51a0aSMarkus Armbruster #include "qemu/qemu-print.h" 371de7afc9SPaolo Bonzini #include "qemu/timer.h" 38084cfca1SRichard Henderson #include "qemu/cacheflush.h" 39ad768e6fSPeter Maydell #include "qemu/cacheinfo.h" 40c896fe29Sbellard 41c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU 42c896fe29Sbellard CPU definitions. Currently they are used for qemu_ld/st 43c896fe29Sbellard instructions */ 44c896fe29Sbellard #define NO_CPU_IO_DEFS 45c896fe29Sbellard 4663c91552SPaolo Bonzini #include "exec/exec-all.h" 47dcb32f1dSPhilippe Mathieu-Daudé #include "tcg/tcg-op.h" 48813da627SRichard Henderson 49edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX 50813da627SRichard Henderson # define ELF_CLASS ELFCLASS32 51edee2579SRichard Henderson #else 52edee2579SRichard Henderson # define ELF_CLASS ELFCLASS64 53813da627SRichard Henderson #endif 54e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 55813da627SRichard Henderson # define ELF_DATA ELFDATA2MSB 56813da627SRichard Henderson #else 57813da627SRichard Henderson # define ELF_DATA ELFDATA2LSB 58813da627SRichard Henderson #endif 59813da627SRichard Henderson 60c896fe29Sbellard #include "elf.h" 61508127e2SPaolo Bonzini #include "exec/log.h" 62d2ba8026SRichard Henderson #include "tcg/tcg-ldst.h" 635ff7258cSRichard Henderson #include "tcg-internal.h" 64c896fe29Sbellard 6522f15579SRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 6622f15579SRichard Henderson #include <ffi.h> 6722f15579SRichard Henderson #endif 6822f15579SRichard Henderson 69139c1837SPaolo Bonzini /* Forward declarations for functions declared in tcg-target.c.inc and 70ce151109SPeter Maydell used here. 
*/ 71e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s); 72e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s); 736ac17786SRichard Henderson static bool patch_reloc(tcg_insn_unit *code_ptr, int type, 742ba7fae2SRichard Henderson intptr_t value, intptr_t addend); 75c896fe29Sbellard 76497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts. */ 77497a22ebSRichard Henderson typedef struct { 78497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 79497a22ebSRichard Henderson uint32_t id; 80497a22ebSRichard Henderson uint8_t version; 81497a22ebSRichard Henderson char augmentation[1]; 82497a22ebSRichard Henderson uint8_t code_align; 83497a22ebSRichard Henderson uint8_t data_align; 84497a22ebSRichard Henderson uint8_t return_column; 85497a22ebSRichard Henderson } DebugFrameCIE; 86497a22ebSRichard Henderson 87497a22ebSRichard Henderson typedef struct QEMU_PACKED { 88497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 89497a22ebSRichard Henderson uint32_t cie_offset; 90edee2579SRichard Henderson uintptr_t func_start; 91edee2579SRichard Henderson uintptr_t func_len; 92497a22ebSRichard Henderson } DebugFrameFDEHeader; 93497a22ebSRichard Henderson 942c90784aSRichard Henderson typedef struct QEMU_PACKED { 952c90784aSRichard Henderson DebugFrameCIE cie; 962c90784aSRichard Henderson DebugFrameFDEHeader fde; 972c90784aSRichard Henderson } DebugFrameHeader; 982c90784aSRichard Henderson 99755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf, size_t size, 1002c90784aSRichard Henderson const void *debug_frame, 1012c90784aSRichard Henderson size_t debug_frame_size) 102813da627SRichard Henderson __attribute__((unused)); 103813da627SRichard Henderson 104139c1837SPaolo Bonzini /* Forward declarations for functions declared and used in tcg-target.c.inc. 
*/ 1052a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1, 106a05b5b9bSRichard Henderson intptr_t arg2); 10778113e83SRichard Henderson static bool tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg); 108c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type, 1092a534affSRichard Henderson TCGReg ret, tcg_target_long arg); 1105e8892dbSMiroslav Rezanina static void tcg_out_op(TCGContext *s, TCGOpcode opc, 1115e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1125e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]); 113d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec 114e7632cfaSRichard Henderson static bool tcg_out_dup_vec(TCGContext *s, TCGType type, unsigned vece, 115e7632cfaSRichard Henderson TCGReg dst, TCGReg src); 116d6ecb4a9SRichard Henderson static bool tcg_out_dupm_vec(TCGContext *s, TCGType type, unsigned vece, 117d6ecb4a9SRichard Henderson TCGReg dst, TCGReg base, intptr_t offset); 1184e186175SRichard Henderson static void tcg_out_dupi_vec(TCGContext *s, TCGType type, unsigned vece, 1194e186175SRichard Henderson TCGReg dst, int64_t arg); 1205e8892dbSMiroslav Rezanina static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, 1215e8892dbSMiroslav Rezanina unsigned vecl, unsigned vece, 1225e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1235e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]); 124d2fd745fSRichard Henderson #else 125e7632cfaSRichard Henderson static inline bool tcg_out_dup_vec(TCGContext *s, TCGType type, unsigned vece, 126e7632cfaSRichard Henderson TCGReg dst, TCGReg src) 127e7632cfaSRichard Henderson { 128e7632cfaSRichard Henderson g_assert_not_reached(); 129e7632cfaSRichard Henderson } 130d6ecb4a9SRichard Henderson static inline bool tcg_out_dupm_vec(TCGContext *s, TCGType type, unsigned vece, 131d6ecb4a9SRichard Henderson TCGReg dst, TCGReg base, intptr_t offset) 132d6ecb4a9SRichard Henderson { 
133d6ecb4a9SRichard Henderson g_assert_not_reached(); 134d6ecb4a9SRichard Henderson } 1354e186175SRichard Henderson static inline void tcg_out_dupi_vec(TCGContext *s, TCGType type, unsigned vece, 1364e186175SRichard Henderson TCGReg dst, int64_t arg) 137e7632cfaSRichard Henderson { 138e7632cfaSRichard Henderson g_assert_not_reached(); 139e7632cfaSRichard Henderson } 1405e8892dbSMiroslav Rezanina static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, 1415e8892dbSMiroslav Rezanina unsigned vecl, unsigned vece, 1425e8892dbSMiroslav Rezanina const TCGArg args[TCG_MAX_OP_ARGS], 1435e8892dbSMiroslav Rezanina const int const_args[TCG_MAX_OP_ARGS]) 144d2fd745fSRichard Henderson { 145d2fd745fSRichard Henderson g_assert_not_reached(); 146d2fd745fSRichard Henderson } 147d2fd745fSRichard Henderson #endif 1482a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, 149a05b5b9bSRichard Henderson intptr_t arg2); 15059d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val, 15159d7c14eSRichard Henderson TCGReg base, intptr_t ofs); 1527b7d8b2dSRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 1537b7d8b2dSRichard Henderson static void tcg_out_call(TCGContext *s, const tcg_insn_unit *target, 1547b7d8b2dSRichard Henderson ffi_cif *cif); 1557b7d8b2dSRichard Henderson #else 1562be7d76bSRichard Henderson static void tcg_out_call(TCGContext *s, const tcg_insn_unit *target); 1577b7d8b2dSRichard Henderson #endif 158a4fbbd77SRichard Henderson static bool tcg_target_const_match(int64_t val, TCGType type, int ct); 159659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 160aeee05f5SRichard Henderson static int tcg_out_ldst_finalize(TCGContext *s); 161659ef5cbSRichard Henderson #endif 162c896fe29Sbellard 16342eb6dfcSRichard Henderson TCGContext tcg_init_ctx; 16442eb6dfcSRichard Henderson __thread TCGContext *tcg_ctx; 16542eb6dfcSRichard Henderson 1665ff7258cSRichard Henderson TCGContext **tcg_ctxs; 
1670e2d61cfSRichard Henderson unsigned int tcg_cur_ctxs; 1680e2d61cfSRichard Henderson unsigned int tcg_max_ctxs; 1691c2adb95SRichard Henderson TCGv_env cpu_env = 0; 170c8bc1168SRichard Henderson const void *tcg_code_gen_epilogue; 171db0c51a3SRichard Henderson uintptr_t tcg_splitwx_diff; 172df2cce29SEmilio G. Cota 173b91ccb31SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 174b91ccb31SRichard Henderson tcg_prologue_fn *tcg_qemu_tb_exec; 175b91ccb31SRichard Henderson #endif 176b91ccb31SRichard Henderson 177d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT]; 178b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 179c896fe29Sbellard 1801813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1814196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 182c896fe29Sbellard { 183c896fe29Sbellard *s->code_ptr++ = v; 184c896fe29Sbellard } 185c896fe29Sbellard 1864196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1874196dca6SPeter Maydell uint8_t v) 1885c53bb81SPeter Maydell { 1891813e175SRichard Henderson *p = v; 1905c53bb81SPeter Maydell } 1911813e175SRichard Henderson #endif 1925c53bb81SPeter Maydell 1931813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1944196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 195c896fe29Sbellard { 1961813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1971813e175SRichard Henderson *s->code_ptr++ = v; 1981813e175SRichard Henderson } else { 1991813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2004387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2011813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 2021813e175SRichard Henderson } 203c896fe29Sbellard } 204c896fe29Sbellard 2054196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 2064196dca6SPeter Maydell 
uint16_t v) 2075c53bb81SPeter Maydell { 2081813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 2091813e175SRichard Henderson *p = v; 2101813e175SRichard Henderson } else { 2115c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2125c53bb81SPeter Maydell } 2131813e175SRichard Henderson } 2141813e175SRichard Henderson #endif 2155c53bb81SPeter Maydell 2161813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 2174196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 218c896fe29Sbellard { 2191813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2201813e175SRichard Henderson *s->code_ptr++ = v; 2211813e175SRichard Henderson } else { 2221813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2234387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2241813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 2251813e175SRichard Henderson } 226c896fe29Sbellard } 227c896fe29Sbellard 2284196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 2294196dca6SPeter Maydell uint32_t v) 2305c53bb81SPeter Maydell { 2311813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2321813e175SRichard Henderson *p = v; 2331813e175SRichard Henderson } else { 2345c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2355c53bb81SPeter Maydell } 2361813e175SRichard Henderson } 2371813e175SRichard Henderson #endif 2385c53bb81SPeter Maydell 2391813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 2404196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 241ac26eb69SRichard Henderson { 2421813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2431813e175SRichard Henderson *s->code_ptr++ = v; 2441813e175SRichard Henderson } else { 2451813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2464387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2471813e175SRichard Henderson s->code_ptr = p + (8 / 
TCG_TARGET_INSN_UNIT_SIZE); 2481813e175SRichard Henderson } 249ac26eb69SRichard Henderson } 250ac26eb69SRichard Henderson 2514196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 2524196dca6SPeter Maydell uint64_t v) 2535c53bb81SPeter Maydell { 2541813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2551813e175SRichard Henderson *p = v; 2561813e175SRichard Henderson } else { 2575c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2585c53bb81SPeter Maydell } 2591813e175SRichard Henderson } 2601813e175SRichard Henderson #endif 2615c53bb81SPeter Maydell 262c896fe29Sbellard /* label relocation processing */ 263c896fe29Sbellard 2641813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 265bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 266c896fe29Sbellard { 2677ecd02a0SRichard Henderson TCGRelocation *r = tcg_malloc(sizeof(TCGRelocation)); 268c896fe29Sbellard 269c896fe29Sbellard r->type = type; 270c896fe29Sbellard r->ptr = code_ptr; 271c896fe29Sbellard r->addend = addend; 2727ecd02a0SRichard Henderson QSIMPLEQ_INSERT_TAIL(&l->relocs, r, next); 273c896fe29Sbellard } 274c896fe29Sbellard 27592ab8e7dSRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l) 276c896fe29Sbellard { 277eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 278c896fe29Sbellard l->has_value = 1; 27992ab8e7dSRichard Henderson l->u.value_ptr = tcg_splitwx_to_rx(s->code_ptr); 280c896fe29Sbellard } 281c896fe29Sbellard 28242a268c2SRichard Henderson TCGLabel *gen_new_label(void) 283c896fe29Sbellard { 284b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 28551e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 286c896fe29Sbellard 2877ecd02a0SRichard Henderson memset(l, 0, sizeof(TCGLabel)); 2887ecd02a0SRichard Henderson l->id = s->nb_labels++; 2897ecd02a0SRichard Henderson QSIMPLEQ_INIT(&l->relocs); 2907ecd02a0SRichard Henderson 291bef16ab4SRichard Henderson QSIMPLEQ_INSERT_TAIL(&s->labels, l, next); 29242a268c2SRichard Henderson 29342a268c2SRichard Henderson return l; 294c896fe29Sbellard } 295c896fe29Sbellard 2967ecd02a0SRichard Henderson static bool tcg_resolve_relocs(TCGContext *s) 2977ecd02a0SRichard Henderson { 2987ecd02a0SRichard Henderson TCGLabel *l; 2997ecd02a0SRichard Henderson 3007ecd02a0SRichard Henderson QSIMPLEQ_FOREACH(l, &s->labels, next) { 3017ecd02a0SRichard Henderson TCGRelocation *r; 3027ecd02a0SRichard Henderson uintptr_t value = l->u.value; 3037ecd02a0SRichard Henderson 3047ecd02a0SRichard Henderson QSIMPLEQ_FOREACH(r, &l->relocs, next) { 3057ecd02a0SRichard Henderson if (!patch_reloc(r->ptr, r->type, value, r->addend)) { 3067ecd02a0SRichard Henderson return false; 3077ecd02a0SRichard Henderson } 3087ecd02a0SRichard Henderson } 3097ecd02a0SRichard Henderson } 3107ecd02a0SRichard Henderson return true; 3117ecd02a0SRichard Henderson } 3127ecd02a0SRichard Henderson 3139f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which) 3149f754620SRichard Henderson { 315f14bed3fSRichard Henderson /* 316f14bed3fSRichard Henderson * We will check for overflow at the end of the opcode loop in 317f14bed3fSRichard Henderson * tcg_gen_code, where we bound tcg_current_code_size to UINT16_MAX. 318f14bed3fSRichard Henderson */ 319f14bed3fSRichard Henderson s->tb_jmp_reset_offset[which] = tcg_current_code_size(s); 3209f754620SRichard Henderson } 3219f754620SRichard Henderson 322db6b7d0cSRichard Henderson /* Signal overflow, starting over with fewer guest insns. 
*/ 3238905770bSMarc-André Lureau static G_NORETURN 3248905770bSMarc-André Lureau void tcg_raise_tb_overflow(TCGContext *s) 325db6b7d0cSRichard Henderson { 326db6b7d0cSRichard Henderson siglongjmp(s->jmp_trans, -2); 327db6b7d0cSRichard Henderson } 328db6b7d0cSRichard Henderson 3294c22e840SRichard Henderson #define C_PFX1(P, A) P##A 3304c22e840SRichard Henderson #define C_PFX2(P, A, B) P##A##_##B 3314c22e840SRichard Henderson #define C_PFX3(P, A, B, C) P##A##_##B##_##C 3324c22e840SRichard Henderson #define C_PFX4(P, A, B, C, D) P##A##_##B##_##C##_##D 3334c22e840SRichard Henderson #define C_PFX5(P, A, B, C, D, E) P##A##_##B##_##C##_##D##_##E 3344c22e840SRichard Henderson #define C_PFX6(P, A, B, C, D, E, F) P##A##_##B##_##C##_##D##_##E##_##F 3354c22e840SRichard Henderson 3364c22e840SRichard Henderson /* Define an enumeration for the various combinations. */ 3374c22e840SRichard Henderson 3384c22e840SRichard Henderson #define C_O0_I1(I1) C_PFX1(c_o0_i1_, I1), 3394c22e840SRichard Henderson #define C_O0_I2(I1, I2) C_PFX2(c_o0_i2_, I1, I2), 3404c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) C_PFX3(c_o0_i3_, I1, I2, I3), 3414c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) C_PFX4(c_o0_i4_, I1, I2, I3, I4), 3424c22e840SRichard Henderson 3434c22e840SRichard Henderson #define C_O1_I1(O1, I1) C_PFX2(c_o1_i1_, O1, I1), 3444c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) C_PFX3(c_o1_i2_, O1, I1, I2), 3454c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) C_PFX4(c_o1_i3_, O1, I1, I2, I3), 3464c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) C_PFX5(c_o1_i4_, O1, I1, I2, I3, I4), 3474c22e840SRichard Henderson 3484c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) C_PFX3(c_n1_i2_, O1, I1, I2), 3494c22e840SRichard Henderson 3504c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) C_PFX3(c_o2_i1_, O1, O2, I1), 3514c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) C_PFX4(c_o2_i2_, O1, O2, I1, I2), 3524c22e840SRichard Henderson #define 
C_O2_I3(O1, O2, I1, I2, I3) C_PFX5(c_o2_i3_, O1, O2, I1, I2, I3), 3534c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) C_PFX6(c_o2_i4_, O1, O2, I1, I2, I3, I4), 3544c22e840SRichard Henderson 3554c22e840SRichard Henderson typedef enum { 3564c22e840SRichard Henderson #include "tcg-target-con-set.h" 3574c22e840SRichard Henderson } TCGConstraintSetIndex; 3584c22e840SRichard Henderson 3594c22e840SRichard Henderson static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode); 3604c22e840SRichard Henderson 3614c22e840SRichard Henderson #undef C_O0_I1 3624c22e840SRichard Henderson #undef C_O0_I2 3634c22e840SRichard Henderson #undef C_O0_I3 3644c22e840SRichard Henderson #undef C_O0_I4 3654c22e840SRichard Henderson #undef C_O1_I1 3664c22e840SRichard Henderson #undef C_O1_I2 3674c22e840SRichard Henderson #undef C_O1_I3 3684c22e840SRichard Henderson #undef C_O1_I4 3694c22e840SRichard Henderson #undef C_N1_I2 3704c22e840SRichard Henderson #undef C_O2_I1 3714c22e840SRichard Henderson #undef C_O2_I2 3724c22e840SRichard Henderson #undef C_O2_I3 3734c22e840SRichard Henderson #undef C_O2_I4 3744c22e840SRichard Henderson 3754c22e840SRichard Henderson /* Put all of the constraint sets into an array, indexed by the enum. 
*/ 3764c22e840SRichard Henderson 3774c22e840SRichard Henderson #define C_O0_I1(I1) { .args_ct_str = { #I1 } }, 3784c22e840SRichard Henderson #define C_O0_I2(I1, I2) { .args_ct_str = { #I1, #I2 } }, 3794c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) { .args_ct_str = { #I1, #I2, #I3 } }, 3804c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) { .args_ct_str = { #I1, #I2, #I3, #I4 } }, 3814c22e840SRichard Henderson 3824c22e840SRichard Henderson #define C_O1_I1(O1, I1) { .args_ct_str = { #O1, #I1 } }, 3834c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) { .args_ct_str = { #O1, #I1, #I2 } }, 3844c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) { .args_ct_str = { #O1, #I1, #I2, #I3 } }, 3854c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) { .args_ct_str = { #O1, #I1, #I2, #I3, #I4 } }, 3864c22e840SRichard Henderson 3874c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) { .args_ct_str = { "&" #O1, #I1, #I2 } }, 3884c22e840SRichard Henderson 3894c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) { .args_ct_str = { #O1, #O2, #I1 } }, 3904c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) { .args_ct_str = { #O1, #O2, #I1, #I2 } }, 3914c22e840SRichard Henderson #define C_O2_I3(O1, O2, I1, I2, I3) { .args_ct_str = { #O1, #O2, #I1, #I2, #I3 } }, 3924c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) { .args_ct_str = { #O1, #O2, #I1, #I2, #I3, #I4 } }, 3934c22e840SRichard Henderson 3944c22e840SRichard Henderson static const TCGTargetOpDef constraint_sets[] = { 3954c22e840SRichard Henderson #include "tcg-target-con-set.h" 3964c22e840SRichard Henderson }; 3974c22e840SRichard Henderson 3984c22e840SRichard Henderson 3994c22e840SRichard Henderson #undef C_O0_I1 4004c22e840SRichard Henderson #undef C_O0_I2 4014c22e840SRichard Henderson #undef C_O0_I3 4024c22e840SRichard Henderson #undef C_O0_I4 4034c22e840SRichard Henderson #undef C_O1_I1 4044c22e840SRichard Henderson #undef C_O1_I2 4054c22e840SRichard Henderson 
#undef C_O1_I3 4064c22e840SRichard Henderson #undef C_O1_I4 4074c22e840SRichard Henderson #undef C_N1_I2 4084c22e840SRichard Henderson #undef C_O2_I1 4094c22e840SRichard Henderson #undef C_O2_I2 4104c22e840SRichard Henderson #undef C_O2_I3 4114c22e840SRichard Henderson #undef C_O2_I4 4124c22e840SRichard Henderson 4134c22e840SRichard Henderson /* Expand the enumerator to be returned from tcg_target_op_def(). */ 4144c22e840SRichard Henderson 4154c22e840SRichard Henderson #define C_O0_I1(I1) C_PFX1(c_o0_i1_, I1) 4164c22e840SRichard Henderson #define C_O0_I2(I1, I2) C_PFX2(c_o0_i2_, I1, I2) 4174c22e840SRichard Henderson #define C_O0_I3(I1, I2, I3) C_PFX3(c_o0_i3_, I1, I2, I3) 4184c22e840SRichard Henderson #define C_O0_I4(I1, I2, I3, I4) C_PFX4(c_o0_i4_, I1, I2, I3, I4) 4194c22e840SRichard Henderson 4204c22e840SRichard Henderson #define C_O1_I1(O1, I1) C_PFX2(c_o1_i1_, O1, I1) 4214c22e840SRichard Henderson #define C_O1_I2(O1, I1, I2) C_PFX3(c_o1_i2_, O1, I1, I2) 4224c22e840SRichard Henderson #define C_O1_I3(O1, I1, I2, I3) C_PFX4(c_o1_i3_, O1, I1, I2, I3) 4234c22e840SRichard Henderson #define C_O1_I4(O1, I1, I2, I3, I4) C_PFX5(c_o1_i4_, O1, I1, I2, I3, I4) 4244c22e840SRichard Henderson 4254c22e840SRichard Henderson #define C_N1_I2(O1, I1, I2) C_PFX3(c_n1_i2_, O1, I1, I2) 4264c22e840SRichard Henderson 4274c22e840SRichard Henderson #define C_O2_I1(O1, O2, I1) C_PFX3(c_o2_i1_, O1, O2, I1) 4284c22e840SRichard Henderson #define C_O2_I2(O1, O2, I1, I2) C_PFX4(c_o2_i2_, O1, O2, I1, I2) 4294c22e840SRichard Henderson #define C_O2_I3(O1, O2, I1, I2, I3) C_PFX5(c_o2_i3_, O1, O2, I1, I2, I3) 4304c22e840SRichard Henderson #define C_O2_I4(O1, O2, I1, I2, I3, I4) C_PFX6(c_o2_i4_, O1, O2, I1, I2, I3, I4) 4314c22e840SRichard Henderson 432139c1837SPaolo Bonzini #include "tcg-target.c.inc" 433c896fe29Sbellard 43438b47b19SEmilio G. Cota static void alloc_tcg_plugin_context(TCGContext *s) 43538b47b19SEmilio G. Cota { 43638b47b19SEmilio G. Cota #ifdef CONFIG_PLUGIN 43738b47b19SEmilio G. 
Cota s->plugin_tb = g_new0(struct qemu_plugin_tb, 1); 43838b47b19SEmilio G. Cota s->plugin_tb->insns = 43938b47b19SEmilio G. Cota g_ptr_array_new_with_free_func(qemu_plugin_insn_cleanup_fn); 44038b47b19SEmilio G. Cota #endif 44138b47b19SEmilio G. Cota } 44238b47b19SEmilio G. Cota 443e8feb96fSEmilio G. Cota /* 4443468b59eSEmilio G. Cota * All TCG threads except the parent (i.e. the one that called tcg_context_init 4453468b59eSEmilio G. Cota * and registered the target's TCG globals) must register with this function 4463468b59eSEmilio G. Cota * before initiating translation. 4473468b59eSEmilio G. Cota * 4483468b59eSEmilio G. Cota * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation 4493468b59eSEmilio G. Cota * of tcg_region_init() for the reasoning behind this. 4503468b59eSEmilio G. Cota * 4513468b59eSEmilio G. Cota * In softmmu each caller registers its context in tcg_ctxs[]. Note that in 4523468b59eSEmilio G. Cota * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context 4533468b59eSEmilio G. Cota * is not used anymore for translation once this function is called. 4543468b59eSEmilio G. Cota * 4553468b59eSEmilio G. Cota * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates 4563468b59eSEmilio G. Cota * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode. 4573468b59eSEmilio G. Cota */ 4583468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 4593468b59eSEmilio G. Cota void tcg_register_thread(void) 4603468b59eSEmilio G. Cota { 4613468b59eSEmilio G. Cota tcg_ctx = &tcg_init_ctx; 4623468b59eSEmilio G. Cota } 4633468b59eSEmilio G. Cota #else 4643468b59eSEmilio G. Cota void tcg_register_thread(void) 4653468b59eSEmilio G. Cota { 4663468b59eSEmilio G. Cota TCGContext *s = g_malloc(sizeof(*s)); 4673468b59eSEmilio G. Cota unsigned int i, n; 4683468b59eSEmilio G. Cota 4693468b59eSEmilio G. Cota *s = tcg_init_ctx; 4703468b59eSEmilio G. Cota 4713468b59eSEmilio G. Cota /* Relink mem_base. 
*/ 4723468b59eSEmilio G. Cota for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) { 4733468b59eSEmilio G. Cota if (tcg_init_ctx.temps[i].mem_base) { 4743468b59eSEmilio G. Cota ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps; 4753468b59eSEmilio G. Cota tcg_debug_assert(b >= 0 && b < n); 4763468b59eSEmilio G. Cota s->temps[i].mem_base = &s->temps[b]; 4773468b59eSEmilio G. Cota } 4783468b59eSEmilio G. Cota } 4793468b59eSEmilio G. Cota 4803468b59eSEmilio G. Cota /* Claim an entry in tcg_ctxs */ 4810e2d61cfSRichard Henderson n = qatomic_fetch_inc(&tcg_cur_ctxs); 4820e2d61cfSRichard Henderson g_assert(n < tcg_max_ctxs); 483d73415a3SStefan Hajnoczi qatomic_set(&tcg_ctxs[n], s); 4843468b59eSEmilio G. Cota 48538b47b19SEmilio G. Cota if (n > 0) { 48638b47b19SEmilio G. Cota alloc_tcg_plugin_context(s); 487bf042e8eSRichard Henderson tcg_region_initial_alloc(s); 48838b47b19SEmilio G. Cota } 48938b47b19SEmilio G. Cota 4903468b59eSEmilio G. Cota tcg_ctx = s; 4913468b59eSEmilio G. Cota } 4923468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */ 4933468b59eSEmilio G. 
Cota 494c896fe29Sbellard /* pool based memory allocation */ 495c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 496c896fe29Sbellard { 497c896fe29Sbellard TCGPool *p; 498c896fe29Sbellard int pool_size; 499c896fe29Sbellard 500c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 501c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 5027267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 503c896fe29Sbellard p->size = size; 5044055299eSKirill Batuzov p->next = s->pool_first_large; 5054055299eSKirill Batuzov s->pool_first_large = p; 5064055299eSKirill Batuzov return p->data; 507c896fe29Sbellard } else { 508c896fe29Sbellard p = s->pool_current; 509c896fe29Sbellard if (!p) { 510c896fe29Sbellard p = s->pool_first; 511c896fe29Sbellard if (!p) 512c896fe29Sbellard goto new_pool; 513c896fe29Sbellard } else { 514c896fe29Sbellard if (!p->next) { 515c896fe29Sbellard new_pool: 516c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 5177267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 518c896fe29Sbellard p->size = pool_size; 519c896fe29Sbellard p->next = NULL; 520a813e36fSRichard Henderson if (s->pool_current) { 521c896fe29Sbellard s->pool_current->next = p; 522a813e36fSRichard Henderson } else { 523c896fe29Sbellard s->pool_first = p; 524a813e36fSRichard Henderson } 525c896fe29Sbellard } else { 526c896fe29Sbellard p = p->next; 527c896fe29Sbellard } 528c896fe29Sbellard } 529c896fe29Sbellard } 530c896fe29Sbellard s->pool_current = p; 531c896fe29Sbellard s->pool_cur = p->data + size; 532c896fe29Sbellard s->pool_end = p->data + p->size; 533c896fe29Sbellard return p->data; 534c896fe29Sbellard } 535c896fe29Sbellard 536c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 537c896fe29Sbellard { 5384055299eSKirill Batuzov TCGPool *p, *t; 5394055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 5404055299eSKirill Batuzov t = p->next; 5414055299eSKirill Batuzov g_free(p); 5424055299eSKirill Batuzov } 5434055299eSKirill 
Batuzov s->pool_first_large = NULL; 544c896fe29Sbellard s->pool_cur = s->pool_end = NULL; 545c896fe29Sbellard s->pool_current = NULL; 546c896fe29Sbellard } 547c896fe29Sbellard 5482ef6175aSRichard Henderson #include "exec/helper-proto.h" 5492ef6175aSRichard Henderson 550100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 5512ef6175aSRichard Henderson #include "exec/helper-tcg.h" 552100b5e01SRichard Henderson }; 553619205fdSEmilio G. Cota static GHashTable *helper_table; 554100b5e01SRichard Henderson 55522f15579SRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 55622f15579SRichard Henderson static GHashTable *ffi_table; 55722f15579SRichard Henderson 55822f15579SRichard Henderson static ffi_type * const typecode_to_ffi[8] = { 55922f15579SRichard Henderson [dh_typecode_void] = &ffi_type_void, 56022f15579SRichard Henderson [dh_typecode_i32] = &ffi_type_uint32, 56122f15579SRichard Henderson [dh_typecode_s32] = &ffi_type_sint32, 56222f15579SRichard Henderson [dh_typecode_i64] = &ffi_type_uint64, 56322f15579SRichard Henderson [dh_typecode_s64] = &ffi_type_sint64, 56422f15579SRichard Henderson [dh_typecode_ptr] = &ffi_type_pointer, 56522f15579SRichard Henderson }; 56622f15579SRichard Henderson #endif 56722f15579SRichard Henderson 56891478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 569f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 5701c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 5711c2adb95SRichard Henderson TCGReg reg, const char *name); 57291478cefSRichard Henderson 57343b972b7SRichard Henderson static void tcg_context_init(unsigned max_cpus) 574c896fe29Sbellard { 575a76aabd3SRichard Henderson TCGContext *s = &tcg_init_ctx; 576100b5e01SRichard Henderson int op, total_args, n, i; 577c896fe29Sbellard TCGOpDef *def; 578c896fe29Sbellard TCGArgConstraint *args_ct; 5791c2adb95SRichard Henderson TCGTemp *ts; 580c896fe29Sbellard 
581c896fe29Sbellard memset(s, 0, sizeof(*s)); 582c896fe29Sbellard s->nb_globals = 0; 583c896fe29Sbellard 584c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 585c896fe29Sbellard space */ 586c896fe29Sbellard total_args = 0; 587c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 588c896fe29Sbellard def = &tcg_op_defs[op]; 589c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 590c896fe29Sbellard total_args += n; 591c896fe29Sbellard } 592c896fe29Sbellard 593bc2b17e6SRichard Henderson args_ct = g_new0(TCGArgConstraint, total_args); 594c896fe29Sbellard 595c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 596c896fe29Sbellard def = &tcg_op_defs[op]; 597c896fe29Sbellard def->args_ct = args_ct; 598c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 599c896fe29Sbellard args_ct += n; 600c896fe29Sbellard } 601c896fe29Sbellard 6025cd8f621SRichard Henderson /* Register helpers. */ 60384fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 604619205fdSEmilio G. Cota helper_table = g_hash_table_new(NULL, NULL); 60584fd9dd3SRichard Henderson 606100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 60784fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 60872866e82SRichard Henderson (gpointer)&all_helpers[i]); 609100b5e01SRichard Henderson } 6105cd8f621SRichard Henderson 61122f15579SRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 61222f15579SRichard Henderson /* g_direct_hash/equal for direct comparisons on uint32_t. 
*/ 61322f15579SRichard Henderson ffi_table = g_hash_table_new(NULL, NULL); 61422f15579SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 61522f15579SRichard Henderson struct { 61622f15579SRichard Henderson ffi_cif cif; 61722f15579SRichard Henderson ffi_type *args[]; 61822f15579SRichard Henderson } *ca; 61922f15579SRichard Henderson uint32_t typemask = all_helpers[i].typemask; 62022f15579SRichard Henderson gpointer hash = (gpointer)(uintptr_t)typemask; 62122f15579SRichard Henderson ffi_status status; 62222f15579SRichard Henderson int nargs; 62322f15579SRichard Henderson 62422f15579SRichard Henderson if (g_hash_table_lookup(ffi_table, hash)) { 62522f15579SRichard Henderson continue; 62622f15579SRichard Henderson } 62722f15579SRichard Henderson 62822f15579SRichard Henderson /* Ignoring the return type, find the last non-zero field. */ 62922f15579SRichard Henderson nargs = 32 - clz32(typemask >> 3); 63022f15579SRichard Henderson nargs = DIV_ROUND_UP(nargs, 3); 63122f15579SRichard Henderson 63222f15579SRichard Henderson ca = g_malloc0(sizeof(*ca) + nargs * sizeof(ffi_type *)); 63322f15579SRichard Henderson ca->cif.rtype = typecode_to_ffi[typemask & 7]; 63422f15579SRichard Henderson ca->cif.nargs = nargs; 63522f15579SRichard Henderson 63622f15579SRichard Henderson if (nargs != 0) { 63722f15579SRichard Henderson ca->cif.arg_types = ca->args; 6389dd1d56eSIcenowy Zheng for (int j = 0; j < nargs; ++j) { 6399dd1d56eSIcenowy Zheng int typecode = extract32(typemask, (j + 1) * 3, 3); 6409dd1d56eSIcenowy Zheng ca->args[j] = typecode_to_ffi[typecode]; 64122f15579SRichard Henderson } 64222f15579SRichard Henderson } 64322f15579SRichard Henderson 64422f15579SRichard Henderson status = ffi_prep_cif(&ca->cif, FFI_DEFAULT_ABI, nargs, 64522f15579SRichard Henderson ca->cif.rtype, ca->cif.arg_types); 64622f15579SRichard Henderson assert(status == FFI_OK); 64722f15579SRichard Henderson 64822f15579SRichard Henderson g_hash_table_insert(ffi_table, hash, (gpointer)&ca->cif); 
64922f15579SRichard Henderson } 65022f15579SRichard Henderson #endif 65122f15579SRichard Henderson 652c896fe29Sbellard tcg_target_init(s); 653f69d277eSRichard Henderson process_op_defs(s); 65491478cefSRichard Henderson 65591478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 65691478cefSRichard Henderson the start of tcg_target_reg_alloc_order. */ 65791478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 65891478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 65991478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 66091478cefSRichard Henderson break; 66191478cefSRichard Henderson } 66291478cefSRichard Henderson } 66391478cefSRichard Henderson for (i = 0; i < n; ++i) { 66491478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 66591478cefSRichard Henderson } 66691478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 66791478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 66891478cefSRichard Henderson } 669b1311c4aSEmilio G. Cota 67038b47b19SEmilio G. Cota alloc_tcg_plugin_context(s); 67138b47b19SEmilio G. Cota 672b1311c4aSEmilio G. Cota tcg_ctx = s; 6733468b59eSEmilio G. Cota /* 6743468b59eSEmilio G. Cota * In user-mode we simply share the init context among threads, since we 6753468b59eSEmilio G. Cota * use a single region. See the documentation tcg_region_init() for the 6763468b59eSEmilio G. Cota * reasoning behind this. 6773468b59eSEmilio G. Cota * In softmmu we will have at most max_cpus TCG threads. 6783468b59eSEmilio G. Cota */ 6793468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 680df2cce29SEmilio G. Cota tcg_ctxs = &tcg_ctx; 6810e2d61cfSRichard Henderson tcg_cur_ctxs = 1; 6820e2d61cfSRichard Henderson tcg_max_ctxs = 1; 6833468b59eSEmilio G. 
Cota #else 6840e2d61cfSRichard Henderson tcg_max_ctxs = max_cpus; 6850e2d61cfSRichard Henderson tcg_ctxs = g_new0(TCGContext *, max_cpus); 6863468b59eSEmilio G. Cota #endif 6871c2adb95SRichard Henderson 6881c2adb95SRichard Henderson tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0)); 6891c2adb95SRichard Henderson ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env"); 6901c2adb95SRichard Henderson cpu_env = temp_tcgv_ptr(ts); 6919002ec79SRichard Henderson } 692b03cce8eSbellard 69343b972b7SRichard Henderson void tcg_init(size_t tb_size, int splitwx, unsigned max_cpus) 694a76aabd3SRichard Henderson { 69543b972b7SRichard Henderson tcg_context_init(max_cpus); 69643b972b7SRichard Henderson tcg_region_init(tb_size, splitwx, max_cpus); 697a76aabd3SRichard Henderson } 698a76aabd3SRichard Henderson 6996e3b2bfdSEmilio G. Cota /* 7006e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 7016e3b2bfdSEmilio G. Cota * sure that TBs and code are on different cache lines. 7026e3b2bfdSEmilio G. Cota */ 7036e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 7046e3b2bfdSEmilio G. Cota { 7056e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 7066e3b2bfdSEmilio G. Cota TranslationBlock *tb; 7076e3b2bfdSEmilio G. Cota void *next; 7086e3b2bfdSEmilio G. Cota 709e8feb96fSEmilio G. Cota retry: 7106e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 7116e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 7126e3b2bfdSEmilio G. Cota 7136e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 714e8feb96fSEmilio G. Cota if (tcg_region_alloc(s)) { 7156e3b2bfdSEmilio G. Cota return NULL; 7166e3b2bfdSEmilio G. Cota } 717e8feb96fSEmilio G. Cota goto retry; 718e8feb96fSEmilio G. Cota } 719d73415a3SStefan Hajnoczi qatomic_set(&s->code_gen_ptr, next); 72057a26946SRichard Henderson s->data_gen_ptr = NULL; 7216e3b2bfdSEmilio G. 
Cota return tb; 7226e3b2bfdSEmilio G. Cota } 7236e3b2bfdSEmilio G. Cota 7249002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 7259002ec79SRichard Henderson { 726b0a0794aSRichard Henderson size_t prologue_size; 7278163b749SRichard Henderson 728b0a0794aSRichard Henderson s->code_ptr = s->code_gen_ptr; 729b0a0794aSRichard Henderson s->code_buf = s->code_gen_ptr; 7305b38ee31SRichard Henderson s->data_gen_ptr = NULL; 731b91ccb31SRichard Henderson 732b91ccb31SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 733b0a0794aSRichard Henderson tcg_qemu_tb_exec = (tcg_prologue_fn *)tcg_splitwx_to_rx(s->code_ptr); 734b91ccb31SRichard Henderson #endif 7358163b749SRichard Henderson 7365b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 7375b38ee31SRichard Henderson s->pool_labels = NULL; 7385b38ee31SRichard Henderson #endif 7395b38ee31SRichard Henderson 740653b87ebSRoman Bolshakov qemu_thread_jit_write(); 7418163b749SRichard Henderson /* Generate the prologue. */ 742b03cce8eSbellard tcg_target_qemu_prologue(s); 7435b38ee31SRichard Henderson 7445b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 7455b38ee31SRichard Henderson /* Allow the prologue to put e.g. guest_base into a pool entry. 
*/ 7465b38ee31SRichard Henderson { 7471768987bSRichard Henderson int result = tcg_out_pool_finalize(s); 7481768987bSRichard Henderson tcg_debug_assert(result == 0); 7495b38ee31SRichard Henderson } 7505b38ee31SRichard Henderson #endif 7515b38ee31SRichard Henderson 752b0a0794aSRichard Henderson prologue_size = tcg_current_code_size(s); 753b0a0794aSRichard Henderson 754df5d2b16SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 755b0a0794aSRichard Henderson flush_idcache_range((uintptr_t)tcg_splitwx_to_rx(s->code_buf), 756b0a0794aSRichard Henderson (uintptr_t)s->code_buf, prologue_size); 757df5d2b16SRichard Henderson #endif 7588163b749SRichard Henderson 759d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 760d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 761c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 76278b54858SRichard Henderson if (logfile) { 76378b54858SRichard Henderson fprintf(logfile, "PROLOGUE: [size=%zu]\n", prologue_size); 7645b38ee31SRichard Henderson if (s->data_gen_ptr) { 765b0a0794aSRichard Henderson size_t code_size = s->data_gen_ptr - s->code_gen_ptr; 7665b38ee31SRichard Henderson size_t data_size = prologue_size - code_size; 7675b38ee31SRichard Henderson size_t i; 7685b38ee31SRichard Henderson 76978b54858SRichard Henderson disas(logfile, s->code_gen_ptr, code_size); 7705b38ee31SRichard Henderson 7715b38ee31SRichard Henderson for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) { 7725b38ee31SRichard Henderson if (sizeof(tcg_target_ulong) == 8) { 77378b54858SRichard Henderson fprintf(logfile, 77478b54858SRichard Henderson "0x%08" PRIxPTR ": .quad 0x%016" PRIx64 "\n", 7755b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 7765b38ee31SRichard Henderson *(uint64_t *)(s->data_gen_ptr + i)); 7775b38ee31SRichard Henderson } else { 77878b54858SRichard Henderson fprintf(logfile, 77978b54858SRichard Henderson "0x%08" PRIxPTR ": .long 0x%08x\n", 7805b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 
7815b38ee31SRichard Henderson *(uint32_t *)(s->data_gen_ptr + i)); 7825b38ee31SRichard Henderson } 7835b38ee31SRichard Henderson } 7845b38ee31SRichard Henderson } else { 78578b54858SRichard Henderson disas(logfile, s->code_gen_ptr, prologue_size); 7865b38ee31SRichard Henderson } 78778b54858SRichard Henderson fprintf(logfile, "\n"); 788fc59d2d8SRobert Foley qemu_log_unlock(logfile); 789d6b64b2bSRichard Henderson } 79078b54858SRichard Henderson } 791d6b64b2bSRichard Henderson #endif 792cedbcb01SEmilio G. Cota 7936eea0434SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 7946eea0434SRichard Henderson /* 7956eea0434SRichard Henderson * Assert that goto_ptr is implemented completely, setting an epilogue. 7966eea0434SRichard Henderson * For tci, we use NULL as the signal to return from the interpreter, 7976eea0434SRichard Henderson * so skip this check. 7986eea0434SRichard Henderson */ 7998b5c2b62SRichard Henderson tcg_debug_assert(tcg_code_gen_epilogue != NULL); 8006eea0434SRichard Henderson #endif 801d1c74ab3SRichard Henderson 802d1c74ab3SRichard Henderson tcg_region_prologue_set(s); 803c896fe29Sbellard } 804c896fe29Sbellard 805c896fe29Sbellard void tcg_func_start(TCGContext *s) 806c896fe29Sbellard { 807c896fe29Sbellard tcg_pool_reset(s); 808c896fe29Sbellard s->nb_temps = s->nb_globals; 8090ec9eabcSRichard Henderson 8100ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. */ 8110ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 8120ec9eabcSRichard Henderson 813c0522136SRichard Henderson /* No constant temps have been previously allocated. 
*/ 814c0522136SRichard Henderson for (int i = 0; i < TCG_TYPE_COUNT; ++i) { 815c0522136SRichard Henderson if (s->const_table[i]) { 816c0522136SRichard Henderson g_hash_table_remove_all(s->const_table[i]); 817c0522136SRichard Henderson } 818c0522136SRichard Henderson } 819c0522136SRichard Henderson 820abebf925SRichard Henderson s->nb_ops = 0; 821c896fe29Sbellard s->nb_labels = 0; 822c896fe29Sbellard s->current_frame_offset = s->frame_start; 823c896fe29Sbellard 8240a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 8250a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 8260a209d4bSRichard Henderson #endif 8270a209d4bSRichard Henderson 82815fa08f8SRichard Henderson QTAILQ_INIT(&s->ops); 82915fa08f8SRichard Henderson QTAILQ_INIT(&s->free_ops); 830bef16ab4SRichard Henderson QSIMPLEQ_INIT(&s->labels); 831c896fe29Sbellard } 832c896fe29Sbellard 833ae30e866SRichard Henderson static TCGTemp *tcg_temp_alloc(TCGContext *s) 8347ca4b752SRichard Henderson { 8357ca4b752SRichard Henderson int n = s->nb_temps++; 836ae30e866SRichard Henderson 837ae30e866SRichard Henderson if (n >= TCG_MAX_TEMPS) { 838db6b7d0cSRichard Henderson tcg_raise_tb_overflow(s); 839ae30e866SRichard Henderson } 8407ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 8417ca4b752SRichard Henderson } 8427ca4b752SRichard Henderson 843ae30e866SRichard Henderson static TCGTemp *tcg_global_alloc(TCGContext *s) 8447ca4b752SRichard Henderson { 845fa477d25SRichard Henderson TCGTemp *ts; 846fa477d25SRichard Henderson 8477ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 848ae30e866SRichard Henderson tcg_debug_assert(s->nb_globals < TCG_MAX_TEMPS); 8497ca4b752SRichard Henderson s->nb_globals++; 850fa477d25SRichard Henderson ts = tcg_temp_alloc(s); 851ee17db83SRichard Henderson ts->kind = TEMP_GLOBAL; 852fa477d25SRichard Henderson 853fa477d25SRichard Henderson return ts; 854c896fe29Sbellard } 855c896fe29Sbellard 856085272b3SRichard Henderson static TCGTemp 
*tcg_global_reg_new_internal(TCGContext *s, TCGType type, 857b6638662SRichard Henderson TCGReg reg, const char *name) 858c896fe29Sbellard { 859c896fe29Sbellard TCGTemp *ts; 860c896fe29Sbellard 861b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 862c896fe29Sbellard tcg_abort(); 863b3a62939SRichard Henderson } 8647ca4b752SRichard Henderson 8657ca4b752SRichard Henderson ts = tcg_global_alloc(s); 866c896fe29Sbellard ts->base_type = type; 867c896fe29Sbellard ts->type = type; 868ee17db83SRichard Henderson ts->kind = TEMP_FIXED; 869c896fe29Sbellard ts->reg = reg; 870c896fe29Sbellard ts->name = name; 871c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 8727ca4b752SRichard Henderson 873085272b3SRichard Henderson return ts; 874a7812ae4Spbrook } 875a7812ae4Spbrook 876b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 877a7812ae4Spbrook { 878b3a62939SRichard Henderson s->frame_start = start; 879b3a62939SRichard Henderson s->frame_end = start + size; 880085272b3SRichard Henderson s->frame_temp 881085272b3SRichard Henderson = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 882b3a62939SRichard Henderson } 883a7812ae4Spbrook 884085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 885e1ccc054SRichard Henderson intptr_t offset, const char *name) 886c896fe29Sbellard { 887b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 888dc41aa7dSRichard Henderson TCGTemp *base_ts = tcgv_ptr_temp(base); 8897ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 890*aef85402SRichard Henderson int indirect_reg = 0; 891c896fe29Sbellard 892c0522136SRichard Henderson switch (base_ts->kind) { 893c0522136SRichard Henderson case TEMP_FIXED: 894c0522136SRichard Henderson break; 895c0522136SRichard Henderson case TEMP_GLOBAL: 8965a18407fSRichard Henderson /* We do not support double-indirect registers. 
*/ 8975a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 898b3915dbbSRichard Henderson base_ts->indirect_base = 1; 8995a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 9005a18407fSRichard Henderson ? 2 : 1); 9015a18407fSRichard Henderson indirect_reg = 1; 902c0522136SRichard Henderson break; 903c0522136SRichard Henderson default: 904c0522136SRichard Henderson g_assert_not_reached(); 905b3915dbbSRichard Henderson } 906b3915dbbSRichard Henderson 9077ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 9087ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 909c896fe29Sbellard char buf[64]; 9107ca4b752SRichard Henderson 9117ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 912c896fe29Sbellard ts->type = TCG_TYPE_I32; 913b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 914c896fe29Sbellard ts->mem_allocated = 1; 915b3a62939SRichard Henderson ts->mem_base = base_ts; 916*aef85402SRichard Henderson ts->mem_offset = offset; 917c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 918c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 919c896fe29Sbellard ts->name = strdup(buf); 920c896fe29Sbellard 9217ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 9227ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 9237ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 924b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 9257ca4b752SRichard Henderson ts2->mem_allocated = 1; 9267ca4b752SRichard Henderson ts2->mem_base = base_ts; 927*aef85402SRichard Henderson ts2->mem_offset = offset + 4; 928fac87bd2SRichard Henderson ts2->temp_subindex = 1; 929c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 930c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 931120c1084SRichard Henderson ts2->name = strdup(buf); 9327ca4b752SRichard Henderson } else { 933c896fe29Sbellard ts->base_type = type; 934c896fe29Sbellard ts->type = type; 935b3915dbbSRichard Henderson 
ts->indirect_reg = indirect_reg; 936c896fe29Sbellard ts->mem_allocated = 1; 937b3a62939SRichard Henderson ts->mem_base = base_ts; 938c896fe29Sbellard ts->mem_offset = offset; 939c896fe29Sbellard ts->name = name; 940c896fe29Sbellard } 941085272b3SRichard Henderson return ts; 942c896fe29Sbellard } 943c896fe29Sbellard 9445bfa8034SRichard Henderson TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local) 945c896fe29Sbellard { 946b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 947ee17db83SRichard Henderson TCGTempKind kind = temp_local ? TEMP_LOCAL : TEMP_NORMAL; 948c896fe29Sbellard TCGTemp *ts; 949641d5fbeSbellard int idx, k; 950c896fe29Sbellard 9510ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 9520ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 9530ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 9540ec9eabcSRichard Henderson /* There is already an available temp with the right type. */ 9550ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 9560ec9eabcSRichard Henderson 957e8996ee0Sbellard ts = &s->temps[idx]; 958e8996ee0Sbellard ts->temp_allocated = 1; 9597ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 960ee17db83SRichard Henderson tcg_debug_assert(ts->kind == kind); 961e8996ee0Sbellard } else { 9627ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 9637ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 9647ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 9657ca4b752SRichard Henderson 966c896fe29Sbellard ts->base_type = type; 967c896fe29Sbellard ts->type = TCG_TYPE_I32; 968e8996ee0Sbellard ts->temp_allocated = 1; 969ee17db83SRichard Henderson ts->kind = kind; 9707ca4b752SRichard Henderson 9717ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 9727ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 9737ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 9747ca4b752SRichard Henderson ts2->temp_allocated = 1; 
975fac87bd2SRichard Henderson ts2->temp_subindex = 1; 976ee17db83SRichard Henderson ts2->kind = kind; 9777ca4b752SRichard Henderson } else { 978c896fe29Sbellard ts->base_type = type; 979c896fe29Sbellard ts->type = type; 980e8996ee0Sbellard ts->temp_allocated = 1; 981ee17db83SRichard Henderson ts->kind = kind; 982c896fe29Sbellard } 983e8996ee0Sbellard } 98427bfd83cSPeter Maydell 98527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 98627bfd83cSPeter Maydell s->temps_in_use++; 98727bfd83cSPeter Maydell #endif 988085272b3SRichard Henderson return ts; 989c896fe29Sbellard } 990c896fe29Sbellard 991d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type) 992d2fd745fSRichard Henderson { 993d2fd745fSRichard Henderson TCGTemp *t; 994d2fd745fSRichard Henderson 995d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG 996d2fd745fSRichard Henderson switch (type) { 997d2fd745fSRichard Henderson case TCG_TYPE_V64: 998d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v64); 999d2fd745fSRichard Henderson break; 1000d2fd745fSRichard Henderson case TCG_TYPE_V128: 1001d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v128); 1002d2fd745fSRichard Henderson break; 1003d2fd745fSRichard Henderson case TCG_TYPE_V256: 1004d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v256); 1005d2fd745fSRichard Henderson break; 1006d2fd745fSRichard Henderson default: 1007d2fd745fSRichard Henderson g_assert_not_reached(); 1008d2fd745fSRichard Henderson } 1009d2fd745fSRichard Henderson #endif 1010d2fd745fSRichard Henderson 1011d2fd745fSRichard Henderson t = tcg_temp_new_internal(type, 0); 1012d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1013d2fd745fSRichard Henderson } 1014d2fd745fSRichard Henderson 1015d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp. 
*/ 1016d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match) 1017d2fd745fSRichard Henderson { 1018d2fd745fSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 1019d2fd745fSRichard Henderson 1020d2fd745fSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 1021d2fd745fSRichard Henderson 1022d2fd745fSRichard Henderson t = tcg_temp_new_internal(t->base_type, 0); 1023d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1024d2fd745fSRichard Henderson } 1025d2fd745fSRichard Henderson 10265bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts) 1027c896fe29Sbellard { 1028b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 1029085272b3SRichard Henderson int k, idx; 1030c896fe29Sbellard 1031c7482438SRichard Henderson switch (ts->kind) { 1032c7482438SRichard Henderson case TEMP_CONST: 1033c7482438SRichard Henderson /* 1034c7482438SRichard Henderson * In order to simplify users of tcg_constant_*, 1035c7482438SRichard Henderson * silently ignore free. 1036c7482438SRichard Henderson */ 1037c0522136SRichard Henderson return; 1038c7482438SRichard Henderson case TEMP_NORMAL: 1039c7482438SRichard Henderson case TEMP_LOCAL: 1040c7482438SRichard Henderson break; 1041c7482438SRichard Henderson default: 1042c7482438SRichard Henderson g_assert_not_reached(); 1043c0522136SRichard Henderson } 1044c0522136SRichard Henderson 104527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 104627bfd83cSPeter Maydell s->temps_in_use--; 104727bfd83cSPeter Maydell if (s->temps_in_use < 0) { 104827bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 104927bfd83cSPeter Maydell } 105027bfd83cSPeter Maydell #endif 105127bfd83cSPeter Maydell 1052eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 1053e8996ee0Sbellard ts->temp_allocated = 0; 10540ec9eabcSRichard Henderson 1055085272b3SRichard Henderson idx = temp_idx(ts); 1056ee17db83SRichard Henderson k = ts->base_type + (ts->kind == TEMP_NORMAL ? 
0 : TCG_TYPE_COUNT); 10570ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 1058e8996ee0Sbellard } 1059e8996ee0Sbellard 1060c0522136SRichard Henderson TCGTemp *tcg_constant_internal(TCGType type, int64_t val) 1061c0522136SRichard Henderson { 1062c0522136SRichard Henderson TCGContext *s = tcg_ctx; 1063c0522136SRichard Henderson GHashTable *h = s->const_table[type]; 1064c0522136SRichard Henderson TCGTemp *ts; 1065c0522136SRichard Henderson 1066c0522136SRichard Henderson if (h == NULL) { 1067c0522136SRichard Henderson h = g_hash_table_new(g_int64_hash, g_int64_equal); 1068c0522136SRichard Henderson s->const_table[type] = h; 1069c0522136SRichard Henderson } 1070c0522136SRichard Henderson 1071c0522136SRichard Henderson ts = g_hash_table_lookup(h, &val); 1072c0522136SRichard Henderson if (ts == NULL) { 1073*aef85402SRichard Henderson int64_t *val_ptr; 1074*aef85402SRichard Henderson 1075c0522136SRichard Henderson ts = tcg_temp_alloc(s); 1076c0522136SRichard Henderson 1077c0522136SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 1078c0522136SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 1079c0522136SRichard Henderson 1080*aef85402SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 1081*aef85402SRichard Henderson 1082c0522136SRichard Henderson ts->base_type = TCG_TYPE_I64; 1083c0522136SRichard Henderson ts->type = TCG_TYPE_I32; 1084c0522136SRichard Henderson ts->kind = TEMP_CONST; 1085c0522136SRichard Henderson ts->temp_allocated = 1; 1086c0522136SRichard Henderson 1087c0522136SRichard Henderson ts2->base_type = TCG_TYPE_I64; 1088c0522136SRichard Henderson ts2->type = TCG_TYPE_I32; 1089c0522136SRichard Henderson ts2->kind = TEMP_CONST; 1090c0522136SRichard Henderson ts2->temp_allocated = 1; 1091fac87bd2SRichard Henderson ts2->temp_subindex = 1; 1092*aef85402SRichard Henderson 1093*aef85402SRichard Henderson /* 1094*aef85402SRichard Henderson * Retain the full value of the 64-bit constant in the low 1095*aef85402SRichard Henderson * 
part, so that the hash table works. Actual uses will 1096*aef85402SRichard Henderson * truncate the value to the low part. 1097*aef85402SRichard Henderson */ 1098*aef85402SRichard Henderson ts[HOST_BIG_ENDIAN].val = val; 1099*aef85402SRichard Henderson ts[!HOST_BIG_ENDIAN].val = val >> 32; 1100*aef85402SRichard Henderson val_ptr = &ts[HOST_BIG_ENDIAN].val; 1101c0522136SRichard Henderson } else { 1102c0522136SRichard Henderson ts->base_type = type; 1103c0522136SRichard Henderson ts->type = type; 1104c0522136SRichard Henderson ts->kind = TEMP_CONST; 1105c0522136SRichard Henderson ts->temp_allocated = 1; 1106c0522136SRichard Henderson ts->val = val; 1107*aef85402SRichard Henderson val_ptr = &ts->val; 1108c0522136SRichard Henderson } 1109*aef85402SRichard Henderson g_hash_table_insert(h, val_ptr, ts); 1110c0522136SRichard Henderson } 1111c0522136SRichard Henderson 1112c0522136SRichard Henderson return ts; 1113c0522136SRichard Henderson } 1114c0522136SRichard Henderson 1115c0522136SRichard Henderson TCGv_vec tcg_constant_vec(TCGType type, unsigned vece, int64_t val) 1116c0522136SRichard Henderson { 1117c0522136SRichard Henderson val = dup_const(vece, val); 1118c0522136SRichard Henderson return temp_tcgv_vec(tcg_constant_internal(type, val)); 1119c0522136SRichard Henderson } 1120c0522136SRichard Henderson 112188d4005bSRichard Henderson TCGv_vec tcg_constant_vec_matching(TCGv_vec match, unsigned vece, int64_t val) 112288d4005bSRichard Henderson { 112388d4005bSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 112488d4005bSRichard Henderson 112588d4005bSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 112688d4005bSRichard Henderson return tcg_constant_vec(t->base_type, vece, val); 112788d4005bSRichard Henderson } 112888d4005bSRichard Henderson 1129a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 1130a7812ae4Spbrook { 1131a7812ae4Spbrook TCGv_i32 t0; 1132a7812ae4Spbrook t0 = tcg_temp_new_i32(); 1133e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 
1134e8996ee0Sbellard return t0; 1135c896fe29Sbellard } 1136c896fe29Sbellard 1137a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 1138c896fe29Sbellard { 1139a7812ae4Spbrook TCGv_i64 t0; 1140a7812ae4Spbrook t0 = tcg_temp_new_i64(); 1141e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 1142e8996ee0Sbellard return t0; 1143c896fe29Sbellard } 1144c896fe29Sbellard 1145a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 1146bdffd4a9Saurel32 { 1147a7812ae4Spbrook TCGv_i32 t0; 1148a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 1149bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 1150bdffd4a9Saurel32 return t0; 1151bdffd4a9Saurel32 } 1152bdffd4a9Saurel32 1153a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 1154bdffd4a9Saurel32 { 1155a7812ae4Spbrook TCGv_i64 t0; 1156a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 1157bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 1158bdffd4a9Saurel32 return t0; 1159bdffd4a9Saurel32 } 1160bdffd4a9Saurel32 116127bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 116227bfd83cSPeter Maydell void tcg_clear_temp_count(void) 116327bfd83cSPeter Maydell { 1164b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 116527bfd83cSPeter Maydell s->temps_in_use = 0; 116627bfd83cSPeter Maydell } 116727bfd83cSPeter Maydell 116827bfd83cSPeter Maydell int tcg_check_temp_count(void) 116927bfd83cSPeter Maydell { 1170b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 117127bfd83cSPeter Maydell if (s->temps_in_use) { 117227bfd83cSPeter Maydell /* Clear the count so that we don't give another 117327bfd83cSPeter Maydell * warning immediately next time around. 117427bfd83cSPeter Maydell */ 117527bfd83cSPeter Maydell s->temps_in_use = 0; 117627bfd83cSPeter Maydell return 1; 117727bfd83cSPeter Maydell } 117827bfd83cSPeter Maydell return 0; 117927bfd83cSPeter Maydell } 118027bfd83cSPeter Maydell #endif 118127bfd83cSPeter Maydell 1182be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream. 
1183be0f34b5SRichard Henderson Test the runtime variable that controls each opcode. */ 1184be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 1185be0f34b5SRichard Henderson { 1186d2fd745fSRichard Henderson const bool have_vec 1187d2fd745fSRichard Henderson = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256; 1188d2fd745fSRichard Henderson 1189be0f34b5SRichard Henderson switch (op) { 1190be0f34b5SRichard Henderson case INDEX_op_discard: 1191be0f34b5SRichard Henderson case INDEX_op_set_label: 1192be0f34b5SRichard Henderson case INDEX_op_call: 1193be0f34b5SRichard Henderson case INDEX_op_br: 1194be0f34b5SRichard Henderson case INDEX_op_mb: 1195be0f34b5SRichard Henderson case INDEX_op_insn_start: 1196be0f34b5SRichard Henderson case INDEX_op_exit_tb: 1197be0f34b5SRichard Henderson case INDEX_op_goto_tb: 1198f4e01e30SRichard Henderson case INDEX_op_goto_ptr: 1199be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 1200be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 1201be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 1202be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 1203be0f34b5SRichard Henderson return true; 1204be0f34b5SRichard Henderson 120507ce0b05SRichard Henderson case INDEX_op_qemu_st8_i32: 120607ce0b05SRichard Henderson return TCG_TARGET_HAS_qemu_st8_i32; 120707ce0b05SRichard Henderson 1208be0f34b5SRichard Henderson case INDEX_op_mov_i32: 1209be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 1210be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 1211be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 1212be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 1213be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 1214be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 1215be0f34b5SRichard Henderson case INDEX_op_ld_i32: 1216be0f34b5SRichard Henderson case INDEX_op_st8_i32: 1217be0f34b5SRichard Henderson case INDEX_op_st16_i32: 1218be0f34b5SRichard Henderson case INDEX_op_st_i32: 1219be0f34b5SRichard Henderson case 
INDEX_op_add_i32: 1220be0f34b5SRichard Henderson case INDEX_op_sub_i32: 1221be0f34b5SRichard Henderson case INDEX_op_mul_i32: 1222be0f34b5SRichard Henderson case INDEX_op_and_i32: 1223be0f34b5SRichard Henderson case INDEX_op_or_i32: 1224be0f34b5SRichard Henderson case INDEX_op_xor_i32: 1225be0f34b5SRichard Henderson case INDEX_op_shl_i32: 1226be0f34b5SRichard Henderson case INDEX_op_shr_i32: 1227be0f34b5SRichard Henderson case INDEX_op_sar_i32: 1228be0f34b5SRichard Henderson return true; 1229be0f34b5SRichard Henderson 1230be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 1231be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 1232be0f34b5SRichard Henderson case INDEX_op_div_i32: 1233be0f34b5SRichard Henderson case INDEX_op_divu_i32: 1234be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 1235be0f34b5SRichard Henderson case INDEX_op_rem_i32: 1236be0f34b5SRichard Henderson case INDEX_op_remu_i32: 1237be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 1238be0f34b5SRichard Henderson case INDEX_op_div2_i32: 1239be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 1240be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 1241be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 1242be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 1243be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 1244be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 1245be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 1246be0f34b5SRichard Henderson case INDEX_op_extract_i32: 1247be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 1248be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 1249be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 1250fce1296fSRichard Henderson case INDEX_op_extract2_i32: 1251fce1296fSRichard Henderson return TCG_TARGET_HAS_extract2_i32; 1252be0f34b5SRichard Henderson case INDEX_op_add2_i32: 1253be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 1254be0f34b5SRichard Henderson case 
INDEX_op_sub2_i32: 1255be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 1256be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 1257be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 1258be0f34b5SRichard Henderson case INDEX_op_muls2_i32: 1259be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 1260be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 1261be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 1262be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 1263be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 1264be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 1265be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 1266be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 1267be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 1268be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 1269be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 1270be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 1271be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 1272be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 1273be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 1274be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 1275be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 1276be0f34b5SRichard Henderson case INDEX_op_not_i32: 1277be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 1278be0f34b5SRichard Henderson case INDEX_op_neg_i32: 1279be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 1280be0f34b5SRichard Henderson case INDEX_op_andc_i32: 1281be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 1282be0f34b5SRichard Henderson case INDEX_op_orc_i32: 1283be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 1284be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 1285be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 1286be0f34b5SRichard Henderson case INDEX_op_nand_i32: 1287be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 
1288be0f34b5SRichard Henderson case INDEX_op_nor_i32: 1289be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 1290be0f34b5SRichard Henderson case INDEX_op_clz_i32: 1291be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i32; 1292be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 1293be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 1294be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 1295be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 1296be0f34b5SRichard Henderson 1297be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 1298be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 1299be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 1300be0f34b5SRichard Henderson 1301be0f34b5SRichard Henderson case INDEX_op_mov_i64: 1302be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 1303be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 1304be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 1305be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 1306be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 1307be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 1308be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 1309be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 1310be0f34b5SRichard Henderson case INDEX_op_ld_i64: 1311be0f34b5SRichard Henderson case INDEX_op_st8_i64: 1312be0f34b5SRichard Henderson case INDEX_op_st16_i64: 1313be0f34b5SRichard Henderson case INDEX_op_st32_i64: 1314be0f34b5SRichard Henderson case INDEX_op_st_i64: 1315be0f34b5SRichard Henderson case INDEX_op_add_i64: 1316be0f34b5SRichard Henderson case INDEX_op_sub_i64: 1317be0f34b5SRichard Henderson case INDEX_op_mul_i64: 1318be0f34b5SRichard Henderson case INDEX_op_and_i64: 1319be0f34b5SRichard Henderson case INDEX_op_or_i64: 1320be0f34b5SRichard Henderson case INDEX_op_xor_i64: 1321be0f34b5SRichard Henderson case INDEX_op_shl_i64: 1322be0f34b5SRichard Henderson case INDEX_op_shr_i64: 1323be0f34b5SRichard Henderson case INDEX_op_sar_i64: 1324be0f34b5SRichard 
Henderson case INDEX_op_ext_i32_i64: 1325be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 1326be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 1327be0f34b5SRichard Henderson 1328be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 1329be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 1330be0f34b5SRichard Henderson case INDEX_op_div_i64: 1331be0f34b5SRichard Henderson case INDEX_op_divu_i64: 1332be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 1333be0f34b5SRichard Henderson case INDEX_op_rem_i64: 1334be0f34b5SRichard Henderson case INDEX_op_remu_i64: 1335be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 1336be0f34b5SRichard Henderson case INDEX_op_div2_i64: 1337be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 1338be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 1339be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 1340be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 1341be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 1342be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 1343be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 1344be0f34b5SRichard Henderson case INDEX_op_extract_i64: 1345be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 1346be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 1347be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 1348fce1296fSRichard Henderson case INDEX_op_extract2_i64: 1349fce1296fSRichard Henderson return TCG_TARGET_HAS_extract2_i64; 1350be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 1351be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 1352be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 1353be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 1354be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 1355be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 1356be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 1357be0f34b5SRichard Henderson return 
TCG_TARGET_HAS_ext16s_i64; 1358be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 1359be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 1360be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 1361be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 1362be0f34b5SRichard Henderson case INDEX_op_ext16u_i64: 1363be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 1364be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 1365be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 1366be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 1367be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 1368be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 1369be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 1370be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 1371be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 1372be0f34b5SRichard Henderson case INDEX_op_not_i64: 1373be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 1374be0f34b5SRichard Henderson case INDEX_op_neg_i64: 1375be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 1376be0f34b5SRichard Henderson case INDEX_op_andc_i64: 1377be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 1378be0f34b5SRichard Henderson case INDEX_op_orc_i64: 1379be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 1380be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 1381be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 1382be0f34b5SRichard Henderson case INDEX_op_nand_i64: 1383be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 1384be0f34b5SRichard Henderson case INDEX_op_nor_i64: 1385be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 1386be0f34b5SRichard Henderson case INDEX_op_clz_i64: 1387be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 1388be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 1389be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 1390be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 
1391be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 1392be0f34b5SRichard Henderson case INDEX_op_add2_i64: 1393be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 1394be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 1395be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 1396be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 1397be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 1398be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 1399be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 1400be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 1401be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 1402be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 1403be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 1404be0f34b5SRichard Henderson 1405d2fd745fSRichard Henderson case INDEX_op_mov_vec: 1406d2fd745fSRichard Henderson case INDEX_op_dup_vec: 140737ee55a0SRichard Henderson case INDEX_op_dupm_vec: 1408d2fd745fSRichard Henderson case INDEX_op_ld_vec: 1409d2fd745fSRichard Henderson case INDEX_op_st_vec: 1410d2fd745fSRichard Henderson case INDEX_op_add_vec: 1411d2fd745fSRichard Henderson case INDEX_op_sub_vec: 1412d2fd745fSRichard Henderson case INDEX_op_and_vec: 1413d2fd745fSRichard Henderson case INDEX_op_or_vec: 1414d2fd745fSRichard Henderson case INDEX_op_xor_vec: 1415212be173SRichard Henderson case INDEX_op_cmp_vec: 1416d2fd745fSRichard Henderson return have_vec; 1417d2fd745fSRichard Henderson case INDEX_op_dup2_vec: 1418d2fd745fSRichard Henderson return have_vec && TCG_TARGET_REG_BITS == 32; 1419d2fd745fSRichard Henderson case INDEX_op_not_vec: 1420d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_not_vec; 1421d2fd745fSRichard Henderson case INDEX_op_neg_vec: 1422d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_neg_vec; 1423bcefc902SRichard Henderson case INDEX_op_abs_vec: 1424bcefc902SRichard Henderson return have_vec && TCG_TARGET_HAS_abs_vec; 1425d2fd745fSRichard Henderson 
case INDEX_op_andc_vec: 1426d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_andc_vec; 1427d2fd745fSRichard Henderson case INDEX_op_orc_vec: 1428d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_orc_vec; 1429ed523473SRichard Henderson case INDEX_op_nand_vec: 1430ed523473SRichard Henderson return have_vec && TCG_TARGET_HAS_nand_vec; 1431ed523473SRichard Henderson case INDEX_op_nor_vec: 1432ed523473SRichard Henderson return have_vec && TCG_TARGET_HAS_nor_vec; 1433ed523473SRichard Henderson case INDEX_op_eqv_vec: 1434ed523473SRichard Henderson return have_vec && TCG_TARGET_HAS_eqv_vec; 14353774030aSRichard Henderson case INDEX_op_mul_vec: 14363774030aSRichard Henderson return have_vec && TCG_TARGET_HAS_mul_vec; 1437d0ec9796SRichard Henderson case INDEX_op_shli_vec: 1438d0ec9796SRichard Henderson case INDEX_op_shri_vec: 1439d0ec9796SRichard Henderson case INDEX_op_sari_vec: 1440d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shi_vec; 1441d0ec9796SRichard Henderson case INDEX_op_shls_vec: 1442d0ec9796SRichard Henderson case INDEX_op_shrs_vec: 1443d0ec9796SRichard Henderson case INDEX_op_sars_vec: 1444d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shs_vec; 1445d0ec9796SRichard Henderson case INDEX_op_shlv_vec: 1446d0ec9796SRichard Henderson case INDEX_op_shrv_vec: 1447d0ec9796SRichard Henderson case INDEX_op_sarv_vec: 1448d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shv_vec; 1449b0f7e744SRichard Henderson case INDEX_op_rotli_vec: 1450b0f7e744SRichard Henderson return have_vec && TCG_TARGET_HAS_roti_vec; 145123850a74SRichard Henderson case INDEX_op_rotls_vec: 145223850a74SRichard Henderson return have_vec && TCG_TARGET_HAS_rots_vec; 14535d0ceda9SRichard Henderson case INDEX_op_rotlv_vec: 14545d0ceda9SRichard Henderson case INDEX_op_rotrv_vec: 14555d0ceda9SRichard Henderson return have_vec && TCG_TARGET_HAS_rotv_vec; 14568afaf050SRichard Henderson case INDEX_op_ssadd_vec: 14578afaf050SRichard Henderson case 
INDEX_op_usadd_vec: 14588afaf050SRichard Henderson case INDEX_op_sssub_vec: 14598afaf050SRichard Henderson case INDEX_op_ussub_vec: 14608afaf050SRichard Henderson return have_vec && TCG_TARGET_HAS_sat_vec; 1461dd0a0fcdSRichard Henderson case INDEX_op_smin_vec: 1462dd0a0fcdSRichard Henderson case INDEX_op_umin_vec: 1463dd0a0fcdSRichard Henderson case INDEX_op_smax_vec: 1464dd0a0fcdSRichard Henderson case INDEX_op_umax_vec: 1465dd0a0fcdSRichard Henderson return have_vec && TCG_TARGET_HAS_minmax_vec; 146638dc1294SRichard Henderson case INDEX_op_bitsel_vec: 146738dc1294SRichard Henderson return have_vec && TCG_TARGET_HAS_bitsel_vec; 1468f75da298SRichard Henderson case INDEX_op_cmpsel_vec: 1469f75da298SRichard Henderson return have_vec && TCG_TARGET_HAS_cmpsel_vec; 1470d2fd745fSRichard Henderson 1471db432672SRichard Henderson default: 1472db432672SRichard Henderson tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS); 1473db432672SRichard Henderson return true; 1474be0f34b5SRichard Henderson } 1475be0f34b5SRichard Henderson } 1476be0f34b5SRichard Henderson 147739cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 147839cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 147939cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 1480ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args) 1481c896fe29Sbellard { 148275e8b9b7SRichard Henderson int i, real_args, nb_rets, pi; 14833e92aa34SRichard Henderson unsigned typemask; 14843e92aa34SRichard Henderson const TCGHelperInfo *info; 148575e8b9b7SRichard Henderson TCGOp *op; 1486afb49896SRichard Henderson 1487619205fdSEmilio G. Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 14887319d83aSRichard Henderson typemask = info->typemask; 14892bece2c8SRichard Henderson 149038b47b19SEmilio G. Cota #ifdef CONFIG_PLUGIN 149138b47b19SEmilio G. Cota /* detect non-plugin helpers */ 149238b47b19SEmilio G. 
Cota if (tcg_ctx->plugin_insn && unlikely(strncmp(info->name, "plugin_", 7))) { 149338b47b19SEmilio G. Cota tcg_ctx->plugin_insn->calls_helpers = true; 149438b47b19SEmilio G. Cota } 149538b47b19SEmilio G. Cota #endif 149638b47b19SEmilio G. Cota 14973a5f6805SRichard Henderson #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 14982bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 14997319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 15007319d83aSRichard Henderson bool is_32bit = (argtype & ~1) == dh_typecode_i32; 15017319d83aSRichard Henderson bool is_signed = argtype & 1; 15027319d83aSRichard Henderson 15037319d83aSRichard Henderson if (is_32bit) { 15042bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 150518cf3d07SRichard Henderson TCGv_i32 orig = temp_tcgv_i32(args[i]); 15062bece2c8SRichard Henderson if (is_signed) { 150718cf3d07SRichard Henderson tcg_gen_ext_i32_i64(temp, orig); 15082bece2c8SRichard Henderson } else { 150918cf3d07SRichard Henderson tcg_gen_extu_i32_i64(temp, orig); 15102bece2c8SRichard Henderson } 1511ae8b75dcSRichard Henderson args[i] = tcgv_i64_temp(temp); 15122bece2c8SRichard Henderson } 15132bece2c8SRichard Henderson } 15142bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 15152bece2c8SRichard Henderson 151615fa08f8SRichard Henderson op = tcg_emit_op(INDEX_op_call); 151775e8b9b7SRichard Henderson 151875e8b9b7SRichard Henderson pi = 0; 1519ae8b75dcSRichard Henderson if (ret != NULL) { 15207319d83aSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (typemask & 6) == dh_typecode_i64) { 1521ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1522ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1523a7812ae4Spbrook nb_rets = 2; 152434b1a49cSRichard Henderson } else { 1525ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1526a7812ae4Spbrook nb_rets = 1; 1527a7812ae4Spbrook } 1528a7812ae4Spbrook } else { 1529a7812ae4Spbrook nb_rets = 0; 
1530a7812ae4Spbrook } 1531cd9090aaSRichard Henderson TCGOP_CALLO(op) = nb_rets; 153275e8b9b7SRichard Henderson 1533a7812ae4Spbrook real_args = 0; 1534a7812ae4Spbrook for (i = 0; i < nargs; i++) { 15357319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 15367319d83aSRichard Henderson bool is_64bit = (argtype & ~1) == dh_typecode_i64; 15377b7d8b2dSRichard Henderson bool want_align = false; 15387319d83aSRichard Henderson 15397b7d8b2dSRichard Henderson #if defined(CONFIG_TCG_INTERPRETER) 15407b7d8b2dSRichard Henderson /* 15417b7d8b2dSRichard Henderson * Align all arguments, so that they land in predictable places 15427b7d8b2dSRichard Henderson * for passing off to ffi_call. 15437b7d8b2dSRichard Henderson */ 15447b7d8b2dSRichard Henderson want_align = true; 15457b7d8b2dSRichard Henderson #elif defined(TCG_TARGET_CALL_ALIGN_ARGS) 15467b7d8b2dSRichard Henderson /* Some targets want aligned 64 bit args */ 15477b7d8b2dSRichard Henderson want_align = is_64bit; 15487b7d8b2dSRichard Henderson #endif 15497b7d8b2dSRichard Henderson 15507b7d8b2dSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && want_align && (real_args & 1)) { 155175e8b9b7SRichard Henderson op->args[pi++] = TCG_CALL_DUMMY_ARG; 1552ebd486d5Smalc real_args++; 155339cf05d3Sbellard } 15547b7d8b2dSRichard Henderson 15557b7d8b2dSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 1556*aef85402SRichard Henderson op->args[pi++] = temp_arg(args[i]); 1557*aef85402SRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1558a7812ae4Spbrook real_args += 2; 15592bece2c8SRichard Henderson continue; 15602bece2c8SRichard Henderson } 15612bece2c8SRichard Henderson 1562ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1563a7812ae4Spbrook real_args++; 1564c896fe29Sbellard } 156575e8b9b7SRichard Henderson op->args[pi++] = (uintptr_t)func; 15663e92aa34SRichard Henderson op->args[pi++] = (uintptr_t)info; 1567cd9090aaSRichard Henderson TCGOP_CALLI(op) = real_args; 1568a7812ae4Spbrook 
156975e8b9b7SRichard Henderson /* Make sure the fields didn't overflow. */ 1570cd9090aaSRichard Henderson tcg_debug_assert(TCGOP_CALLI(op) == real_args); 157175e8b9b7SRichard Henderson tcg_debug_assert(pi <= ARRAY_SIZE(op->args)); 15722bece2c8SRichard Henderson 15733a5f6805SRichard Henderson #if defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 15742bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 15757319d83aSRichard Henderson int argtype = extract32(typemask, (i + 1) * 3, 3); 15767319d83aSRichard Henderson bool is_32bit = (argtype & ~1) == dh_typecode_i32; 15777319d83aSRichard Henderson 15787319d83aSRichard Henderson if (is_32bit) { 1579085272b3SRichard Henderson tcg_temp_free_internal(args[i]); 15802bece2c8SRichard Henderson } 15812bece2c8SRichard Henderson } 15822bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1583a7812ae4Spbrook } 1584c896fe29Sbellard 15858fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1586c896fe29Sbellard { 1587ac3b8891SRichard Henderson int i, n; 1588ac3b8891SRichard Henderson 1589ee17db83SRichard Henderson for (i = 0, n = s->nb_temps; i < n; i++) { 1590ee17db83SRichard Henderson TCGTemp *ts = &s->temps[i]; 1591ee17db83SRichard Henderson TCGTempVal val = TEMP_VAL_MEM; 1592ee17db83SRichard Henderson 1593ee17db83SRichard Henderson switch (ts->kind) { 1594c0522136SRichard Henderson case TEMP_CONST: 1595c0522136SRichard Henderson val = TEMP_VAL_CONST; 1596c0522136SRichard Henderson break; 1597ee17db83SRichard Henderson case TEMP_FIXED: 1598ee17db83SRichard Henderson val = TEMP_VAL_REG; 1599ee17db83SRichard Henderson break; 1600ee17db83SRichard Henderson case TEMP_GLOBAL: 1601ee17db83SRichard Henderson break; 1602ee17db83SRichard Henderson case TEMP_NORMAL: 1603c7482438SRichard Henderson case TEMP_EBB: 1604ee17db83SRichard Henderson val = TEMP_VAL_DEAD; 1605ee17db83SRichard Henderson /* fall through */ 1606ee17db83SRichard Henderson case TEMP_LOCAL: 1607e8996ee0Sbellard ts->mem_allocated = 0; 
1608ee17db83SRichard Henderson break; 1609ee17db83SRichard Henderson default: 1610ee17db83SRichard Henderson g_assert_not_reached(); 1611ee17db83SRichard Henderson } 1612ee17db83SRichard Henderson ts->val_type = val; 1613e8996ee0Sbellard } 1614f8b2f202SRichard Henderson 1615f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1616c896fe29Sbellard } 1617c896fe29Sbellard 1618f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1619f8b2f202SRichard Henderson TCGTemp *ts) 1620c896fe29Sbellard { 16211807f4c4SRichard Henderson int idx = temp_idx(ts); 1622ac56dd48Spbrook 1623ee17db83SRichard Henderson switch (ts->kind) { 1624ee17db83SRichard Henderson case TEMP_FIXED: 1625ee17db83SRichard Henderson case TEMP_GLOBAL: 1626ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1627ee17db83SRichard Henderson break; 1628ee17db83SRichard Henderson case TEMP_LOCAL: 1629641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1630ee17db83SRichard Henderson break; 1631c7482438SRichard Henderson case TEMP_EBB: 1632c7482438SRichard Henderson snprintf(buf, buf_size, "ebb%d", idx - s->nb_globals); 1633c7482438SRichard Henderson break; 1634ee17db83SRichard Henderson case TEMP_NORMAL: 1635ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1636ee17db83SRichard Henderson break; 1637c0522136SRichard Henderson case TEMP_CONST: 1638c0522136SRichard Henderson switch (ts->type) { 1639c0522136SRichard Henderson case TCG_TYPE_I32: 1640c0522136SRichard Henderson snprintf(buf, buf_size, "$0x%x", (int32_t)ts->val); 1641c0522136SRichard Henderson break; 1642c0522136SRichard Henderson #if TCG_TARGET_REG_BITS > 32 1643c0522136SRichard Henderson case TCG_TYPE_I64: 1644c0522136SRichard Henderson snprintf(buf, buf_size, "$0x%" PRIx64, ts->val); 1645c0522136SRichard Henderson break; 1646c0522136SRichard Henderson #endif 1647c0522136SRichard Henderson case TCG_TYPE_V64: 1648c0522136SRichard Henderson case 
TCG_TYPE_V128: 1649c0522136SRichard Henderson case TCG_TYPE_V256: 1650c0522136SRichard Henderson snprintf(buf, buf_size, "v%d$0x%" PRIx64, 1651c0522136SRichard Henderson 64 << (ts->type - TCG_TYPE_V64), ts->val); 1652c0522136SRichard Henderson break; 1653c0522136SRichard Henderson default: 1654c0522136SRichard Henderson g_assert_not_reached(); 1655c0522136SRichard Henderson } 1656c0522136SRichard Henderson break; 1657c896fe29Sbellard } 1658c896fe29Sbellard return buf; 1659c896fe29Sbellard } 1660c896fe29Sbellard 166143439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf, 166243439139SRichard Henderson int buf_size, TCGArg arg) 1663f8b2f202SRichard Henderson { 166443439139SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg)); 1665f8b2f202SRichard Henderson } 1666f8b2f202SRichard Henderson 1667f48f3edeSblueswir1 static const char * const cond_name[] = 1668f48f3edeSblueswir1 { 16690aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 16700aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1671f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1672f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1673f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1674f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1675f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1676f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1677f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1678f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1679f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1680f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1681f48f3edeSblueswir1 }; 1682f48f3edeSblueswir1 1683f713d6adSRichard Henderson static const char * const ldst_name[] = 1684f713d6adSRichard Henderson { 1685f713d6adSRichard Henderson [MO_UB] = "ub", 1686f713d6adSRichard Henderson [MO_SB] = "sb", 1687f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1688f713d6adSRichard Henderson [MO_LESW] = "lesw", 1689f713d6adSRichard Henderson [MO_LEUL] = "leul", 1690f713d6adSRichard Henderson [MO_LESL] = "lesl", 1691fc313c64SFrédéric Pétrot 
[MO_LEUQ] = "leq", 1692f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1693f713d6adSRichard Henderson [MO_BESW] = "besw", 1694f713d6adSRichard Henderson [MO_BEUL] = "beul", 1695f713d6adSRichard Henderson [MO_BESL] = "besl", 1696fc313c64SFrédéric Pétrot [MO_BEUQ] = "beq", 1697f713d6adSRichard Henderson }; 1698f713d6adSRichard Henderson 16991f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 170052bf9771Stony.nguyen@bt.com #ifdef TARGET_ALIGNED_ONLY 17011f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "un+", 17021f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 17031f00b27fSSergey Sorokin #else 17041f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 17051f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 17061f00b27fSSergey Sorokin #endif 17071f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 17081f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 17091f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 17101f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 17111f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 17121f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 17131f00b27fSSergey Sorokin }; 17141f00b27fSSergey Sorokin 1715587195bdSRichard Henderson static const char bswap_flag_name[][6] = { 1716587195bdSRichard Henderson [TCG_BSWAP_IZ] = "iz", 1717587195bdSRichard Henderson [TCG_BSWAP_OZ] = "oz", 1718587195bdSRichard Henderson [TCG_BSWAP_OS] = "os", 1719587195bdSRichard Henderson [TCG_BSWAP_IZ | TCG_BSWAP_OZ] = "iz,oz", 1720587195bdSRichard Henderson [TCG_BSWAP_IZ | TCG_BSWAP_OS] = "iz,os", 1721587195bdSRichard Henderson }; 1722587195bdSRichard Henderson 1723b016486eSRichard Henderson static inline bool tcg_regset_single(TCGRegSet d) 1724b016486eSRichard Henderson { 1725b016486eSRichard Henderson return (d & (d - 1)) == 0; 1726b016486eSRichard Henderson } 1727b016486eSRichard Henderson 1728b016486eSRichard Henderson static inline TCGReg 
tcg_regset_first(TCGRegSet d) 1729b016486eSRichard Henderson { 1730b016486eSRichard Henderson if (TCG_TARGET_NB_REGS <= 32) { 1731b016486eSRichard Henderson return ctz32(d); 1732b016486eSRichard Henderson } else { 1733b016486eSRichard Henderson return ctz64(d); 1734b016486eSRichard Henderson } 1735b016486eSRichard Henderson } 1736b016486eSRichard Henderson 1737b7a83ff8SRichard Henderson /* Return only the number of characters output -- no error return. */ 1738b7a83ff8SRichard Henderson #define ne_fprintf(...) \ 1739b7a83ff8SRichard Henderson ({ int ret_ = fprintf(__VA_ARGS__); ret_ >= 0 ? ret_ : 0; }) 1740b7a83ff8SRichard Henderson 1741b7a83ff8SRichard Henderson static void tcg_dump_ops(TCGContext *s, FILE *f, bool have_prefs) 1742c896fe29Sbellard { 1743c896fe29Sbellard char buf[128]; 1744c45cb8bbSRichard Henderson TCGOp *op; 1745c896fe29Sbellard 174615fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 1747c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1748c45cb8bbSRichard Henderson const TCGOpDef *def; 1749c45cb8bbSRichard Henderson TCGOpcode c; 1750bdfb460eSRichard Henderson int col = 0; 1751c45cb8bbSRichard Henderson 1752c45cb8bbSRichard Henderson c = op->opc; 1753c896fe29Sbellard def = &tcg_op_defs[c]; 1754c45cb8bbSRichard Henderson 1755765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 1756b016486eSRichard Henderson nb_oargs = 0; 1757b7a83ff8SRichard Henderson col += ne_fprintf(f, "\n ----"); 17589aef40edSRichard Henderson 17599aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 17609aef40edSRichard Henderson target_ulong a; 17617e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 1762efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 17637e4597d7Sbellard #else 1764efee3746SRichard Henderson a = op->args[i]; 17657e4597d7Sbellard #endif 1766b7a83ff8SRichard Henderson col += ne_fprintf(f, " " TARGET_FMT_lx, a); 1767eeacee4dSBlue Swirl } 17687e4597d7Sbellard } 
else if (c == INDEX_op_call) { 17693e92aa34SRichard Henderson const TCGHelperInfo *info = tcg_call_info(op); 1770fa52e660SRichard Henderson void *func = tcg_call_func(op); 17713e92aa34SRichard Henderson 1772c896fe29Sbellard /* variable number of arguments */ 1773cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 1774cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 1775c896fe29Sbellard nb_cargs = def->nb_cargs; 1776b03cce8eSbellard 1777b7a83ff8SRichard Henderson col += ne_fprintf(f, " %s ", def->name); 17783e92aa34SRichard Henderson 17793e92aa34SRichard Henderson /* 17803e92aa34SRichard Henderson * Print the function name from TCGHelperInfo, if available. 17813e92aa34SRichard Henderson * Note that plugins have a template function for the info, 17823e92aa34SRichard Henderson * but the actual function pointer comes from the plugin. 17833e92aa34SRichard Henderson */ 17843e92aa34SRichard Henderson if (func == info->func) { 1785b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s", info->name); 17863e92aa34SRichard Henderson } else { 1787b7a83ff8SRichard Henderson col += ne_fprintf(f, "plugin(%p)", func); 17883e92aa34SRichard Henderson } 17893e92aa34SRichard Henderson 1790b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%x,$%d", info->flags, nb_oargs); 1791b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 1792b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", tcg_get_arg_str(s, buf, sizeof(buf), 1793efee3746SRichard Henderson op->args[i])); 1794b03cce8eSbellard } 1795cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1796efee3746SRichard Henderson TCGArg arg = op->args[nb_oargs + i]; 1797cf066674SRichard Henderson const char *t = "<dummy>"; 1798cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 179943439139SRichard Henderson t = tcg_get_arg_str(s, buf, sizeof(buf), arg); 1800b03cce8eSbellard } 1801b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", t); 1802e8996ee0Sbellard } 1803b03cce8eSbellard } else { 1804b7a83ff8SRichard 
Henderson col += ne_fprintf(f, " %s ", def->name); 1805c45cb8bbSRichard Henderson 1806c896fe29Sbellard nb_oargs = def->nb_oargs; 1807c896fe29Sbellard nb_iargs = def->nb_iargs; 1808c896fe29Sbellard nb_cargs = def->nb_cargs; 1809c896fe29Sbellard 1810d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 1811b7a83ff8SRichard Henderson col += ne_fprintf(f, "v%d,e%d,", 64 << TCGOP_VECL(op), 1812d2fd745fSRichard Henderson 8 << TCGOP_VECE(op)); 1813d2fd745fSRichard Henderson } 1814d2fd745fSRichard Henderson 1815c896fe29Sbellard k = 0; 1816c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1817b7a83ff8SRichard Henderson const char *sep = k ? "," : ""; 1818b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s%s", sep, 1819b7a83ff8SRichard Henderson tcg_get_arg_str(s, buf, sizeof(buf), 1820efee3746SRichard Henderson op->args[k++])); 1821c896fe29Sbellard } 1822c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1823b7a83ff8SRichard Henderson const char *sep = k ? "," : ""; 1824b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s%s", sep, 1825b7a83ff8SRichard Henderson tcg_get_arg_str(s, buf, sizeof(buf), 1826efee3746SRichard Henderson op->args[k++])); 1827c896fe29Sbellard } 1828be210acbSRichard Henderson switch (c) { 1829be210acbSRichard Henderson case INDEX_op_brcond_i32: 1830ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1831ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1832be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1833be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1834ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1835be210acbSRichard Henderson case INDEX_op_setcond_i64: 1836ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1837212be173SRichard Henderson case INDEX_op_cmp_vec: 1838f75da298SRichard Henderson case INDEX_op_cmpsel_vec: 1839efee3746SRichard Henderson if (op->args[k] < ARRAY_SIZE(cond_name) 1840efee3746SRichard Henderson && cond_name[op->args[k]]) { 1841b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", 
cond_name[op->args[k++]]); 1842eeacee4dSBlue Swirl } else { 1843b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%" TCG_PRIlx, op->args[k++]); 1844eeacee4dSBlue Swirl } 1845f48f3edeSblueswir1 i = 1; 1846be210acbSRichard Henderson break; 1847f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1848f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 184907ce0b05SRichard Henderson case INDEX_op_qemu_st8_i32: 1850f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 1851f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 185259227d5dSRichard Henderson { 18539002ffcbSRichard Henderson MemOpIdx oi = op->args[k++]; 185414776ab5STony Nguyen MemOp op = get_memop(oi); 185559227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 185659227d5dSRichard Henderson 185759c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 1858b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%x,%u", op, ix); 185959c4b7e8SRichard Henderson } else { 18601f00b27fSSergey Sorokin const char *s_al, *s_op; 18611f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 186259c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 1863b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s%s,%u", s_al, s_op, ix); 1864f713d6adSRichard Henderson } 1865f713d6adSRichard Henderson i = 1; 186659227d5dSRichard Henderson } 1867f713d6adSRichard Henderson break; 1868587195bdSRichard Henderson case INDEX_op_bswap16_i32: 1869587195bdSRichard Henderson case INDEX_op_bswap16_i64: 1870587195bdSRichard Henderson case INDEX_op_bswap32_i32: 1871587195bdSRichard Henderson case INDEX_op_bswap32_i64: 1872587195bdSRichard Henderson case INDEX_op_bswap64_i64: 1873587195bdSRichard Henderson { 1874587195bdSRichard Henderson TCGArg flags = op->args[k]; 1875587195bdSRichard Henderson const char *name = NULL; 1876587195bdSRichard Henderson 1877587195bdSRichard Henderson if (flags < ARRAY_SIZE(bswap_flag_name)) { 1878587195bdSRichard Henderson name = bswap_flag_name[flags]; 
1879587195bdSRichard Henderson } 1880587195bdSRichard Henderson if (name) { 1881b7a83ff8SRichard Henderson col += ne_fprintf(f, ",%s", name); 1882587195bdSRichard Henderson } else { 1883b7a83ff8SRichard Henderson col += ne_fprintf(f, ",$0x%" TCG_PRIlx, flags); 1884587195bdSRichard Henderson } 1885587195bdSRichard Henderson i = k = 1; 1886587195bdSRichard Henderson } 1887587195bdSRichard Henderson break; 1888be210acbSRichard Henderson default: 1889f48f3edeSblueswir1 i = 0; 1890be210acbSRichard Henderson break; 1891be210acbSRichard Henderson } 189251e3972cSRichard Henderson switch (c) { 189351e3972cSRichard Henderson case INDEX_op_set_label: 189451e3972cSRichard Henderson case INDEX_op_br: 189551e3972cSRichard Henderson case INDEX_op_brcond_i32: 189651e3972cSRichard Henderson case INDEX_op_brcond_i64: 189751e3972cSRichard Henderson case INDEX_op_brcond2_i32: 1898b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s$L%d", k ? "," : "", 1899efee3746SRichard Henderson arg_label(op->args[k])->id); 190051e3972cSRichard Henderson i++, k++; 190151e3972cSRichard Henderson break; 190251e3972cSRichard Henderson default: 190351e3972cSRichard Henderson break; 1904eeacee4dSBlue Swirl } 190551e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 1906b7a83ff8SRichard Henderson col += ne_fprintf(f, "%s$0x%" TCG_PRIlx, k ? 
"," : "", 1907b7a83ff8SRichard Henderson op->args[k]); 1908bdfb460eSRichard Henderson } 1909bdfb460eSRichard Henderson } 1910bdfb460eSRichard Henderson 19111894f69aSRichard Henderson if (have_prefs || op->life) { 19121894f69aSRichard Henderson for (; col < 40; ++col) { 1913b7a83ff8SRichard Henderson putc(' ', f); 1914bdfb460eSRichard Henderson } 19151894f69aSRichard Henderson } 19161894f69aSRichard Henderson 19171894f69aSRichard Henderson if (op->life) { 19181894f69aSRichard Henderson unsigned life = op->life; 1919bdfb460eSRichard Henderson 1920bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 1921b7a83ff8SRichard Henderson ne_fprintf(f, " sync:"); 1922bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 1923bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 1924b7a83ff8SRichard Henderson ne_fprintf(f, " %d", i); 1925bdfb460eSRichard Henderson } 1926bdfb460eSRichard Henderson } 1927bdfb460eSRichard Henderson } 1928bdfb460eSRichard Henderson life /= DEAD_ARG; 1929bdfb460eSRichard Henderson if (life) { 1930b7a83ff8SRichard Henderson ne_fprintf(f, " dead:"); 1931bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 1932bdfb460eSRichard Henderson if (life & 1) { 1933b7a83ff8SRichard Henderson ne_fprintf(f, " %d", i); 1934bdfb460eSRichard Henderson } 1935bdfb460eSRichard Henderson } 1936c896fe29Sbellard } 1937b03cce8eSbellard } 19381894f69aSRichard Henderson 19391894f69aSRichard Henderson if (have_prefs) { 19401894f69aSRichard Henderson for (i = 0; i < nb_oargs; ++i) { 19411894f69aSRichard Henderson TCGRegSet set = op->output_pref[i]; 19421894f69aSRichard Henderson 19431894f69aSRichard Henderson if (i == 0) { 1944b7a83ff8SRichard Henderson ne_fprintf(f, " pref="); 19451894f69aSRichard Henderson } else { 1946b7a83ff8SRichard Henderson ne_fprintf(f, ","); 19471894f69aSRichard Henderson } 19481894f69aSRichard Henderson if (set == 0) { 1949b7a83ff8SRichard Henderson ne_fprintf(f, "none"); 19501894f69aSRichard Henderson } else if (set == 
MAKE_64BIT_MASK(0, TCG_TARGET_NB_REGS)) { 1951b7a83ff8SRichard Henderson ne_fprintf(f, "all"); 19521894f69aSRichard Henderson #ifdef CONFIG_DEBUG_TCG 19531894f69aSRichard Henderson } else if (tcg_regset_single(set)) { 19541894f69aSRichard Henderson TCGReg reg = tcg_regset_first(set); 1955b7a83ff8SRichard Henderson ne_fprintf(f, "%s", tcg_target_reg_names[reg]); 19561894f69aSRichard Henderson #endif 19571894f69aSRichard Henderson } else if (TCG_TARGET_NB_REGS <= 32) { 1958b7a83ff8SRichard Henderson ne_fprintf(f, "0x%x", (uint32_t)set); 19591894f69aSRichard Henderson } else { 1960b7a83ff8SRichard Henderson ne_fprintf(f, "0x%" PRIx64, (uint64_t)set); 19611894f69aSRichard Henderson } 19621894f69aSRichard Henderson } 19631894f69aSRichard Henderson } 19641894f69aSRichard Henderson 1965b7a83ff8SRichard Henderson putc('\n', f); 1966c896fe29Sbellard } 1967c896fe29Sbellard } 1968c896fe29Sbellard 1969c896fe29Sbellard /* we give more priority to constraints with less registers */ 1970c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 1971c896fe29Sbellard { 197274a11790SRichard Henderson const TCGArgConstraint *arg_ct = &def->args_ct[k]; 197329f5e925SRichard Henderson int n = ctpop64(arg_ct->regs); 1974c896fe29Sbellard 197529f5e925SRichard Henderson /* 197629f5e925SRichard Henderson * Sort constraints of a single register first, which includes output 197729f5e925SRichard Henderson * aliases (which must exactly match the input already allocated). 197829f5e925SRichard Henderson */ 197929f5e925SRichard Henderson if (n == 1 || arg_ct->oalias) { 198029f5e925SRichard Henderson return INT_MAX; 1981c896fe29Sbellard } 198229f5e925SRichard Henderson 198329f5e925SRichard Henderson /* 198429f5e925SRichard Henderson * Sort register pairs next, first then second immediately after. 198529f5e925SRichard Henderson * Arbitrarily sort multiple pairs by the index of the first reg; 198629f5e925SRichard Henderson * there shouldn't be many pairs. 
198729f5e925SRichard Henderson */ 198829f5e925SRichard Henderson switch (arg_ct->pair) { 198929f5e925SRichard Henderson case 1: 199029f5e925SRichard Henderson case 3: 199129f5e925SRichard Henderson return (k + 1) * 2; 199229f5e925SRichard Henderson case 2: 199329f5e925SRichard Henderson return (arg_ct->pair_index + 1) * 2 - 1; 199429f5e925SRichard Henderson } 199529f5e925SRichard Henderson 199629f5e925SRichard Henderson /* Finally, sort by decreasing register count. */ 199729f5e925SRichard Henderson assert(n > 1); 199829f5e925SRichard Henderson return -n; 1999c896fe29Sbellard } 2000c896fe29Sbellard 2001c896fe29Sbellard /* sort from highest priority to lowest */ 2002c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 2003c896fe29Sbellard { 200466792f90SRichard Henderson int i, j; 200566792f90SRichard Henderson TCGArgConstraint *a = def->args_ct; 2006c896fe29Sbellard 200766792f90SRichard Henderson for (i = 0; i < n; i++) { 200866792f90SRichard Henderson a[start + i].sort_index = start + i; 200966792f90SRichard Henderson } 201066792f90SRichard Henderson if (n <= 1) { 2011c896fe29Sbellard return; 201266792f90SRichard Henderson } 2013c896fe29Sbellard for (i = 0; i < n - 1; i++) { 2014c896fe29Sbellard for (j = i + 1; j < n; j++) { 201566792f90SRichard Henderson int p1 = get_constraint_priority(def, a[start + i].sort_index); 201666792f90SRichard Henderson int p2 = get_constraint_priority(def, a[start + j].sort_index); 2017c896fe29Sbellard if (p1 < p2) { 201866792f90SRichard Henderson int tmp = a[start + i].sort_index; 201966792f90SRichard Henderson a[start + i].sort_index = a[start + j].sort_index; 202066792f90SRichard Henderson a[start + j].sort_index = tmp; 2021c896fe29Sbellard } 2022c896fe29Sbellard } 2023c896fe29Sbellard } 2024c896fe29Sbellard } 2025c896fe29Sbellard 2026f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 2027c896fe29Sbellard { 2028a9751609SRichard Henderson TCGOpcode op; 2029c896fe29Sbellard 
/*
 * Fill in def->args_ct[] for every entry of tcg_op_defs[] from the
 * constraint strings selected by tcg_target_op_def().
 *
 * Opcodes flagged TCG_OPF_NOT_PRESENT, and opcodes with no input or
 * output arguments, are skipped.  For the rest, each argument's string
 * is parsed as follows:
 *   '0'..'9'  the input aliases the output with that index;
 *   '&'       the output is marked newreg; the rest of the string is
 *             then parsed as ordinary constraint letters;
 *   'p'       the argument forms a pair with the previous argument and
 *             uses that argument's register set shifted left by one;
 *   'm'       likewise, with the register set shifted right by one;
 *   'i'       TCG_CT_CONST is accepted;
 *   others    as defined by tcg-target-con-str.h.
 * Digits, 'p' and 'm' must be the whole string.  Afterwards, pairs that
 * were copied through an output alias are fixed up, and the output and
 * input constraints are sorted separately.
 *
 * The parameter S is not referenced by this function body.
 */
static void process_op_defs(TCGContext *s)
{
    TCGOpcode op;

    for (op = 0; op < NB_OPS; op++) {
        TCGOpDef *def = &tcg_op_defs[op];
        const TCGTargetOpDef *tdefs;
        bool saw_alias_pair = false;
        int i, o, i2, o2, nb_args;

        if (def->flags & TCG_OPF_NOT_PRESENT) {
            continue;
        }

        nb_args = def->nb_iargs + def->nb_oargs;
        if (nb_args == 0) {
            continue;
        }

        /*
         * Macro magic should make it impossible, but double-check that
         * the array index is in range.  Since the signedness of an enum
         * is implementation defined, force the result to unsigned.
         */
        unsigned con_set = tcg_target_op_def(op);
        tcg_debug_assert(con_set < ARRAY_SIZE(constraint_sets));
        tdefs = &constraint_sets[con_set];

        for (i = 0; i < nb_args; i++) {
            const char *ct_str = tdefs->args_ct_str[i];
            /* Outputs occupy indices [0, nb_oargs); inputs follow. */
            bool input_p = i >= def->nb_oargs;

            /* Incomplete TCGTargetOpDef entry. */
            tcg_debug_assert(ct_str != NULL);

            /*
             * First character: handle the prefixes that either consume
             * the whole string ('0'-'9', 'p', 'm' -- these "continue"
             * to the next argument) or modify the remainder ('&').
             */
            switch (*ct_str) {
            case '0' ... '9':
                o = *ct_str - '0';
                tcg_debug_assert(input_p);
                tcg_debug_assert(o < def->nb_oargs);
                tcg_debug_assert(def->args_ct[o].regs != 0);
                tcg_debug_assert(!def->args_ct[o].oalias);
                /* The input inherits the whole constraint of the output. */
                def->args_ct[i] = def->args_ct[o];
                /* The output sets oalias.  */
                def->args_ct[o].oalias = 1;
                def->args_ct[o].alias_index = i;
                /* The input sets ialias. */
                def->args_ct[i].ialias = 1;
                def->args_ct[i].alias_index = o;
                /* The copy above may have brought pair info with it. */
                if (def->args_ct[i].pair) {
                    saw_alias_pair = true;
                }
                tcg_debug_assert(ct_str[1] == '\0');
                continue;

            case '&':
                tcg_debug_assert(!input_p);
                def->args_ct[i].newreg = true;
                ct_str++;
                break;

            case 'p': /* plus */
                /* Allocate to the register after the previous. */
                tcg_debug_assert(i > (input_p ? def->nb_oargs : 0));
                o = i - 1;
                tcg_debug_assert(!def->args_ct[o].pair);
                tcg_debug_assert(!def->args_ct[o].ct);
                def->args_ct[i] = (TCGArgConstraint){
                    .pair = 2,
                    .pair_index = o,
                    .regs = def->args_ct[o].regs << 1,
                };
                def->args_ct[o].pair = 1;
                def->args_ct[o].pair_index = i;
                tcg_debug_assert(ct_str[1] == '\0');
                continue;

            case 'm': /* minus */
                /* Allocate to the register before the previous. */
                tcg_debug_assert(i > (input_p ? def->nb_oargs : 0));
                o = i - 1;
                tcg_debug_assert(!def->args_ct[o].pair);
                tcg_debug_assert(!def->args_ct[o].ct);
                def->args_ct[i] = (TCGArgConstraint){
                    .pair = 1,
                    .pair_index = o,
                    .regs = def->args_ct[o].regs >> 1,
                };
                def->args_ct[o].pair = 2;
                def->args_ct[o].pair_index = i;
                tcg_debug_assert(ct_str[1] == '\0');
                continue;
            }

            /* Remaining characters each OR in a const flag or a regset. */
            do {
                switch (*ct_str) {
                case 'i':
                    def->args_ct[i].ct |= TCG_CT_CONST;
                    break;

                /* Include all of the target-specific constraints. */

#undef CONST
#define CONST(CASE, MASK) \
    case CASE: def->args_ct[i].ct |= MASK; break;
#define REGS(CASE, MASK) \
    case CASE: def->args_ct[i].regs |= MASK; break;

#include "tcg-target-con-str.h"

#undef REGS
#undef CONST
                default:
                case '0' ... '9':
                case '&':
                case 'p':
                case 'm':
                    /* Typo in TCGTargetOpDef constraint. */
                    g_assert_not_reached();
                }
            } while (*++ct_str != '\0');
        }

        /* TCGTargetOpDef entry with too much information? */
        tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL);

        /*
         * Fix up output pairs that are aliased with inputs.
         * When we created the alias, we copied pair from the output.
         * There are three cases:
         *    (1a) Pairs of inputs alias pairs of outputs.
         *    (1b) One input aliases the first of a pair of outputs.
         *    (2)  One input aliases the second of a pair of outputs.
         *
         * Case 1a is handled by making sure that the pair_index'es are
         * properly updated so that they appear the same as a pair of inputs.
         *
         * Case 1b is handled by setting the pair_index of the input to
         * itself, simply so it doesn't point to an unrelated argument.
         * Since we don't encounter the "second" during the input allocation
         * phase, nothing happens with the second half of the input pair.
         *
         * Case 2 is handled by setting the second input to pair=3, the
         * first output to pair=3, and the pair_index'es to match.
         */
        if (saw_alias_pair) {
            for (i = def->nb_oargs; i < nb_args; i++) {
                /*
                 * Since [0-9pm] must be alone in the constraint string,
                 * the only way they can both be set is if the pair comes
                 * from the output alias.
                 */
                if (!def->args_ct[i].ialias) {
                    continue;
                }
                switch (def->args_ct[i].pair) {
                case 0:
                    break;
                case 1:
                    /* Input I aliases output O, the first of pair (O, O2). */
                    o = def->args_ct[i].alias_index;
                    o2 = def->args_ct[o].pair_index;
                    tcg_debug_assert(def->args_ct[o].pair == 1);
                    tcg_debug_assert(def->args_ct[o2].pair == 2);
                    if (def->args_ct[o2].oalias) {
                        /* Case 1a */
                        i2 = def->args_ct[o2].alias_index;
                        tcg_debug_assert(def->args_ct[i2].pair == 2);
                        def->args_ct[i2].pair_index = i;
                        def->args_ct[i].pair_index = i2;
                    } else {
                        /* Case 1b */
                        def->args_ct[i].pair_index = i;
                    }
                    break;
                case 2:
                    /* Input I aliases output O, the second of pair (O2, O). */
                    o = def->args_ct[i].alias_index;
                    o2 = def->args_ct[o].pair_index;
                    tcg_debug_assert(def->args_ct[o].pair == 2);
                    tcg_debug_assert(def->args_ct[o2].pair == 1);
                    if (def->args_ct[o2].oalias) {
                        /* Case 1a */
                        i2 = def->args_ct[o2].alias_index;
                        tcg_debug_assert(def->args_ct[i2].pair == 1);
                        def->args_ct[i2].pair_index = i;
                        def->args_ct[i].pair_index = i2;
                    } else {
                        /* Case 2 */
                        def->args_ct[i].pair = 3;
                        def->args_ct[o2].pair = 3;
                        def->args_ct[i].pair_index = o2;
                        def->args_ct[o2].pair_index = i;
                    }
                    break;
                default:
                    g_assert_not_reached();
                }
            }
        }

        /* sort the constraints (XXX: this is just a heuristic) */
        sort_constraints(def, 0, def->nb_oargs);
        sort_constraints(def, def->nb_oargs, def->nb_iargs);
    }
}
QTAILQ_INSERT_TAIL(&s->free_ops, op, link); 2255abebf925SRichard Henderson s->nb_ops--; 22560c627cdcSRichard Henderson 22570c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 2258d73415a3SStefan Hajnoczi qatomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1); 22590c627cdcSRichard Henderson #endif 22600c627cdcSRichard Henderson } 22610c627cdcSRichard Henderson 2262a80cdd31SRichard Henderson void tcg_remove_ops_after(TCGOp *op) 2263a80cdd31SRichard Henderson { 2264a80cdd31SRichard Henderson TCGContext *s = tcg_ctx; 2265a80cdd31SRichard Henderson 2266a80cdd31SRichard Henderson while (true) { 2267a80cdd31SRichard Henderson TCGOp *last = tcg_last_op(); 2268a80cdd31SRichard Henderson if (last == op) { 2269a80cdd31SRichard Henderson return; 2270a80cdd31SRichard Henderson } 2271a80cdd31SRichard Henderson tcg_op_remove(s, last); 2272a80cdd31SRichard Henderson } 2273a80cdd31SRichard Henderson } 2274a80cdd31SRichard Henderson 227515fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc) 227615fa08f8SRichard Henderson { 227715fa08f8SRichard Henderson TCGContext *s = tcg_ctx; 227815fa08f8SRichard Henderson TCGOp *op; 227915fa08f8SRichard Henderson 228015fa08f8SRichard Henderson if (likely(QTAILQ_EMPTY(&s->free_ops))) { 228115fa08f8SRichard Henderson op = tcg_malloc(sizeof(TCGOp)); 228215fa08f8SRichard Henderson } else { 228315fa08f8SRichard Henderson op = QTAILQ_FIRST(&s->free_ops); 228415fa08f8SRichard Henderson QTAILQ_REMOVE(&s->free_ops, op, link); 228515fa08f8SRichard Henderson } 228615fa08f8SRichard Henderson memset(op, 0, offsetof(TCGOp, link)); 228715fa08f8SRichard Henderson op->opc = opc; 2288abebf925SRichard Henderson s->nb_ops++; 228915fa08f8SRichard Henderson 229015fa08f8SRichard Henderson return op; 229115fa08f8SRichard Henderson } 229215fa08f8SRichard Henderson 229315fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc) 229415fa08f8SRichard Henderson { 229515fa08f8SRichard Henderson TCGOp *op = tcg_op_alloc(opc); 229615fa08f8SRichard Henderson 
QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link); 229715fa08f8SRichard Henderson return op; 229815fa08f8SRichard Henderson } 229915fa08f8SRichard Henderson 2300ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 23015a18407fSRichard Henderson { 230215fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 230315fa08f8SRichard Henderson QTAILQ_INSERT_BEFORE(old_op, new_op, link); 23045a18407fSRichard Henderson return new_op; 23055a18407fSRichard Henderson } 23065a18407fSRichard Henderson 2307ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 23085a18407fSRichard Henderson { 230915fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 231015fa08f8SRichard Henderson QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link); 23115a18407fSRichard Henderson return new_op; 23125a18407fSRichard Henderson } 23135a18407fSRichard Henderson 2314b4fc67c7SRichard Henderson /* Reachable analysis : remove unreachable code. */ 2315b4fc67c7SRichard Henderson static void reachable_code_pass(TCGContext *s) 2316b4fc67c7SRichard Henderson { 2317b4fc67c7SRichard Henderson TCGOp *op, *op_next; 2318b4fc67c7SRichard Henderson bool dead = false; 2319b4fc67c7SRichard Henderson 2320b4fc67c7SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 2321b4fc67c7SRichard Henderson bool remove = dead; 2322b4fc67c7SRichard Henderson TCGLabel *label; 2323b4fc67c7SRichard Henderson 2324b4fc67c7SRichard Henderson switch (op->opc) { 2325b4fc67c7SRichard Henderson case INDEX_op_set_label: 2326b4fc67c7SRichard Henderson label = arg_label(op->args[0]); 2327b4fc67c7SRichard Henderson if (label->refs == 0) { 2328b4fc67c7SRichard Henderson /* 2329b4fc67c7SRichard Henderson * While there is an occasional backward branch, virtually 2330b4fc67c7SRichard Henderson * all branches generated by the translators are forward. 
/*
 * Reachable analysis : remove unreachable code.
 *
 * Walks the op list of S once, front to back.  After an unconditional
 * branch, exit_tb, goto_ptr, or a call flagged TCG_CALL_NO_RETURN, every
 * op is removed until a set_label whose label still has references.
 * insn_start ops are always kept.  Labels with no references are removed,
 * as is a "br L; set_label L" pair when that br is the only reference.
 */
static void reachable_code_pass(TCGContext *s)
{
    TCGOp *op, *op_next;
    /* True while the ops being visited cannot be reached. */
    bool dead = false;

    QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) {
        /* Default decision for this op; some cases below override it. */
        bool remove = dead;
        TCGLabel *label;

        switch (op->opc) {
        case INDEX_op_set_label:
            label = arg_label(op->args[0]);
            if (label->refs == 0) {
                /*
                 * While there is an occasional backward branch, virtually
                 * all branches generated by the translators are forward.
                 * Which means that generally we will have already removed
                 * every reference to the label that is going to be
                 * removed, and there is little to be gained by iterating.
                 */
                remove = true;
            } else {
                /* Once we see a label, insns become live again.  */
                dead = false;
                remove = false;

                /*
                 * Optimization can fold conditional branches to unconditional.
                 * If we find a label with one reference which is preceded by
                 * an unconditional branch to it, remove both.  This needed to
                 * wait until the dead code in between them was removed.
                 */
                if (label->refs == 1) {
                    /*
                     * NOTE(review): op_prev is dereferenced without a NULL
                     * check; presumably a referenced label is never the
                     * first op in the list -- confirm.
                     */
                    TCGOp *op_prev = QTAILQ_PREV(op, link);
                    if (op_prev->opc == INDEX_op_br &&
                        label == arg_label(op_prev->args[0])) {
                        tcg_op_remove(s, op_prev);
                        remove = true;
                    }
                }
            }
            break;

        case INDEX_op_br:
        case INDEX_op_exit_tb:
        case INDEX_op_goto_ptr:
            /* Unconditional branches; everything following is dead.  */
            dead = true;
            break;

        case INDEX_op_call:
            /* Notice noreturn helper calls, raising exceptions.  */
            if (tcg_call_flags(op) & TCG_CALL_NO_RETURN) {
                dead = true;
            }
            break;

        case INDEX_op_insn_start:
            /* Never remove -- we need to keep these for unwind.  */
            remove = false;
            break;

        default:
            break;
        }

        if (remove) {
            tcg_op_remove(s, op);
        }
    }
}

/* Bits of TCGTemp.state as used by the liveness helpers below. */
#define TS_DEAD  1
#define TS_MEM   2

/* Both macros expect a variable named arg_life at the point of use. */
#define IS_DEAD_ARG(n)   (arg_life & (DEAD_ARG << (n)))
#define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n)))

/* For liveness_pass_1, the register preferences for a given temp.  */
static inline TCGRegSet *la_temp_pref(TCGTemp *ts)
{
    return ts->state_ptr;
}
240125f49c5fSRichard Henderson */ 240225f49c5fSRichard Henderson static inline void la_reset_pref(TCGTemp *ts) 240325f49c5fSRichard Henderson { 240425f49c5fSRichard Henderson *la_temp_pref(ts) 240525f49c5fSRichard Henderson = (ts->state == TS_DEAD ? 0 : tcg_target_available_regs[ts->type]); 240625f49c5fSRichard Henderson } 240725f49c5fSRichard Henderson 24089c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 24099c43b68dSAurelien Jarno should be in memory. */ 24102616c808SRichard Henderson static void la_func_end(TCGContext *s, int ng, int nt) 2411c896fe29Sbellard { 2412b83eabeaSRichard Henderson int i; 2413b83eabeaSRichard Henderson 2414b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2415b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 241625f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 2417b83eabeaSRichard Henderson } 2418b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2419b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD; 242025f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 2421b83eabeaSRichard Henderson } 2422c896fe29Sbellard } 2423c896fe29Sbellard 24249c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 24259c43b68dSAurelien Jarno and local temps should be in memory. 
*/ 24262616c808SRichard Henderson static void la_bb_end(TCGContext *s, int ng, int nt) 2427641d5fbeSbellard { 2428b83eabeaSRichard Henderson int i; 2429641d5fbeSbellard 2430ee17db83SRichard Henderson for (i = 0; i < nt; ++i) { 2431ee17db83SRichard Henderson TCGTemp *ts = &s->temps[i]; 2432ee17db83SRichard Henderson int state; 2433ee17db83SRichard Henderson 2434ee17db83SRichard Henderson switch (ts->kind) { 2435ee17db83SRichard Henderson case TEMP_FIXED: 2436ee17db83SRichard Henderson case TEMP_GLOBAL: 2437ee17db83SRichard Henderson case TEMP_LOCAL: 2438ee17db83SRichard Henderson state = TS_DEAD | TS_MEM; 2439ee17db83SRichard Henderson break; 2440ee17db83SRichard Henderson case TEMP_NORMAL: 2441c7482438SRichard Henderson case TEMP_EBB: 2442c0522136SRichard Henderson case TEMP_CONST: 2443ee17db83SRichard Henderson state = TS_DEAD; 2444ee17db83SRichard Henderson break; 2445ee17db83SRichard Henderson default: 2446ee17db83SRichard Henderson g_assert_not_reached(); 2447c70fbf0aSRichard Henderson } 2448ee17db83SRichard Henderson ts->state = state; 2449ee17db83SRichard Henderson la_reset_pref(ts); 2450641d5fbeSbellard } 2451641d5fbeSbellard } 2452641d5fbeSbellard 2453f65a061cSRichard Henderson /* liveness analysis: sync globals back to memory. */ 2454f65a061cSRichard Henderson static void la_global_sync(TCGContext *s, int ng) 2455f65a061cSRichard Henderson { 2456f65a061cSRichard Henderson int i; 2457f65a061cSRichard Henderson 2458f65a061cSRichard Henderson for (i = 0; i < ng; ++i) { 245925f49c5fSRichard Henderson int state = s->temps[i].state; 246025f49c5fSRichard Henderson s->temps[i].state = state | TS_MEM; 246125f49c5fSRichard Henderson if (state == TS_DEAD) { 246225f49c5fSRichard Henderson /* If the global was previously dead, reset prefs. 
*/ 246325f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 246425f49c5fSRichard Henderson } 2465f65a061cSRichard Henderson } 2466f65a061cSRichard Henderson } 2467f65a061cSRichard Henderson 2468b4cb76e6SRichard Henderson /* 2469c7482438SRichard Henderson * liveness analysis: conditional branch: all temps are dead unless 2470c7482438SRichard Henderson * explicitly live-across-conditional-branch, globals and local temps 2471c7482438SRichard Henderson * should be synced. 2472b4cb76e6SRichard Henderson */ 2473b4cb76e6SRichard Henderson static void la_bb_sync(TCGContext *s, int ng, int nt) 2474b4cb76e6SRichard Henderson { 2475b4cb76e6SRichard Henderson la_global_sync(s, ng); 2476b4cb76e6SRichard Henderson 2477b4cb76e6SRichard Henderson for (int i = ng; i < nt; ++i) { 2478c0522136SRichard Henderson TCGTemp *ts = &s->temps[i]; 2479c0522136SRichard Henderson int state; 2480c0522136SRichard Henderson 2481c0522136SRichard Henderson switch (ts->kind) { 2482c0522136SRichard Henderson case TEMP_LOCAL: 2483c0522136SRichard Henderson state = ts->state; 2484c0522136SRichard Henderson ts->state = state | TS_MEM; 2485b4cb76e6SRichard Henderson if (state != TS_DEAD) { 2486b4cb76e6SRichard Henderson continue; 2487b4cb76e6SRichard Henderson } 2488c0522136SRichard Henderson break; 2489c0522136SRichard Henderson case TEMP_NORMAL: 2490b4cb76e6SRichard Henderson s->temps[i].state = TS_DEAD; 2491c0522136SRichard Henderson break; 2492c7482438SRichard Henderson case TEMP_EBB: 2493c0522136SRichard Henderson case TEMP_CONST: 2494c0522136SRichard Henderson continue; 2495c0522136SRichard Henderson default: 2496c0522136SRichard Henderson g_assert_not_reached(); 2497b4cb76e6SRichard Henderson } 2498b4cb76e6SRichard Henderson la_reset_pref(&s->temps[i]); 2499b4cb76e6SRichard Henderson } 2500b4cb76e6SRichard Henderson } 2501b4cb76e6SRichard Henderson 2502f65a061cSRichard Henderson /* liveness analysis: sync globals back to memory and kill. 
*/ 2503f65a061cSRichard Henderson static void la_global_kill(TCGContext *s, int ng) 2504f65a061cSRichard Henderson { 2505f65a061cSRichard Henderson int i; 2506f65a061cSRichard Henderson 2507f65a061cSRichard Henderson for (i = 0; i < ng; i++) { 2508f65a061cSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 250925f49c5fSRichard Henderson la_reset_pref(&s->temps[i]); 251025f49c5fSRichard Henderson } 251125f49c5fSRichard Henderson } 251225f49c5fSRichard Henderson 251325f49c5fSRichard Henderson /* liveness analysis: note live globals crossing calls. */ 251425f49c5fSRichard Henderson static void la_cross_call(TCGContext *s, int nt) 251525f49c5fSRichard Henderson { 251625f49c5fSRichard Henderson TCGRegSet mask = ~tcg_target_call_clobber_regs; 251725f49c5fSRichard Henderson int i; 251825f49c5fSRichard Henderson 251925f49c5fSRichard Henderson for (i = 0; i < nt; i++) { 252025f49c5fSRichard Henderson TCGTemp *ts = &s->temps[i]; 252125f49c5fSRichard Henderson if (!(ts->state & TS_DEAD)) { 252225f49c5fSRichard Henderson TCGRegSet *pset = la_temp_pref(ts); 252325f49c5fSRichard Henderson TCGRegSet set = *pset; 252425f49c5fSRichard Henderson 252525f49c5fSRichard Henderson set &= mask; 252625f49c5fSRichard Henderson /* If the combination is not possible, restart. */ 252725f49c5fSRichard Henderson if (set == 0) { 252825f49c5fSRichard Henderson set = tcg_target_available_regs[ts->type] & mask; 252925f49c5fSRichard Henderson } 253025f49c5fSRichard Henderson *pset = set; 253125f49c5fSRichard Henderson } 2532f65a061cSRichard Henderson } 2533f65a061cSRichard Henderson } 2534f65a061cSRichard Henderson 2535a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 2536c896fe29Sbellard given input arguments is dead. Instructions updating dead 2537c896fe29Sbellard temporaries are removed. 
*/ 2538b83eabeaSRichard Henderson static void liveness_pass_1(TCGContext *s) 2539c896fe29Sbellard { 2540c70fbf0aSRichard Henderson int nb_globals = s->nb_globals; 25412616c808SRichard Henderson int nb_temps = s->nb_temps; 254215fa08f8SRichard Henderson TCGOp *op, *op_prev; 254325f49c5fSRichard Henderson TCGRegSet *prefs; 254425f49c5fSRichard Henderson int i; 254525f49c5fSRichard Henderson 254625f49c5fSRichard Henderson prefs = tcg_malloc(sizeof(TCGRegSet) * nb_temps); 254725f49c5fSRichard Henderson for (i = 0; i < nb_temps; ++i) { 254825f49c5fSRichard Henderson s->temps[i].state_ptr = prefs + i; 254925f49c5fSRichard Henderson } 2550c896fe29Sbellard 2551ae36a246SRichard Henderson /* ??? Should be redundant with the exit_tb that ends the TB. */ 25522616c808SRichard Henderson la_func_end(s, nb_globals, nb_temps); 2553c896fe29Sbellard 2554eae3eb3eSPaolo Bonzini QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, link, op_prev) { 255525f49c5fSRichard Henderson int nb_iargs, nb_oargs; 2556c45cb8bbSRichard Henderson TCGOpcode opc_new, opc_new2; 2557c45cb8bbSRichard Henderson bool have_opc_new2; 2558a1b3c48dSRichard Henderson TCGLifeData arg_life = 0; 255925f49c5fSRichard Henderson TCGTemp *ts; 2560c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 2561c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 2562c45cb8bbSRichard Henderson 2563c45cb8bbSRichard Henderson switch (opc) { 2564c896fe29Sbellard case INDEX_op_call: 2565c6e113f5Sbellard { 2566c6e113f5Sbellard int call_flags; 256725f49c5fSRichard Henderson int nb_call_regs; 2568c6e113f5Sbellard 2569cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2570cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 257190163900SRichard Henderson call_flags = tcg_call_flags(op); 2572c6e113f5Sbellard 2573c45cb8bbSRichard Henderson /* pure functions can be removed if their result is unused */ 257478505279SAurelien Jarno if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) { 2575c6e113f5Sbellard for (i = 0; i < nb_oargs; i++) { 
257625f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 257725f49c5fSRichard Henderson if (ts->state != TS_DEAD) { 2578c6e113f5Sbellard goto do_not_remove_call; 2579c6e113f5Sbellard } 25809c43b68dSAurelien Jarno } 2581c45cb8bbSRichard Henderson goto do_remove; 2582152c35aaSRichard Henderson } 2583c6e113f5Sbellard do_not_remove_call: 2584c896fe29Sbellard 258525f49c5fSRichard Henderson /* Output args are dead. */ 2586c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 258725f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 258825f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2589a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 25906b64b624SAurelien Jarno } 259125f49c5fSRichard Henderson if (ts->state & TS_MEM) { 2592a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 25939c43b68dSAurelien Jarno } 259425f49c5fSRichard Henderson ts->state = TS_DEAD; 259525f49c5fSRichard Henderson la_reset_pref(ts); 259625f49c5fSRichard Henderson 259725f49c5fSRichard Henderson /* Not used -- it will be tcg_target_call_oarg_regs[i]. */ 259825f49c5fSRichard Henderson op->output_pref[i] = 0; 2599c896fe29Sbellard } 2600c896fe29Sbellard 260178505279SAurelien Jarno if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS | 260278505279SAurelien Jarno TCG_CALL_NO_READ_GLOBALS))) { 2603f65a061cSRichard Henderson la_global_kill(s, nb_globals); 2604c70fbf0aSRichard Henderson } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) { 2605f65a061cSRichard Henderson la_global_sync(s, nb_globals); 2606b9c18f56Saurel32 } 2607c896fe29Sbellard 260825f49c5fSRichard Henderson /* Record arguments that die in this helper. 
*/ 2609866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 261025f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 261125f49c5fSRichard Henderson if (ts && ts->state & TS_DEAD) { 2612a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2613c896fe29Sbellard } 2614c896fe29Sbellard } 261525f49c5fSRichard Henderson 261625f49c5fSRichard Henderson /* For all live registers, remove call-clobbered prefs. */ 261725f49c5fSRichard Henderson la_cross_call(s, nb_temps); 261825f49c5fSRichard Henderson 261925f49c5fSRichard Henderson nb_call_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 262025f49c5fSRichard Henderson 262125f49c5fSRichard Henderson /* Input arguments are live for preceding opcodes. */ 262225f49c5fSRichard Henderson for (i = 0; i < nb_iargs; i++) { 262325f49c5fSRichard Henderson ts = arg_temp(op->args[i + nb_oargs]); 262425f49c5fSRichard Henderson if (ts && ts->state & TS_DEAD) { 262525f49c5fSRichard Henderson /* For those arguments that die, and will be allocated 262625f49c5fSRichard Henderson * in registers, clear the register set for that arg, 262725f49c5fSRichard Henderson * to be filled in below. For args that will be on 262825f49c5fSRichard Henderson * the stack, reset to any available reg. 262925f49c5fSRichard Henderson */ 263025f49c5fSRichard Henderson *la_temp_pref(ts) 263125f49c5fSRichard Henderson = (i < nb_call_regs ? 0 : 263225f49c5fSRichard Henderson tcg_target_available_regs[ts->type]); 263325f49c5fSRichard Henderson ts->state &= ~TS_DEAD; 263425f49c5fSRichard Henderson } 263525f49c5fSRichard Henderson } 263625f49c5fSRichard Henderson 263725f49c5fSRichard Henderson /* For each input argument, add its input register to prefs. 263825f49c5fSRichard Henderson If a temp is used once, this produces a single set bit. 
*/ 263925f49c5fSRichard Henderson for (i = 0; i < MIN(nb_call_regs, nb_iargs); i++) { 264025f49c5fSRichard Henderson ts = arg_temp(op->args[i + nb_oargs]); 264125f49c5fSRichard Henderson if (ts) { 264225f49c5fSRichard Henderson tcg_regset_set_reg(*la_temp_pref(ts), 264325f49c5fSRichard Henderson tcg_target_call_iarg_regs[i]); 2644c70fbf0aSRichard Henderson } 2645c19f47bfSAurelien Jarno } 2646c6e113f5Sbellard } 2647c896fe29Sbellard break; 2648765b842aSRichard Henderson case INDEX_op_insn_start: 2649c896fe29Sbellard break; 26505ff9d6a4Sbellard case INDEX_op_discard: 26515ff9d6a4Sbellard /* mark the temporary as dead */ 265225f49c5fSRichard Henderson ts = arg_temp(op->args[0]); 265325f49c5fSRichard Henderson ts->state = TS_DEAD; 265425f49c5fSRichard Henderson la_reset_pref(ts); 26555ff9d6a4Sbellard break; 26561305c451SRichard Henderson 26571305c451SRichard Henderson case INDEX_op_add2_i32: 2658c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i32; 2659f1fae40cSRichard Henderson goto do_addsub2; 26601305c451SRichard Henderson case INDEX_op_sub2_i32: 2661c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i32; 2662f1fae40cSRichard Henderson goto do_addsub2; 2663f1fae40cSRichard Henderson case INDEX_op_add2_i64: 2664c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i64; 2665f1fae40cSRichard Henderson goto do_addsub2; 2666f1fae40cSRichard Henderson case INDEX_op_sub2_i64: 2667c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i64; 2668f1fae40cSRichard Henderson do_addsub2: 26691305c451SRichard Henderson nb_iargs = 4; 26701305c451SRichard Henderson nb_oargs = 2; 26711305c451SRichard Henderson /* Test if the high part of the operation is dead, but not 26721305c451SRichard Henderson the low part. The result can be optimized to a simple 26731305c451SRichard Henderson add or sub. This happens often for x86_64 guest when the 26741305c451SRichard Henderson cpu mode is set to 32 bit. 
*/ 2675b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2676b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 26771305c451SRichard Henderson goto do_remove; 26781305c451SRichard Henderson } 2679c45cb8bbSRichard Henderson /* Replace the opcode and adjust the args in place, 2680c45cb8bbSRichard Henderson leaving 3 unused args at the end. */ 2681c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2682efee3746SRichard Henderson op->args[1] = op->args[2]; 2683efee3746SRichard Henderson op->args[2] = op->args[4]; 26841305c451SRichard Henderson /* Fall through and mark the single-word operation live. */ 26851305c451SRichard Henderson nb_iargs = 2; 26861305c451SRichard Henderson nb_oargs = 1; 26871305c451SRichard Henderson } 26881305c451SRichard Henderson goto do_not_remove; 26891305c451SRichard Henderson 26901414968aSRichard Henderson case INDEX_op_mulu2_i32: 2691c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2692c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i32; 2693c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i32; 269403271524SRichard Henderson goto do_mul2; 2695f1fae40cSRichard Henderson case INDEX_op_muls2_i32: 2696c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2697c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i32; 2698c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i32; 2699f1fae40cSRichard Henderson goto do_mul2; 2700f1fae40cSRichard Henderson case INDEX_op_mulu2_i64: 2701c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2702c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i64; 2703c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i64; 270403271524SRichard Henderson goto do_mul2; 2705f1fae40cSRichard Henderson case INDEX_op_muls2_i64: 2706c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2707c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i64; 2708c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i64; 
270903271524SRichard Henderson goto do_mul2; 2710f1fae40cSRichard Henderson do_mul2: 27111414968aSRichard Henderson nb_iargs = 2; 27121414968aSRichard Henderson nb_oargs = 2; 2713b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2714b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 271503271524SRichard Henderson /* Both parts of the operation are dead. */ 27161414968aSRichard Henderson goto do_remove; 27171414968aSRichard Henderson } 271803271524SRichard Henderson /* The high part of the operation is dead; generate the low. */ 2719c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2720efee3746SRichard Henderson op->args[1] = op->args[2]; 2721efee3746SRichard Henderson op->args[2] = op->args[3]; 2722b83eabeaSRichard Henderson } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) { 272303271524SRichard Henderson /* The low part of the operation is dead; generate the high. */ 2724c45cb8bbSRichard Henderson op->opc = opc = opc_new2; 2725efee3746SRichard Henderson op->args[0] = op->args[1]; 2726efee3746SRichard Henderson op->args[1] = op->args[2]; 2727efee3746SRichard Henderson op->args[2] = op->args[3]; 272803271524SRichard Henderson } else { 272903271524SRichard Henderson goto do_not_remove; 273003271524SRichard Henderson } 273103271524SRichard Henderson /* Mark the single-word operation live. */ 27321414968aSRichard Henderson nb_oargs = 1; 27331414968aSRichard Henderson goto do_not_remove; 27341414968aSRichard Henderson 2735c896fe29Sbellard default: 27361305c451SRichard Henderson /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */ 2737c896fe29Sbellard nb_iargs = def->nb_iargs; 2738c896fe29Sbellard nb_oargs = def->nb_oargs; 2739c896fe29Sbellard 2740c896fe29Sbellard /* Test if the operation can be removed because all 27415ff9d6a4Sbellard its outputs are dead. 
We assume that nb_oargs == 0 27425ff9d6a4Sbellard implies side effects */ 27435ff9d6a4Sbellard if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) { 2744c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2745b83eabeaSRichard Henderson if (arg_temp(op->args[i])->state != TS_DEAD) { 2746c896fe29Sbellard goto do_not_remove; 2747c896fe29Sbellard } 27489c43b68dSAurelien Jarno } 2749152c35aaSRichard Henderson goto do_remove; 2750152c35aaSRichard Henderson } 2751152c35aaSRichard Henderson goto do_not_remove; 2752152c35aaSRichard Henderson 27531305c451SRichard Henderson do_remove: 27540c627cdcSRichard Henderson tcg_op_remove(s, op); 2755152c35aaSRichard Henderson break; 2756152c35aaSRichard Henderson 2757c896fe29Sbellard do_not_remove: 2758c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 275925f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 276025f49c5fSRichard Henderson 276125f49c5fSRichard Henderson /* Remember the preference of the uses that followed. */ 276225f49c5fSRichard Henderson op->output_pref[i] = *la_temp_pref(ts); 276325f49c5fSRichard Henderson 276425f49c5fSRichard Henderson /* Output args are dead. */ 276525f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2766a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 27676b64b624SAurelien Jarno } 276825f49c5fSRichard Henderson if (ts->state & TS_MEM) { 2769a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 27709c43b68dSAurelien Jarno } 277125f49c5fSRichard Henderson ts->state = TS_DEAD; 277225f49c5fSRichard Henderson la_reset_pref(ts); 2773c896fe29Sbellard } 2774c896fe29Sbellard 277525f49c5fSRichard Henderson /* If end of basic block, update. 
*/ 2776ae36a246SRichard Henderson if (def->flags & TCG_OPF_BB_EXIT) { 2777ae36a246SRichard Henderson la_func_end(s, nb_globals, nb_temps); 2778b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_COND_BRANCH) { 2779b4cb76e6SRichard Henderson la_bb_sync(s, nb_globals, nb_temps); 2780ae36a246SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 27812616c808SRichard Henderson la_bb_end(s, nb_globals, nb_temps); 27823d5c5f87SAurelien Jarno } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 2783f65a061cSRichard Henderson la_global_sync(s, nb_globals); 278425f49c5fSRichard Henderson if (def->flags & TCG_OPF_CALL_CLOBBER) { 278525f49c5fSRichard Henderson la_cross_call(s, nb_temps); 278625f49c5fSRichard Henderson } 2787c896fe29Sbellard } 2788c896fe29Sbellard 278925f49c5fSRichard Henderson /* Record arguments that die in this opcode. */ 2790866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 279125f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 279225f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 2793a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2794c896fe29Sbellard } 2795c19f47bfSAurelien Jarno } 279625f49c5fSRichard Henderson 279725f49c5fSRichard Henderson /* Input arguments are live for preceding opcodes. */ 2798c19f47bfSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 279925f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 280025f49c5fSRichard Henderson if (ts->state & TS_DEAD) { 280125f49c5fSRichard Henderson /* For operands that were dead, initially allow 280225f49c5fSRichard Henderson all regs for the type. */ 280325f49c5fSRichard Henderson *la_temp_pref(ts) = tcg_target_available_regs[ts->type]; 280425f49c5fSRichard Henderson ts->state &= ~TS_DEAD; 280525f49c5fSRichard Henderson } 280625f49c5fSRichard Henderson } 280725f49c5fSRichard Henderson 280825f49c5fSRichard Henderson /* Incorporate constraints for this operand. 
*/ 280925f49c5fSRichard Henderson switch (opc) { 281025f49c5fSRichard Henderson case INDEX_op_mov_i32: 281125f49c5fSRichard Henderson case INDEX_op_mov_i64: 281225f49c5fSRichard Henderson /* Note that these are TCG_OPF_NOT_PRESENT and do not 281325f49c5fSRichard Henderson have proper constraints. That said, special case 281425f49c5fSRichard Henderson moves to propagate preferences backward. */ 281525f49c5fSRichard Henderson if (IS_DEAD_ARG(1)) { 281625f49c5fSRichard Henderson *la_temp_pref(arg_temp(op->args[0])) 281725f49c5fSRichard Henderson = *la_temp_pref(arg_temp(op->args[1])); 281825f49c5fSRichard Henderson } 281925f49c5fSRichard Henderson break; 282025f49c5fSRichard Henderson 282125f49c5fSRichard Henderson default: 282225f49c5fSRichard Henderson for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 282325f49c5fSRichard Henderson const TCGArgConstraint *ct = &def->args_ct[i]; 282425f49c5fSRichard Henderson TCGRegSet set, *pset; 282525f49c5fSRichard Henderson 282625f49c5fSRichard Henderson ts = arg_temp(op->args[i]); 282725f49c5fSRichard Henderson pset = la_temp_pref(ts); 282825f49c5fSRichard Henderson set = *pset; 282925f49c5fSRichard Henderson 28309be0d080SRichard Henderson set &= ct->regs; 2831bc2b17e6SRichard Henderson if (ct->ialias) { 283225f49c5fSRichard Henderson set &= op->output_pref[ct->alias_index]; 283325f49c5fSRichard Henderson } 283425f49c5fSRichard Henderson /* If the combination is not possible, restart. */ 283525f49c5fSRichard Henderson if (set == 0) { 28369be0d080SRichard Henderson set = ct->regs; 283725f49c5fSRichard Henderson } 283825f49c5fSRichard Henderson *pset = set; 283925f49c5fSRichard Henderson } 284025f49c5fSRichard Henderson break; 2841c896fe29Sbellard } 2842c896fe29Sbellard break; 2843c896fe29Sbellard } 2844bee158cbSRichard Henderson op->life = arg_life; 2845c896fe29Sbellard } 28461ff0a2c5SEvgeny Voevodin } 2847c896fe29Sbellard 28485a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries. 
*/ 2849b83eabeaSRichard Henderson static bool liveness_pass_2(TCGContext *s) 28505a18407fSRichard Henderson { 28515a18407fSRichard Henderson int nb_globals = s->nb_globals; 285215fa08f8SRichard Henderson int nb_temps, i; 28535a18407fSRichard Henderson bool changes = false; 285415fa08f8SRichard Henderson TCGOp *op, *op_next; 28555a18407fSRichard Henderson 28565a18407fSRichard Henderson /* Create a temporary for each indirect global. */ 28575a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 28585a18407fSRichard Henderson TCGTemp *its = &s->temps[i]; 28595a18407fSRichard Henderson if (its->indirect_reg) { 28605a18407fSRichard Henderson TCGTemp *dts = tcg_temp_alloc(s); 28615a18407fSRichard Henderson dts->type = its->type; 28625a18407fSRichard Henderson dts->base_type = its->base_type; 2863c7482438SRichard Henderson dts->kind = TEMP_EBB; 2864b83eabeaSRichard Henderson its->state_ptr = dts; 2865b83eabeaSRichard Henderson } else { 2866b83eabeaSRichard Henderson its->state_ptr = NULL; 28675a18407fSRichard Henderson } 2868b83eabeaSRichard Henderson /* All globals begin dead. 
*/ 2869b83eabeaSRichard Henderson its->state = TS_DEAD; 28705a18407fSRichard Henderson } 2871b83eabeaSRichard Henderson for (nb_temps = s->nb_temps; i < nb_temps; ++i) { 2872b83eabeaSRichard Henderson TCGTemp *its = &s->temps[i]; 2873b83eabeaSRichard Henderson its->state_ptr = NULL; 2874b83eabeaSRichard Henderson its->state = TS_DEAD; 2875b83eabeaSRichard Henderson } 28765a18407fSRichard Henderson 287715fa08f8SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 28785a18407fSRichard Henderson TCGOpcode opc = op->opc; 28795a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 28805a18407fSRichard Henderson TCGLifeData arg_life = op->life; 28815a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 2882b83eabeaSRichard Henderson TCGTemp *arg_ts, *dir_ts; 28835a18407fSRichard Henderson 28845a18407fSRichard Henderson if (opc == INDEX_op_call) { 2885cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2886cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 288790163900SRichard Henderson call_flags = tcg_call_flags(op); 28885a18407fSRichard Henderson } else { 28895a18407fSRichard Henderson nb_iargs = def->nb_iargs; 28905a18407fSRichard Henderson nb_oargs = def->nb_oargs; 28915a18407fSRichard Henderson 28925a18407fSRichard Henderson /* Set flags similar to how calls require. 
*/ 2893b4cb76e6SRichard Henderson if (def->flags & TCG_OPF_COND_BRANCH) { 2894b4cb76e6SRichard Henderson /* Like reading globals: sync_globals */ 2895b4cb76e6SRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 2896b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 28975a18407fSRichard Henderson /* Like writing globals: save_globals */ 28985a18407fSRichard Henderson call_flags = 0; 28995a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 29005a18407fSRichard Henderson /* Like reading globals: sync_globals */ 29015a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 29025a18407fSRichard Henderson } else { 29035a18407fSRichard Henderson /* No effect on globals. */ 29045a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 29055a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 29065a18407fSRichard Henderson } 29075a18407fSRichard Henderson } 29085a18407fSRichard Henderson 29095a18407fSRichard Henderson /* Make sure that input arguments are available. */ 29105a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2911b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2912b83eabeaSRichard Henderson if (arg_ts) { 2913b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2914b83eabeaSRichard Henderson if (dir_ts && arg_ts->state == TS_DEAD) { 2915b83eabeaSRichard Henderson TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32 29165a18407fSRichard Henderson ? INDEX_op_ld_i32 29175a18407fSRichard Henderson : INDEX_op_ld_i64); 2918ac1043f6SEmilio G. Cota TCGOp *lop = tcg_op_insert_before(s, op, lopc); 29195a18407fSRichard Henderson 2920b83eabeaSRichard Henderson lop->args[0] = temp_arg(dir_ts); 2921b83eabeaSRichard Henderson lop->args[1] = temp_arg(arg_ts->mem_base); 2922b83eabeaSRichard Henderson lop->args[2] = arg_ts->mem_offset; 29235a18407fSRichard Henderson 29245a18407fSRichard Henderson /* Loaded, but synced with memory. 
*/ 2925b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 29265a18407fSRichard Henderson } 29275a18407fSRichard Henderson } 29285a18407fSRichard Henderson } 29295a18407fSRichard Henderson 29305a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 29315a18407fSRichard Henderson No action is required except keeping temp_state up to date 29325a18407fSRichard Henderson so that we reload when needed. */ 29335a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2934b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2935b83eabeaSRichard Henderson if (arg_ts) { 2936b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2937b83eabeaSRichard Henderson if (dir_ts) { 2938b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 29395a18407fSRichard Henderson changes = true; 29405a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2941b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 29425a18407fSRichard Henderson } 29435a18407fSRichard Henderson } 29445a18407fSRichard Henderson } 29455a18407fSRichard Henderson } 29465a18407fSRichard Henderson 29475a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 29485a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 29495a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 29505a18407fSRichard Henderson /* Nothing to do */ 29515a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 29525a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 29535a18407fSRichard Henderson /* Liveness should see that globals are synced back, 29545a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. 
*/ 2955b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2956b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2957b83eabeaSRichard Henderson || arg_ts->state != 0); 29585a18407fSRichard Henderson } 29595a18407fSRichard Henderson } else { 29605a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 29615a18407fSRichard Henderson /* Liveness should see that globals are saved back, 29625a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. */ 2963b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2964b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2965b83eabeaSRichard Henderson || arg_ts->state == TS_DEAD); 29665a18407fSRichard Henderson } 29675a18407fSRichard Henderson } 29685a18407fSRichard Henderson 29695a18407fSRichard Henderson /* Outputs become available. */ 297061f15c48SRichard Henderson if (opc == INDEX_op_mov_i32 || opc == INDEX_op_mov_i64) { 297161f15c48SRichard Henderson arg_ts = arg_temp(op->args[0]); 297261f15c48SRichard Henderson dir_ts = arg_ts->state_ptr; 297361f15c48SRichard Henderson if (dir_ts) { 297461f15c48SRichard Henderson op->args[0] = temp_arg(dir_ts); 297561f15c48SRichard Henderson changes = true; 297661f15c48SRichard Henderson 297761f15c48SRichard Henderson /* The output is now live and modified. */ 297861f15c48SRichard Henderson arg_ts->state = 0; 297961f15c48SRichard Henderson 298061f15c48SRichard Henderson if (NEED_SYNC_ARG(0)) { 298161f15c48SRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 298261f15c48SRichard Henderson ? 
INDEX_op_st_i32 298361f15c48SRichard Henderson : INDEX_op_st_i64); 298461f15c48SRichard Henderson TCGOp *sop = tcg_op_insert_after(s, op, sopc); 298561f15c48SRichard Henderson TCGTemp *out_ts = dir_ts; 298661f15c48SRichard Henderson 298761f15c48SRichard Henderson if (IS_DEAD_ARG(0)) { 298861f15c48SRichard Henderson out_ts = arg_temp(op->args[1]); 298961f15c48SRichard Henderson arg_ts->state = TS_DEAD; 299061f15c48SRichard Henderson tcg_op_remove(s, op); 299161f15c48SRichard Henderson } else { 299261f15c48SRichard Henderson arg_ts->state = TS_MEM; 299361f15c48SRichard Henderson } 299461f15c48SRichard Henderson 299561f15c48SRichard Henderson sop->args[0] = temp_arg(out_ts); 299661f15c48SRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 299761f15c48SRichard Henderson sop->args[2] = arg_ts->mem_offset; 299861f15c48SRichard Henderson } else { 299961f15c48SRichard Henderson tcg_debug_assert(!IS_DEAD_ARG(0)); 300061f15c48SRichard Henderson } 300161f15c48SRichard Henderson } 300261f15c48SRichard Henderson } else { 30035a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 3004b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 3005b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 3006b83eabeaSRichard Henderson if (!dir_ts) { 30075a18407fSRichard Henderson continue; 30085a18407fSRichard Henderson } 3009b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 30105a18407fSRichard Henderson changes = true; 30115a18407fSRichard Henderson 30125a18407fSRichard Henderson /* The output is now live and modified. */ 3013b83eabeaSRichard Henderson arg_ts->state = 0; 30145a18407fSRichard Henderson 30155a18407fSRichard Henderson /* Sync outputs upon their last write. */ 30165a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 3017b83eabeaSRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 30185a18407fSRichard Henderson ? INDEX_op_st_i32 30195a18407fSRichard Henderson : INDEX_op_st_i64); 3020ac1043f6SEmilio G. 
Cota TCGOp *sop = tcg_op_insert_after(s, op, sopc); 30215a18407fSRichard Henderson 3022b83eabeaSRichard Henderson sop->args[0] = temp_arg(dir_ts); 3023b83eabeaSRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 3024b83eabeaSRichard Henderson sop->args[2] = arg_ts->mem_offset; 30255a18407fSRichard Henderson 3026b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 30275a18407fSRichard Henderson } 30285a18407fSRichard Henderson /* Drop outputs that are dead. */ 30295a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 3030b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 30315a18407fSRichard Henderson } 30325a18407fSRichard Henderson } 30335a18407fSRichard Henderson } 303461f15c48SRichard Henderson } 30355a18407fSRichard Henderson 30365a18407fSRichard Henderson return changes; 30375a18407fSRichard Henderson } 30385a18407fSRichard Henderson 30392272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts) 3040c896fe29Sbellard { 3041c1c09194SRichard Henderson intptr_t off, size, align; 3042c1c09194SRichard Henderson 3043c1c09194SRichard Henderson switch (ts->type) { 3044c1c09194SRichard Henderson case TCG_TYPE_I32: 3045c1c09194SRichard Henderson size = align = 4; 3046c1c09194SRichard Henderson break; 3047c1c09194SRichard Henderson case TCG_TYPE_I64: 3048c1c09194SRichard Henderson case TCG_TYPE_V64: 3049c1c09194SRichard Henderson size = align = 8; 3050c1c09194SRichard Henderson break; 3051c1c09194SRichard Henderson case TCG_TYPE_V128: 3052c1c09194SRichard Henderson size = align = 16; 3053c1c09194SRichard Henderson break; 3054c1c09194SRichard Henderson case TCG_TYPE_V256: 3055c1c09194SRichard Henderson /* Note that we do not require aligned storage for V256. 
*/ 3056c1c09194SRichard Henderson size = 32, align = 16; 3057c1c09194SRichard Henderson break; 3058c1c09194SRichard Henderson default: 3059c1c09194SRichard Henderson g_assert_not_reached(); 3060b591dc59SBlue Swirl } 3061c1c09194SRichard Henderson 3062b9537d59SRichard Henderson /* 3063b9537d59SRichard Henderson * Assume the stack is sufficiently aligned. 3064b9537d59SRichard Henderson * This affects e.g. ARM NEON, where we have 8 byte stack alignment 3065b9537d59SRichard Henderson * and do not require 16 byte vector alignment. This seems slightly 3066b9537d59SRichard Henderson * easier than fully parameterizing the above switch statement. 3067b9537d59SRichard Henderson */ 3068b9537d59SRichard Henderson align = MIN(TCG_TARGET_STACK_ALIGN, align); 3069c1c09194SRichard Henderson off = ROUND_UP(s->current_frame_offset, align); 3070732d5897SRichard Henderson 3071732d5897SRichard Henderson /* If we've exhausted the stack frame, restart with a smaller TB. */ 3072732d5897SRichard Henderson if (off + size > s->frame_end) { 3073732d5897SRichard Henderson tcg_raise_tb_overflow(s); 3074732d5897SRichard Henderson } 3075c1c09194SRichard Henderson s->current_frame_offset = off + size; 3076c1c09194SRichard Henderson 3077c1c09194SRichard Henderson ts->mem_offset = off; 30789defd1bdSRichard Henderson #if defined(__sparc__) 30799defd1bdSRichard Henderson ts->mem_offset += TCG_TARGET_STACK_BIAS; 30809defd1bdSRichard Henderson #endif 3081b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 3082c896fe29Sbellard ts->mem_allocated = 1; 3083c896fe29Sbellard } 3084c896fe29Sbellard 3085098859f1SRichard Henderson /* Assign @reg to @ts, and update reg_to_temp[]. 
*/ 3086098859f1SRichard Henderson static void set_temp_val_reg(TCGContext *s, TCGTemp *ts, TCGReg reg) 3087098859f1SRichard Henderson { 3088098859f1SRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 3089098859f1SRichard Henderson TCGReg old = ts->reg; 3090098859f1SRichard Henderson tcg_debug_assert(s->reg_to_temp[old] == ts); 3091098859f1SRichard Henderson if (old == reg) { 3092098859f1SRichard Henderson return; 3093098859f1SRichard Henderson } 3094098859f1SRichard Henderson s->reg_to_temp[old] = NULL; 3095098859f1SRichard Henderson } 3096098859f1SRichard Henderson tcg_debug_assert(s->reg_to_temp[reg] == NULL); 3097098859f1SRichard Henderson s->reg_to_temp[reg] = ts; 3098098859f1SRichard Henderson ts->val_type = TEMP_VAL_REG; 3099098859f1SRichard Henderson ts->reg = reg; 3100098859f1SRichard Henderson } 3101098859f1SRichard Henderson 3102098859f1SRichard Henderson /* Assign a non-register value type to @ts, and update reg_to_temp[]. */ 3103098859f1SRichard Henderson static void set_temp_val_nonreg(TCGContext *s, TCGTemp *ts, TCGTempVal type) 3104098859f1SRichard Henderson { 3105098859f1SRichard Henderson tcg_debug_assert(type != TEMP_VAL_REG); 3106098859f1SRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 3107098859f1SRichard Henderson TCGReg reg = ts->reg; 3108098859f1SRichard Henderson tcg_debug_assert(s->reg_to_temp[reg] == ts); 3109098859f1SRichard Henderson s->reg_to_temp[reg] = NULL; 3110098859f1SRichard Henderson } 3111098859f1SRichard Henderson ts->val_type = type; 3112098859f1SRichard Henderson } 3113098859f1SRichard Henderson 3114b722452aSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet, TCGRegSet); 3115b3915dbbSRichard Henderson 311659d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 311759d7c14eSRichard Henderson mark it free; otherwise mark it dead. 
*/ 311859d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 3119c896fe29Sbellard { 3120c0522136SRichard Henderson TCGTempVal new_type; 3121c0522136SRichard Henderson 3122c0522136SRichard Henderson switch (ts->kind) { 3123c0522136SRichard Henderson case TEMP_FIXED: 312459d7c14eSRichard Henderson return; 3125c0522136SRichard Henderson case TEMP_GLOBAL: 3126c0522136SRichard Henderson case TEMP_LOCAL: 3127c0522136SRichard Henderson new_type = TEMP_VAL_MEM; 3128c0522136SRichard Henderson break; 3129c0522136SRichard Henderson case TEMP_NORMAL: 3130c7482438SRichard Henderson case TEMP_EBB: 3131c0522136SRichard Henderson new_type = free_or_dead < 0 ? TEMP_VAL_MEM : TEMP_VAL_DEAD; 3132c0522136SRichard Henderson break; 3133c0522136SRichard Henderson case TEMP_CONST: 3134c0522136SRichard Henderson new_type = TEMP_VAL_CONST; 3135c0522136SRichard Henderson break; 3136c0522136SRichard Henderson default: 3137c0522136SRichard Henderson g_assert_not_reached(); 313859d7c14eSRichard Henderson } 3139098859f1SRichard Henderson set_temp_val_nonreg(s, ts, new_type); 314059d7c14eSRichard Henderson } 3141c896fe29Sbellard 314259d7c14eSRichard Henderson /* Mark a temporary as dead. */ 314359d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 314459d7c14eSRichard Henderson { 314559d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 314659d7c14eSRichard Henderson } 314759d7c14eSRichard Henderson 314859d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 314959d7c14eSRichard Henderson registers needs to be allocated to store a constant. If 'free_or_dead' 315059d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 315159d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. 
*/ 315298b4e186SRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs, 315398b4e186SRichard Henderson TCGRegSet preferred_regs, int free_or_dead) 315459d7c14eSRichard Henderson { 3155c0522136SRichard Henderson if (!temp_readonly(ts) && !ts->mem_coherent) { 31567f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 31572272e4a7SRichard Henderson temp_allocate_frame(s, ts); 315859d7c14eSRichard Henderson } 315959d7c14eSRichard Henderson switch (ts->val_type) { 316059d7c14eSRichard Henderson case TEMP_VAL_CONST: 316159d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 316259d7c14eSRichard Henderson require it later in a register, so attempt to store the 316359d7c14eSRichard Henderson constant to memory directly. */ 316459d7c14eSRichard Henderson if (free_or_dead 316559d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 316659d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 316759d7c14eSRichard Henderson break; 316859d7c14eSRichard Henderson } 316959d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 317098b4e186SRichard Henderson allocated_regs, preferred_regs); 317159d7c14eSRichard Henderson /* fallthrough */ 317259d7c14eSRichard Henderson 317359d7c14eSRichard Henderson case TEMP_VAL_REG: 317459d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 317559d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 317659d7c14eSRichard Henderson break; 317759d7c14eSRichard Henderson 317859d7c14eSRichard Henderson case TEMP_VAL_MEM: 317959d7c14eSRichard Henderson break; 318059d7c14eSRichard Henderson 318159d7c14eSRichard Henderson case TEMP_VAL_DEAD: 318259d7c14eSRichard Henderson default: 318359d7c14eSRichard Henderson tcg_abort(); 3184c896fe29Sbellard } 31857f6ceedfSAurelien Jarno ts->mem_coherent = 1; 31867f6ceedfSAurelien Jarno } 318759d7c14eSRichard Henderson if (free_or_dead) { 318859d7c14eSRichard Henderson temp_free_or_dead(s, ts, 
free_or_dead); 318959d7c14eSRichard Henderson } 319059d7c14eSRichard Henderson } 31917f6ceedfSAurelien Jarno 31927f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 3193b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 31947f6ceedfSAurelien Jarno { 3195f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 3196f8b2f202SRichard Henderson if (ts != NULL) { 319798b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, -1); 3198c896fe29Sbellard } 3199c896fe29Sbellard } 3200c896fe29Sbellard 3201b016486eSRichard Henderson /** 3202b016486eSRichard Henderson * tcg_reg_alloc: 3203b016486eSRichard Henderson * @required_regs: Set of registers in which we must allocate. 3204b016486eSRichard Henderson * @allocated_regs: Set of registers which must be avoided. 3205b016486eSRichard Henderson * @preferred_regs: Set of registers we should prefer. 3206b016486eSRichard Henderson * @rev: True if we search the registers in "indirect" order. 3207b016486eSRichard Henderson * 3208b016486eSRichard Henderson * The allocated register must be in @required_regs & ~@allocated_regs, 3209b016486eSRichard Henderson * but if we can put it in @preferred_regs we may save a move later. 
3210b016486eSRichard Henderson */ 3211b016486eSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet required_regs, 3212b016486eSRichard Henderson TCGRegSet allocated_regs, 3213b016486eSRichard Henderson TCGRegSet preferred_regs, bool rev) 3214c896fe29Sbellard { 3215b016486eSRichard Henderson int i, j, f, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 3216b016486eSRichard Henderson TCGRegSet reg_ct[2]; 321791478cefSRichard Henderson const int *order; 3218c896fe29Sbellard 3219b016486eSRichard Henderson reg_ct[1] = required_regs & ~allocated_regs; 3220b016486eSRichard Henderson tcg_debug_assert(reg_ct[1] != 0); 3221b016486eSRichard Henderson reg_ct[0] = reg_ct[1] & preferred_regs; 3222b016486eSRichard Henderson 3223b016486eSRichard Henderson /* Skip the preferred_regs option if it cannot be satisfied, 3224b016486eSRichard Henderson or if the preference made no difference. */ 3225b016486eSRichard Henderson f = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1]; 3226b016486eSRichard Henderson 322791478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 3228c896fe29Sbellard 3229b016486eSRichard Henderson /* Try free registers, preferences first. */ 3230b016486eSRichard Henderson for (j = f; j < 2; j++) { 3231b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 3232b016486eSRichard Henderson 3233b016486eSRichard Henderson if (tcg_regset_single(set)) { 3234b016486eSRichard Henderson /* One register in the set. 
*/ 3235b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 3236b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL) { 3237c896fe29Sbellard return reg; 3238c896fe29Sbellard } 3239b016486eSRichard Henderson } else { 324091478cefSRichard Henderson for (i = 0; i < n; i++) { 3241b016486eSRichard Henderson TCGReg reg = order[i]; 3242b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL && 3243b016486eSRichard Henderson tcg_regset_test_reg(set, reg)) { 3244b016486eSRichard Henderson return reg; 3245b016486eSRichard Henderson } 3246b016486eSRichard Henderson } 3247b016486eSRichard Henderson } 3248b016486eSRichard Henderson } 3249b016486eSRichard Henderson 3250b016486eSRichard Henderson /* We must spill something. */ 3251b016486eSRichard Henderson for (j = f; j < 2; j++) { 3252b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 3253b016486eSRichard Henderson 3254b016486eSRichard Henderson if (tcg_regset_single(set)) { 3255b016486eSRichard Henderson /* One register in the set. 
*/ 3256b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 3257b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3258c896fe29Sbellard return reg; 3259b016486eSRichard Henderson } else { 3260b016486eSRichard Henderson for (i = 0; i < n; i++) { 3261b016486eSRichard Henderson TCGReg reg = order[i]; 3262b016486eSRichard Henderson if (tcg_regset_test_reg(set, reg)) { 3263b016486eSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3264b016486eSRichard Henderson return reg; 3265b016486eSRichard Henderson } 3266b016486eSRichard Henderson } 3267c896fe29Sbellard } 3268c896fe29Sbellard } 3269c896fe29Sbellard 3270c896fe29Sbellard tcg_abort(); 3271c896fe29Sbellard } 3272c896fe29Sbellard 327329f5e925SRichard Henderson static TCGReg tcg_reg_alloc_pair(TCGContext *s, TCGRegSet required_regs, 327429f5e925SRichard Henderson TCGRegSet allocated_regs, 327529f5e925SRichard Henderson TCGRegSet preferred_regs, bool rev) 327629f5e925SRichard Henderson { 327729f5e925SRichard Henderson int i, j, k, fmin, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 327829f5e925SRichard Henderson TCGRegSet reg_ct[2]; 327929f5e925SRichard Henderson const int *order; 328029f5e925SRichard Henderson 328129f5e925SRichard Henderson /* Ensure that if I is not in allocated_regs, I+1 is not either. */ 328229f5e925SRichard Henderson reg_ct[1] = required_regs & ~(allocated_regs | (allocated_regs >> 1)); 328329f5e925SRichard Henderson tcg_debug_assert(reg_ct[1] != 0); 328429f5e925SRichard Henderson reg_ct[0] = reg_ct[1] & preferred_regs; 328529f5e925SRichard Henderson 328629f5e925SRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 328729f5e925SRichard Henderson 328829f5e925SRichard Henderson /* 328929f5e925SRichard Henderson * Skip the preferred_regs option if it cannot be satisfied, 329029f5e925SRichard Henderson * or if the preference made no difference. 
329129f5e925SRichard Henderson */ 329229f5e925SRichard Henderson k = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1]; 329329f5e925SRichard Henderson 329429f5e925SRichard Henderson /* 329529f5e925SRichard Henderson * Minimize the number of flushes by looking for 2 free registers first, 329629f5e925SRichard Henderson * then a single flush, then two flushes. 329729f5e925SRichard Henderson */ 329829f5e925SRichard Henderson for (fmin = 2; fmin >= 0; fmin--) { 329929f5e925SRichard Henderson for (j = k; j < 2; j++) { 330029f5e925SRichard Henderson TCGRegSet set = reg_ct[j]; 330129f5e925SRichard Henderson 330229f5e925SRichard Henderson for (i = 0; i < n; i++) { 330329f5e925SRichard Henderson TCGReg reg = order[i]; 330429f5e925SRichard Henderson 330529f5e925SRichard Henderson if (tcg_regset_test_reg(set, reg)) { 330629f5e925SRichard Henderson int f = !s->reg_to_temp[reg] + !s->reg_to_temp[reg + 1]; 330729f5e925SRichard Henderson if (f >= fmin) { 330829f5e925SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 330929f5e925SRichard Henderson tcg_reg_free(s, reg + 1, allocated_regs); 331029f5e925SRichard Henderson return reg; 331129f5e925SRichard Henderson } 331229f5e925SRichard Henderson } 331329f5e925SRichard Henderson } 331429f5e925SRichard Henderson } 331529f5e925SRichard Henderson } 331629f5e925SRichard Henderson tcg_abort(); 331729f5e925SRichard Henderson } 331829f5e925SRichard Henderson 331940ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 332040ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. 
*/ 332140ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 3322b722452aSRichard Henderson TCGRegSet allocated_regs, TCGRegSet preferred_regs) 332340ae5c62SRichard Henderson { 332440ae5c62SRichard Henderson TCGReg reg; 332540ae5c62SRichard Henderson 332640ae5c62SRichard Henderson switch (ts->val_type) { 332740ae5c62SRichard Henderson case TEMP_VAL_REG: 332840ae5c62SRichard Henderson return; 332940ae5c62SRichard Henderson case TEMP_VAL_CONST: 3330b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3331b722452aSRichard Henderson preferred_regs, ts->indirect_base); 33320a6a8bc8SRichard Henderson if (ts->type <= TCG_TYPE_I64) { 333340ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 33340a6a8bc8SRichard Henderson } else { 33354e186175SRichard Henderson uint64_t val = ts->val; 33364e186175SRichard Henderson MemOp vece = MO_64; 33374e186175SRichard Henderson 33384e186175SRichard Henderson /* 33394e186175SRichard Henderson * Find the minimal vector element that matches the constant. 33404e186175SRichard Henderson * The targets will, in general, have to do this search anyway, 33414e186175SRichard Henderson * do this generically. 
33424e186175SRichard Henderson */ 33434e186175SRichard Henderson if (val == dup_const(MO_8, val)) { 33444e186175SRichard Henderson vece = MO_8; 33454e186175SRichard Henderson } else if (val == dup_const(MO_16, val)) { 33464e186175SRichard Henderson vece = MO_16; 33470b4286ddSRichard Henderson } else if (val == dup_const(MO_32, val)) { 33484e186175SRichard Henderson vece = MO_32; 33494e186175SRichard Henderson } 33504e186175SRichard Henderson 33514e186175SRichard Henderson tcg_out_dupi_vec(s, ts->type, vece, reg, ts->val); 33520a6a8bc8SRichard Henderson } 335340ae5c62SRichard Henderson ts->mem_coherent = 0; 335440ae5c62SRichard Henderson break; 335540ae5c62SRichard Henderson case TEMP_VAL_MEM: 3356b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3357b722452aSRichard Henderson preferred_regs, ts->indirect_base); 335840ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 335940ae5c62SRichard Henderson ts->mem_coherent = 1; 336040ae5c62SRichard Henderson break; 336140ae5c62SRichard Henderson case TEMP_VAL_DEAD: 336240ae5c62SRichard Henderson default: 336340ae5c62SRichard Henderson tcg_abort(); 336440ae5c62SRichard Henderson } 3365098859f1SRichard Henderson set_temp_val_reg(s, ts, reg); 336640ae5c62SRichard Henderson } 336740ae5c62SRichard Henderson 336859d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 3369e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 337059d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 33711ad80729SAurelien Jarno { 33722c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 3373eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. 
*/ 3374e01fa97dSRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || temp_readonly(ts)); 33751ad80729SAurelien Jarno } 33761ad80729SAurelien Jarno 33779814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 3378641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 3379641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 3380641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 3381641d5fbeSbellard { 3382ac3b8891SRichard Henderson int i, n; 3383641d5fbeSbellard 3384ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 3385b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 3386641d5fbeSbellard } 3387e5097dc8Sbellard } 3388e5097dc8Sbellard 33893d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 33903d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 33913d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 33923d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 33933d5c5f87SAurelien Jarno { 3394ac3b8891SRichard Henderson int i, n; 33953d5c5f87SAurelien Jarno 3396ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 339712b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 339812b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 3399ee17db83SRichard Henderson || ts->kind == TEMP_FIXED 340012b9b11aSRichard Henderson || ts->mem_coherent); 34013d5c5f87SAurelien Jarno } 34023d5c5f87SAurelien Jarno } 34033d5c5f87SAurelien Jarno 3404e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 3405e8996ee0Sbellard all globals are stored at their canonical location. 
*/ 3406e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 3407e5097dc8Sbellard { 3408e5097dc8Sbellard int i; 3409e5097dc8Sbellard 3410c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 3411b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 3412c0522136SRichard Henderson 3413c0522136SRichard Henderson switch (ts->kind) { 3414c0522136SRichard Henderson case TEMP_LOCAL: 3415b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 3416c0522136SRichard Henderson break; 3417c0522136SRichard Henderson case TEMP_NORMAL: 3418c7482438SRichard Henderson case TEMP_EBB: 34192c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 3420eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 3421eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3422c0522136SRichard Henderson break; 3423c0522136SRichard Henderson case TEMP_CONST: 3424c0522136SRichard Henderson /* Similarly, we should have freed any allocated register. */ 3425c0522136SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_CONST); 3426c0522136SRichard Henderson break; 3427c0522136SRichard Henderson default: 3428c0522136SRichard Henderson g_assert_not_reached(); 3429c896fe29Sbellard } 3430641d5fbeSbellard } 3431e8996ee0Sbellard 3432e8996ee0Sbellard save_globals(s, allocated_regs); 3433c896fe29Sbellard } 3434c896fe29Sbellard 3435bab1671fSRichard Henderson /* 3436c7482438SRichard Henderson * At a conditional branch, we assume all temporaries are dead unless 3437c7482438SRichard Henderson * explicitly live-across-conditional-branch; all globals and local 3438c7482438SRichard Henderson * temps are synced to their location. 
3439b4cb76e6SRichard Henderson */ 3440b4cb76e6SRichard Henderson static void tcg_reg_alloc_cbranch(TCGContext *s, TCGRegSet allocated_regs) 3441b4cb76e6SRichard Henderson { 3442b4cb76e6SRichard Henderson sync_globals(s, allocated_regs); 3443b4cb76e6SRichard Henderson 3444b4cb76e6SRichard Henderson for (int i = s->nb_globals; i < s->nb_temps; i++) { 3445b4cb76e6SRichard Henderson TCGTemp *ts = &s->temps[i]; 3446b4cb76e6SRichard Henderson /* 3447b4cb76e6SRichard Henderson * The liveness analysis already ensures that temps are dead. 3448b4cb76e6SRichard Henderson * Keep tcg_debug_asserts for safety. 3449b4cb76e6SRichard Henderson */ 3450c0522136SRichard Henderson switch (ts->kind) { 3451c0522136SRichard Henderson case TEMP_LOCAL: 3452b4cb76e6SRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG || ts->mem_coherent); 3453c0522136SRichard Henderson break; 3454c0522136SRichard Henderson case TEMP_NORMAL: 3455b4cb76e6SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3456c0522136SRichard Henderson break; 3457c7482438SRichard Henderson case TEMP_EBB: 3458c0522136SRichard Henderson case TEMP_CONST: 3459c0522136SRichard Henderson break; 3460c0522136SRichard Henderson default: 3461c0522136SRichard Henderson g_assert_not_reached(); 3462b4cb76e6SRichard Henderson } 3463b4cb76e6SRichard Henderson } 3464b4cb76e6SRichard Henderson } 3465b4cb76e6SRichard Henderson 3466b4cb76e6SRichard Henderson /* 3467c58f4c97SRichard Henderson * Specialized code generation for INDEX_op_mov_* with a constant. 3468bab1671fSRichard Henderson */ 34690fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 3470ba87719cSRichard Henderson tcg_target_ulong val, TCGLifeData arg_life, 3471ba87719cSRichard Henderson TCGRegSet preferred_regs) 3472e8996ee0Sbellard { 3473d63e3b6eSRichard Henderson /* ENV should not be modified. 
*/ 3474e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 347559d7c14eSRichard Henderson 347659d7c14eSRichard Henderson /* The movi is not explicitly generated here. */ 3477098859f1SRichard Henderson set_temp_val_nonreg(s, ots, TEMP_VAL_CONST); 3478e8996ee0Sbellard ots->val = val; 347959d7c14eSRichard Henderson ots->mem_coherent = 0; 3480ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 3481ba87719cSRichard Henderson temp_sync(s, ots, s->reserved_regs, preferred_regs, IS_DEAD_ARG(0)); 348259d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 3483f8bf00f1SRichard Henderson temp_dead(s, ots); 34844c4e1ab2SAurelien Jarno } 3485e8996ee0Sbellard } 3486e8996ee0Sbellard 3487bab1671fSRichard Henderson /* 3488bab1671fSRichard Henderson * Specialized code generation for INDEX_op_mov_*. 3489bab1671fSRichard Henderson */ 3490dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op) 3491c896fe29Sbellard { 3492dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 349369e3706dSRichard Henderson TCGRegSet allocated_regs, preferred_regs; 3494c896fe29Sbellard TCGTemp *ts, *ots; 3495450445d5SRichard Henderson TCGType otype, itype; 3496098859f1SRichard Henderson TCGReg oreg, ireg; 3497c896fe29Sbellard 3498d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 349969e3706dSRichard Henderson preferred_regs = op->output_pref[0]; 350043439139SRichard Henderson ots = arg_temp(op->args[0]); 350143439139SRichard Henderson ts = arg_temp(op->args[1]); 3502450445d5SRichard Henderson 3503d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3504e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 3505d63e3b6eSRichard Henderson 3506450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. 
*/ 3507450445d5SRichard Henderson otype = ots->type; 3508450445d5SRichard Henderson itype = ts->type; 3509c896fe29Sbellard 35100fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 35110fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 35120fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 35130fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 35140fe4fca4SPaolo Bonzini temp_dead(s, ts); 35150fe4fca4SPaolo Bonzini } 351669e3706dSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, arg_life, preferred_regs); 35170fe4fca4SPaolo Bonzini return; 35180fe4fca4SPaolo Bonzini } 35190fe4fca4SPaolo Bonzini 35200fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 35210fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 35220fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 35230fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 35240fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 352569e3706dSRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], 352669e3706dSRichard Henderson allocated_regs, preferred_regs); 3527c29c1d7eSAurelien Jarno } 35280fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 3529098859f1SRichard Henderson ireg = ts->reg; 3530098859f1SRichard Henderson 3531d63e3b6eSRichard Henderson if (IS_DEAD_ARG(0)) { 3532c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 3533c29c1d7eSAurelien Jarno liveness analysis disabled). 
*/ 3534eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 3535c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 35362272e4a7SRichard Henderson temp_allocate_frame(s, ots); 3537c29c1d7eSAurelien Jarno } 3538098859f1SRichard Henderson tcg_out_st(s, otype, ireg, ots->mem_base->reg, ots->mem_offset); 3539c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 3540f8bf00f1SRichard Henderson temp_dead(s, ts); 3541c29c1d7eSAurelien Jarno } 3542f8bf00f1SRichard Henderson temp_dead(s, ots); 3543098859f1SRichard Henderson return; 3544098859f1SRichard Henderson } 3545098859f1SRichard Henderson 3546ee17db83SRichard Henderson if (IS_DEAD_ARG(1) && ts->kind != TEMP_FIXED) { 3547098859f1SRichard Henderson /* 3548098859f1SRichard Henderson * The mov can be suppressed. Kill input first, so that it 3549098859f1SRichard Henderson * is unlinked from reg_to_temp, then set the output to the 3550098859f1SRichard Henderson * reg that we saved from the input. 3551098859f1SRichard Henderson */ 3552f8bf00f1SRichard Henderson temp_dead(s, ts); 3553098859f1SRichard Henderson oreg = ireg; 3554c29c1d7eSAurelien Jarno } else { 3555098859f1SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 3556098859f1SRichard Henderson oreg = ots->reg; 3557098859f1SRichard Henderson } else { 3558098859f1SRichard Henderson /* Make sure to not spill the input register during allocation. */ 3559098859f1SRichard Henderson oreg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 3560098859f1SRichard Henderson allocated_regs | ((TCGRegSet)1 << ireg), 3561098859f1SRichard Henderson preferred_regs, ots->indirect_base); 3562c29c1d7eSAurelien Jarno } 3563098859f1SRichard Henderson if (!tcg_out_mov(s, otype, oreg, ireg)) { 3564240c08d0SRichard Henderson /* 3565240c08d0SRichard Henderson * Cross register class move not supported. 3566240c08d0SRichard Henderson * Store the source register into the destination slot 3567240c08d0SRichard Henderson * and leave the destination temp as TEMP_VAL_MEM. 
3568240c08d0SRichard Henderson */ 3569e01fa97dSRichard Henderson assert(!temp_readonly(ots)); 3570240c08d0SRichard Henderson if (!ts->mem_allocated) { 3571240c08d0SRichard Henderson temp_allocate_frame(s, ots); 3572240c08d0SRichard Henderson } 3573098859f1SRichard Henderson tcg_out_st(s, ts->type, ireg, ots->mem_base->reg, ots->mem_offset); 3574098859f1SRichard Henderson set_temp_val_nonreg(s, ts, TEMP_VAL_MEM); 3575240c08d0SRichard Henderson ots->mem_coherent = 1; 3576240c08d0SRichard Henderson return; 357778113e83SRichard Henderson } 3578c29c1d7eSAurelien Jarno } 3579098859f1SRichard Henderson set_temp_val_reg(s, ots, oreg); 3580c896fe29Sbellard ots->mem_coherent = 0; 3581098859f1SRichard Henderson 3582ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 358398b4e186SRichard Henderson temp_sync(s, ots, allocated_regs, 0, 0); 3584c29c1d7eSAurelien Jarno } 3585ec7a869dSAurelien Jarno } 3586c896fe29Sbellard 3587bab1671fSRichard Henderson /* 3588bab1671fSRichard Henderson * Specialized code generation for INDEX_op_dup_vec. 3589bab1671fSRichard Henderson */ 3590bab1671fSRichard Henderson static void tcg_reg_alloc_dup(TCGContext *s, const TCGOp *op) 3591bab1671fSRichard Henderson { 3592bab1671fSRichard Henderson const TCGLifeData arg_life = op->life; 3593bab1671fSRichard Henderson TCGRegSet dup_out_regs, dup_in_regs; 3594bab1671fSRichard Henderson TCGTemp *its, *ots; 3595bab1671fSRichard Henderson TCGType itype, vtype; 3596d6ecb4a9SRichard Henderson intptr_t endian_fixup; 3597bab1671fSRichard Henderson unsigned vece; 3598bab1671fSRichard Henderson bool ok; 3599bab1671fSRichard Henderson 3600bab1671fSRichard Henderson ots = arg_temp(op->args[0]); 3601bab1671fSRichard Henderson its = arg_temp(op->args[1]); 3602bab1671fSRichard Henderson 3603bab1671fSRichard Henderson /* ENV should not be modified. 
*/ 3604e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 3605bab1671fSRichard Henderson 3606bab1671fSRichard Henderson itype = its->type; 3607bab1671fSRichard Henderson vece = TCGOP_VECE(op); 3608bab1671fSRichard Henderson vtype = TCGOP_VECL(op) + TCG_TYPE_V64; 3609bab1671fSRichard Henderson 3610bab1671fSRichard Henderson if (its->val_type == TEMP_VAL_CONST) { 3611bab1671fSRichard Henderson /* Propagate constant via movi -> dupi. */ 3612bab1671fSRichard Henderson tcg_target_ulong val = its->val; 3613bab1671fSRichard Henderson if (IS_DEAD_ARG(1)) { 3614bab1671fSRichard Henderson temp_dead(s, its); 3615bab1671fSRichard Henderson } 3616bab1671fSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, arg_life, op->output_pref[0]); 3617bab1671fSRichard Henderson return; 3618bab1671fSRichard Henderson } 3619bab1671fSRichard Henderson 36209be0d080SRichard Henderson dup_out_regs = tcg_op_defs[INDEX_op_dup_vec].args_ct[0].regs; 36219be0d080SRichard Henderson dup_in_regs = tcg_op_defs[INDEX_op_dup_vec].args_ct[1].regs; 3622bab1671fSRichard Henderson 3623bab1671fSRichard Henderson /* Allocate the output register now. */ 3624bab1671fSRichard Henderson if (ots->val_type != TEMP_VAL_REG) { 3625bab1671fSRichard Henderson TCGRegSet allocated_regs = s->reserved_regs; 3626098859f1SRichard Henderson TCGReg oreg; 3627bab1671fSRichard Henderson 3628bab1671fSRichard Henderson if (!IS_DEAD_ARG(1) && its->val_type == TEMP_VAL_REG) { 3629bab1671fSRichard Henderson /* Make sure to not spill the input register. 
*/ 3630bab1671fSRichard Henderson tcg_regset_set_reg(allocated_regs, its->reg); 3631bab1671fSRichard Henderson } 3632098859f1SRichard Henderson oreg = tcg_reg_alloc(s, dup_out_regs, allocated_regs, 3633bab1671fSRichard Henderson op->output_pref[0], ots->indirect_base); 3634098859f1SRichard Henderson set_temp_val_reg(s, ots, oreg); 3635bab1671fSRichard Henderson } 3636bab1671fSRichard Henderson 3637bab1671fSRichard Henderson switch (its->val_type) { 3638bab1671fSRichard Henderson case TEMP_VAL_REG: 3639bab1671fSRichard Henderson /* 3640bab1671fSRichard Henderson * The dup constriaints must be broad, covering all possible VECE. 3641bab1671fSRichard Henderson * However, tcg_op_dup_vec() gets to see the VECE and we allow it 3642bab1671fSRichard Henderson * to fail, indicating that extra moves are required for that case. 3643bab1671fSRichard Henderson */ 3644bab1671fSRichard Henderson if (tcg_regset_test_reg(dup_in_regs, its->reg)) { 3645bab1671fSRichard Henderson if (tcg_out_dup_vec(s, vtype, vece, ots->reg, its->reg)) { 3646bab1671fSRichard Henderson goto done; 3647bab1671fSRichard Henderson } 3648bab1671fSRichard Henderson /* Try again from memory or a vector input register. */ 3649bab1671fSRichard Henderson } 3650bab1671fSRichard Henderson if (!its->mem_coherent) { 3651bab1671fSRichard Henderson /* 3652bab1671fSRichard Henderson * The input register is not synced, and so an extra store 3653bab1671fSRichard Henderson * would be required to use memory. Attempt an integer-vector 3654bab1671fSRichard Henderson * register move first. We do not have a TCGRegSet for this. 3655bab1671fSRichard Henderson */ 3656bab1671fSRichard Henderson if (tcg_out_mov(s, itype, ots->reg, its->reg)) { 3657bab1671fSRichard Henderson break; 3658bab1671fSRichard Henderson } 3659bab1671fSRichard Henderson /* Sync the temp back to its slot and load from there. 
*/ 3660bab1671fSRichard Henderson temp_sync(s, its, s->reserved_regs, 0, 0); 3661bab1671fSRichard Henderson } 3662bab1671fSRichard Henderson /* fall through */ 3663bab1671fSRichard Henderson 3664bab1671fSRichard Henderson case TEMP_VAL_MEM: 3665e03b5686SMarc-André Lureau #if HOST_BIG_ENDIAN 3666d6ecb4a9SRichard Henderson endian_fixup = itype == TCG_TYPE_I32 ? 4 : 8; 3667d6ecb4a9SRichard Henderson endian_fixup -= 1 << vece; 3668d6ecb4a9SRichard Henderson #else 3669d6ecb4a9SRichard Henderson endian_fixup = 0; 3670d6ecb4a9SRichard Henderson #endif 3671098859f1SRichard Henderson /* Attempt to dup directly from the input memory slot. */ 3672d6ecb4a9SRichard Henderson if (tcg_out_dupm_vec(s, vtype, vece, ots->reg, its->mem_base->reg, 3673d6ecb4a9SRichard Henderson its->mem_offset + endian_fixup)) { 3674d6ecb4a9SRichard Henderson goto done; 3675d6ecb4a9SRichard Henderson } 3676098859f1SRichard Henderson /* Load the input into the destination vector register. */ 3677bab1671fSRichard Henderson tcg_out_ld(s, itype, ots->reg, its->mem_base->reg, its->mem_offset); 3678bab1671fSRichard Henderson break; 3679bab1671fSRichard Henderson 3680bab1671fSRichard Henderson default: 3681bab1671fSRichard Henderson g_assert_not_reached(); 3682bab1671fSRichard Henderson } 3683bab1671fSRichard Henderson 3684bab1671fSRichard Henderson /* We now have a vector input register, so dup must succeed. 
*/ 3685bab1671fSRichard Henderson ok = tcg_out_dup_vec(s, vtype, vece, ots->reg, ots->reg); 3686bab1671fSRichard Henderson tcg_debug_assert(ok); 3687bab1671fSRichard Henderson 3688bab1671fSRichard Henderson done: 368936f5539cSRichard Henderson ots->mem_coherent = 0; 3690bab1671fSRichard Henderson if (IS_DEAD_ARG(1)) { 3691bab1671fSRichard Henderson temp_dead(s, its); 3692bab1671fSRichard Henderson } 3693bab1671fSRichard Henderson if (NEED_SYNC_ARG(0)) { 3694bab1671fSRichard Henderson temp_sync(s, ots, s->reserved_regs, 0, 0); 3695bab1671fSRichard Henderson } 3696bab1671fSRichard Henderson if (IS_DEAD_ARG(0)) { 3697bab1671fSRichard Henderson temp_dead(s, ots); 3698bab1671fSRichard Henderson } 3699bab1671fSRichard Henderson } 3700bab1671fSRichard Henderson 3701dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op) 3702c896fe29Sbellard { 3703dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3704dd186292SRichard Henderson const TCGOpDef * const def = &tcg_op_defs[op->opc]; 370582790a87SRichard Henderson TCGRegSet i_allocated_regs; 370682790a87SRichard Henderson TCGRegSet o_allocated_regs; 3707b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 3708b6638662SRichard Henderson TCGReg reg; 3709c896fe29Sbellard TCGArg arg; 3710c896fe29Sbellard const TCGArgConstraint *arg_ct; 3711c896fe29Sbellard TCGTemp *ts; 3712c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 3713c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 3714c896fe29Sbellard 3715c896fe29Sbellard nb_oargs = def->nb_oargs; 3716c896fe29Sbellard nb_iargs = def->nb_iargs; 3717c896fe29Sbellard 3718c896fe29Sbellard /* copy constants */ 3719c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 3720dd186292SRichard Henderson op->args + nb_oargs + nb_iargs, 3721c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 3722c896fe29Sbellard 3723d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 3724d21369f5SRichard Henderson o_allocated_regs = s->reserved_regs; 
372582790a87SRichard Henderson 3726c896fe29Sbellard /* satisfy input constraints */ 3727c896fe29Sbellard for (k = 0; k < nb_iargs; k++) { 372829f5e925SRichard Henderson TCGRegSet i_preferred_regs, i_required_regs; 372929f5e925SRichard Henderson bool allocate_new_reg, copyto_new_reg; 373029f5e925SRichard Henderson TCGTemp *ts2; 373129f5e925SRichard Henderson int i1, i2; 3732d62816f2SRichard Henderson 373366792f90SRichard Henderson i = def->args_ct[nb_oargs + k].sort_index; 3734dd186292SRichard Henderson arg = op->args[i]; 3735c896fe29Sbellard arg_ct = &def->args_ct[i]; 373643439139SRichard Henderson ts = arg_temp(arg); 373740ae5c62SRichard Henderson 373840ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 3739a4fbbd77SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct->ct)) { 3740c896fe29Sbellard /* constant is OK for instruction */ 3741c896fe29Sbellard const_args[i] = 1; 3742c896fe29Sbellard new_args[i] = ts->val; 3743d62816f2SRichard Henderson continue; 3744c896fe29Sbellard } 374540ae5c62SRichard Henderson 37461c1824dcSRichard Henderson reg = ts->reg; 37471c1824dcSRichard Henderson i_preferred_regs = 0; 374829f5e925SRichard Henderson i_required_regs = arg_ct->regs; 37491c1824dcSRichard Henderson allocate_new_reg = false; 375029f5e925SRichard Henderson copyto_new_reg = false; 37511c1824dcSRichard Henderson 375229f5e925SRichard Henderson switch (arg_ct->pair) { 375329f5e925SRichard Henderson case 0: /* not paired */ 3754bc2b17e6SRichard Henderson if (arg_ct->ialias) { 37551c1824dcSRichard Henderson i_preferred_regs = op->output_pref[arg_ct->alias_index]; 3756c0522136SRichard Henderson 3757c0522136SRichard Henderson /* 3758c0522136SRichard Henderson * If the input is readonly, then it cannot also be an 3759c0522136SRichard Henderson * output and aliased to itself. If the input is not 3760c0522136SRichard Henderson * dead after the instruction, we must allocate a new 3761c0522136SRichard Henderson * register and move it. 
3762c0522136SRichard Henderson */ 3763c0522136SRichard Henderson if (temp_readonly(ts) || !IS_DEAD_ARG(i)) { 37641c1824dcSRichard Henderson allocate_new_reg = true; 37651c1824dcSRichard Henderson } else if (ts->val_type == TEMP_VAL_REG) { 3766c0522136SRichard Henderson /* 37671c1824dcSRichard Henderson * Check if the current register has already been 37681c1824dcSRichard Henderson * allocated for another input. 3769c0522136SRichard Henderson */ 377029f5e925SRichard Henderson allocate_new_reg = 377129f5e925SRichard Henderson tcg_regset_test_reg(i_allocated_regs, reg); 37727e1df267SAurelien Jarno } 37737e1df267SAurelien Jarno } 37741c1824dcSRichard Henderson if (!allocate_new_reg) { 377529f5e925SRichard Henderson temp_load(s, ts, i_required_regs, i_allocated_regs, 377629f5e925SRichard Henderson i_preferred_regs); 3777c896fe29Sbellard reg = ts->reg; 377829f5e925SRichard Henderson allocate_new_reg = !tcg_regset_test_reg(i_required_regs, reg); 37791c1824dcSRichard Henderson } 37801c1824dcSRichard Henderson if (allocate_new_reg) { 3781c0522136SRichard Henderson /* 3782c0522136SRichard Henderson * Allocate a new register matching the constraint 3783c0522136SRichard Henderson * and move the temporary register into it. 3784c0522136SRichard Henderson */ 3785d62816f2SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 3786d62816f2SRichard Henderson i_allocated_regs, 0); 378729f5e925SRichard Henderson reg = tcg_reg_alloc(s, i_required_regs, i_allocated_regs, 37881c1824dcSRichard Henderson i_preferred_regs, ts->indirect_base); 378929f5e925SRichard Henderson copyto_new_reg = true; 379029f5e925SRichard Henderson } 379129f5e925SRichard Henderson break; 379229f5e925SRichard Henderson 379329f5e925SRichard Henderson case 1: 379429f5e925SRichard Henderson /* First of an input pair; if i1 == i2, the second is an output. */ 379529f5e925SRichard Henderson i1 = i; 379629f5e925SRichard Henderson i2 = arg_ct->pair_index; 379729f5e925SRichard Henderson ts2 = i1 != i2 ? 
arg_temp(op->args[i2]) : NULL; 379829f5e925SRichard Henderson 379929f5e925SRichard Henderson /* 380029f5e925SRichard Henderson * It is easier to default to allocating a new pair 380129f5e925SRichard Henderson * and to identify a few cases where it's not required. 380229f5e925SRichard Henderson */ 380329f5e925SRichard Henderson if (arg_ct->ialias) { 380429f5e925SRichard Henderson i_preferred_regs = op->output_pref[arg_ct->alias_index]; 380529f5e925SRichard Henderson if (IS_DEAD_ARG(i1) && 380629f5e925SRichard Henderson IS_DEAD_ARG(i2) && 380729f5e925SRichard Henderson !temp_readonly(ts) && 380829f5e925SRichard Henderson ts->val_type == TEMP_VAL_REG && 380929f5e925SRichard Henderson ts->reg < TCG_TARGET_NB_REGS - 1 && 381029f5e925SRichard Henderson tcg_regset_test_reg(i_required_regs, reg) && 381129f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg) && 381229f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg + 1) && 381329f5e925SRichard Henderson (ts2 381429f5e925SRichard Henderson ? ts2->val_type == TEMP_VAL_REG && 381529f5e925SRichard Henderson ts2->reg == reg + 1 && 381629f5e925SRichard Henderson !temp_readonly(ts2) 381729f5e925SRichard Henderson : s->reg_to_temp[reg + 1] == NULL)) { 381829f5e925SRichard Henderson break; 381929f5e925SRichard Henderson } 382029f5e925SRichard Henderson } else { 382129f5e925SRichard Henderson /* Without aliasing, the pair must also be an input. 
*/ 382229f5e925SRichard Henderson tcg_debug_assert(ts2); 382329f5e925SRichard Henderson if (ts->val_type == TEMP_VAL_REG && 382429f5e925SRichard Henderson ts2->val_type == TEMP_VAL_REG && 382529f5e925SRichard Henderson ts2->reg == reg + 1 && 382629f5e925SRichard Henderson tcg_regset_test_reg(i_required_regs, reg)) { 382729f5e925SRichard Henderson break; 382829f5e925SRichard Henderson } 382929f5e925SRichard Henderson } 383029f5e925SRichard Henderson reg = tcg_reg_alloc_pair(s, i_required_regs, i_allocated_regs, 383129f5e925SRichard Henderson 0, ts->indirect_base); 383229f5e925SRichard Henderson goto do_pair; 383329f5e925SRichard Henderson 383429f5e925SRichard Henderson case 2: /* pair second */ 383529f5e925SRichard Henderson reg = new_args[arg_ct->pair_index] + 1; 383629f5e925SRichard Henderson goto do_pair; 383729f5e925SRichard Henderson 383829f5e925SRichard Henderson case 3: /* ialias with second output, no first input */ 383929f5e925SRichard Henderson tcg_debug_assert(arg_ct->ialias); 384029f5e925SRichard Henderson i_preferred_regs = op->output_pref[arg_ct->alias_index]; 384129f5e925SRichard Henderson 384229f5e925SRichard Henderson if (IS_DEAD_ARG(i) && 384329f5e925SRichard Henderson !temp_readonly(ts) && 384429f5e925SRichard Henderson ts->val_type == TEMP_VAL_REG && 384529f5e925SRichard Henderson reg > 0 && 384629f5e925SRichard Henderson s->reg_to_temp[reg - 1] == NULL && 384729f5e925SRichard Henderson tcg_regset_test_reg(i_required_regs, reg) && 384829f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg) && 384929f5e925SRichard Henderson !tcg_regset_test_reg(i_allocated_regs, reg - 1)) { 385029f5e925SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg - 1); 385129f5e925SRichard Henderson break; 385229f5e925SRichard Henderson } 385329f5e925SRichard Henderson reg = tcg_reg_alloc_pair(s, i_required_regs >> 1, 385429f5e925SRichard Henderson i_allocated_regs, 0, 385529f5e925SRichard Henderson ts->indirect_base); 385629f5e925SRichard Henderson 
tcg_regset_set_reg(i_allocated_regs, reg); 385729f5e925SRichard Henderson reg += 1; 385829f5e925SRichard Henderson goto do_pair; 385929f5e925SRichard Henderson 386029f5e925SRichard Henderson do_pair: 386129f5e925SRichard Henderson /* 386229f5e925SRichard Henderson * If an aliased input is not dead after the instruction, 386329f5e925SRichard Henderson * we must allocate a new register and move it. 386429f5e925SRichard Henderson */ 386529f5e925SRichard Henderson if (arg_ct->ialias && (!IS_DEAD_ARG(i) || temp_readonly(ts))) { 386629f5e925SRichard Henderson TCGRegSet t_allocated_regs = i_allocated_regs; 386729f5e925SRichard Henderson 386829f5e925SRichard Henderson /* 386929f5e925SRichard Henderson * Because of the alias, and the continued life, make sure 387029f5e925SRichard Henderson * that the temp is somewhere *other* than the reg pair, 387129f5e925SRichard Henderson * and we get a copy in reg. 387229f5e925SRichard Henderson */ 387329f5e925SRichard Henderson tcg_regset_set_reg(t_allocated_regs, reg); 387429f5e925SRichard Henderson tcg_regset_set_reg(t_allocated_regs, reg + 1); 387529f5e925SRichard Henderson if (ts->val_type == TEMP_VAL_REG && ts->reg == reg) { 387629f5e925SRichard Henderson /* If ts was already in reg, copy it somewhere else. 
*/ 387729f5e925SRichard Henderson TCGReg nr; 387829f5e925SRichard Henderson bool ok; 387929f5e925SRichard Henderson 388029f5e925SRichard Henderson tcg_debug_assert(ts->kind != TEMP_FIXED); 388129f5e925SRichard Henderson nr = tcg_reg_alloc(s, tcg_target_available_regs[ts->type], 388229f5e925SRichard Henderson t_allocated_regs, 0, ts->indirect_base); 388329f5e925SRichard Henderson ok = tcg_out_mov(s, ts->type, nr, reg); 388429f5e925SRichard Henderson tcg_debug_assert(ok); 388529f5e925SRichard Henderson 388629f5e925SRichard Henderson set_temp_val_reg(s, ts, nr); 388729f5e925SRichard Henderson } else { 388829f5e925SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 388929f5e925SRichard Henderson t_allocated_regs, 0); 389029f5e925SRichard Henderson copyto_new_reg = true; 389129f5e925SRichard Henderson } 389229f5e925SRichard Henderson } else { 389329f5e925SRichard Henderson /* Preferably allocate to reg, otherwise copy. */ 389429f5e925SRichard Henderson i_required_regs = (TCGRegSet)1 << reg; 389529f5e925SRichard Henderson temp_load(s, ts, i_required_regs, i_allocated_regs, 389629f5e925SRichard Henderson i_preferred_regs); 389729f5e925SRichard Henderson copyto_new_reg = ts->reg != reg; 389829f5e925SRichard Henderson } 389929f5e925SRichard Henderson break; 390029f5e925SRichard Henderson 390129f5e925SRichard Henderson default: 390229f5e925SRichard Henderson g_assert_not_reached(); 390329f5e925SRichard Henderson } 390429f5e925SRichard Henderson 390529f5e925SRichard Henderson if (copyto_new_reg) { 390678113e83SRichard Henderson if (!tcg_out_mov(s, ts->type, reg, ts->reg)) { 3907240c08d0SRichard Henderson /* 3908240c08d0SRichard Henderson * Cross register class move not supported. Sync the 3909240c08d0SRichard Henderson * temp back to its slot and load from there. 
3910240c08d0SRichard Henderson */ 3911240c08d0SRichard Henderson temp_sync(s, ts, i_allocated_regs, 0, 0); 3912240c08d0SRichard Henderson tcg_out_ld(s, ts->type, reg, 3913240c08d0SRichard Henderson ts->mem_base->reg, ts->mem_offset); 391478113e83SRichard Henderson } 3915c896fe29Sbellard } 3916c896fe29Sbellard new_args[i] = reg; 3917c896fe29Sbellard const_args[i] = 0; 391882790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 3919c896fe29Sbellard } 3920c896fe29Sbellard 3921c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3922866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 3923866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 392443439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3925c896fe29Sbellard } 3926c896fe29Sbellard } 3927c896fe29Sbellard 3928b4cb76e6SRichard Henderson if (def->flags & TCG_OPF_COND_BRANCH) { 3929b4cb76e6SRichard Henderson tcg_reg_alloc_cbranch(s, i_allocated_regs); 3930b4cb76e6SRichard Henderson } else if (def->flags & TCG_OPF_BB_END) { 393182790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 3932a52ad07eSAurelien Jarno } else { 3933c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 3934b03cce8eSbellard /* XXX: permit generic clobber register list ? */ 3935c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3936c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 393782790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 3938c896fe29Sbellard } 3939c896fe29Sbellard } 39403d5c5f87SAurelien Jarno } 39413d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 39423d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 39433d5c5f87SAurelien Jarno an exception. 
*/ 394482790a87SRichard Henderson sync_globals(s, i_allocated_regs); 3945c896fe29Sbellard } 3946c896fe29Sbellard 3947c896fe29Sbellard /* satisfy the output constraints */ 3948c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 394966792f90SRichard Henderson i = def->args_ct[k].sort_index; 3950dd186292SRichard Henderson arg = op->args[i]; 3951c896fe29Sbellard arg_ct = &def->args_ct[i]; 395243439139SRichard Henderson ts = arg_temp(arg); 3953d63e3b6eSRichard Henderson 3954d63e3b6eSRichard Henderson /* ENV should not be modified. */ 3955e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 3956d63e3b6eSRichard Henderson 395729f5e925SRichard Henderson switch (arg_ct->pair) { 395829f5e925SRichard Henderson case 0: /* not paired */ 3959bc2b17e6SRichard Henderson if (arg_ct->oalias && !const_args[arg_ct->alias_index]) { 39605ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 3961bc2b17e6SRichard Henderson } else if (arg_ct->newreg) { 39629be0d080SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->regs, 396382790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 396469e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3965c896fe29Sbellard } else { 39669be0d080SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->regs, o_allocated_regs, 396769e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3968c896fe29Sbellard } 396929f5e925SRichard Henderson break; 397029f5e925SRichard Henderson 397129f5e925SRichard Henderson case 1: /* first of pair */ 397229f5e925SRichard Henderson tcg_debug_assert(!arg_ct->newreg); 397329f5e925SRichard Henderson if (arg_ct->oalias) { 397429f5e925SRichard Henderson reg = new_args[arg_ct->alias_index]; 397529f5e925SRichard Henderson break; 397629f5e925SRichard Henderson } 397729f5e925SRichard Henderson reg = tcg_reg_alloc_pair(s, arg_ct->regs, o_allocated_regs, 397829f5e925SRichard Henderson op->output_pref[k], ts->indirect_base); 397929f5e925SRichard Henderson break; 398029f5e925SRichard Henderson 
398129f5e925SRichard Henderson case 2: /* second of pair */ 398229f5e925SRichard Henderson tcg_debug_assert(!arg_ct->newreg); 398329f5e925SRichard Henderson if (arg_ct->oalias) { 398429f5e925SRichard Henderson reg = new_args[arg_ct->alias_index]; 398529f5e925SRichard Henderson } else { 398629f5e925SRichard Henderson reg = new_args[arg_ct->pair_index] + 1; 398729f5e925SRichard Henderson } 398829f5e925SRichard Henderson break; 398929f5e925SRichard Henderson 399029f5e925SRichard Henderson case 3: /* first of pair, aliasing with a second input */ 399129f5e925SRichard Henderson tcg_debug_assert(!arg_ct->newreg); 399229f5e925SRichard Henderson reg = new_args[arg_ct->pair_index] - 1; 399329f5e925SRichard Henderson break; 399429f5e925SRichard Henderson 399529f5e925SRichard Henderson default: 399629f5e925SRichard Henderson g_assert_not_reached(); 399729f5e925SRichard Henderson } 399882790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 3999098859f1SRichard Henderson set_temp_val_reg(s, ts, reg); 4000c896fe29Sbellard ts->mem_coherent = 0; 4001c896fe29Sbellard new_args[i] = reg; 4002c896fe29Sbellard } 4003e8996ee0Sbellard } 4004c896fe29Sbellard 4005c896fe29Sbellard /* emit instruction */ 4006d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 4007d2fd745fSRichard Henderson tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op), 4008d2fd745fSRichard Henderson new_args, const_args); 4009d2fd745fSRichard Henderson } else { 4010dd186292SRichard Henderson tcg_out_op(s, op->opc, new_args, const_args); 4011d2fd745fSRichard Henderson } 4012c896fe29Sbellard 4013c896fe29Sbellard /* move the outputs in the correct register if needed */ 4014c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 401543439139SRichard Henderson ts = arg_temp(op->args[i]); 4016d63e3b6eSRichard Henderson 4017d63e3b6eSRichard Henderson /* ENV should not be modified. 
*/ 4018e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 4019d63e3b6eSRichard Henderson 4020ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 402198b4e186SRichard Henderson temp_sync(s, ts, o_allocated_regs, 0, IS_DEAD_ARG(i)); 402259d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 4023f8bf00f1SRichard Henderson temp_dead(s, ts); 4024ec7a869dSAurelien Jarno } 4025c896fe29Sbellard } 4026c896fe29Sbellard } 4027c896fe29Sbellard 4028efe86b21SRichard Henderson static bool tcg_reg_alloc_dup2(TCGContext *s, const TCGOp *op) 4029efe86b21SRichard Henderson { 4030efe86b21SRichard Henderson const TCGLifeData arg_life = op->life; 4031efe86b21SRichard Henderson TCGTemp *ots, *itsl, *itsh; 4032efe86b21SRichard Henderson TCGType vtype = TCGOP_VECL(op) + TCG_TYPE_V64; 4033efe86b21SRichard Henderson 4034efe86b21SRichard Henderson /* This opcode is only valid for 32-bit hosts, for 64-bit elements. */ 4035efe86b21SRichard Henderson tcg_debug_assert(TCG_TARGET_REG_BITS == 32); 4036efe86b21SRichard Henderson tcg_debug_assert(TCGOP_VECE(op) == MO_64); 4037efe86b21SRichard Henderson 4038efe86b21SRichard Henderson ots = arg_temp(op->args[0]); 4039efe86b21SRichard Henderson itsl = arg_temp(op->args[1]); 4040efe86b21SRichard Henderson itsh = arg_temp(op->args[2]); 4041efe86b21SRichard Henderson 4042efe86b21SRichard Henderson /* ENV should not be modified. */ 4043efe86b21SRichard Henderson tcg_debug_assert(!temp_readonly(ots)); 4044efe86b21SRichard Henderson 4045efe86b21SRichard Henderson /* Allocate the output register now. */ 4046efe86b21SRichard Henderson if (ots->val_type != TEMP_VAL_REG) { 4047efe86b21SRichard Henderson TCGRegSet allocated_regs = s->reserved_regs; 4048efe86b21SRichard Henderson TCGRegSet dup_out_regs = 4049efe86b21SRichard Henderson tcg_op_defs[INDEX_op_dup_vec].args_ct[0].regs; 4050098859f1SRichard Henderson TCGReg oreg; 4051efe86b21SRichard Henderson 4052efe86b21SRichard Henderson /* Make sure to not spill the input registers. 
*/ 4053efe86b21SRichard Henderson if (!IS_DEAD_ARG(1) && itsl->val_type == TEMP_VAL_REG) { 4054efe86b21SRichard Henderson tcg_regset_set_reg(allocated_regs, itsl->reg); 4055efe86b21SRichard Henderson } 4056efe86b21SRichard Henderson if (!IS_DEAD_ARG(2) && itsh->val_type == TEMP_VAL_REG) { 4057efe86b21SRichard Henderson tcg_regset_set_reg(allocated_regs, itsh->reg); 4058efe86b21SRichard Henderson } 4059efe86b21SRichard Henderson 4060098859f1SRichard Henderson oreg = tcg_reg_alloc(s, dup_out_regs, allocated_regs, 4061efe86b21SRichard Henderson op->output_pref[0], ots->indirect_base); 4062098859f1SRichard Henderson set_temp_val_reg(s, ots, oreg); 4063efe86b21SRichard Henderson } 4064efe86b21SRichard Henderson 4065efe86b21SRichard Henderson /* Promote dup2 of immediates to dupi_vec. */ 4066efe86b21SRichard Henderson if (itsl->val_type == TEMP_VAL_CONST && itsh->val_type == TEMP_VAL_CONST) { 4067efe86b21SRichard Henderson uint64_t val = deposit64(itsl->val, 32, 32, itsh->val); 4068efe86b21SRichard Henderson MemOp vece = MO_64; 4069efe86b21SRichard Henderson 4070efe86b21SRichard Henderson if (val == dup_const(MO_8, val)) { 4071efe86b21SRichard Henderson vece = MO_8; 4072efe86b21SRichard Henderson } else if (val == dup_const(MO_16, val)) { 4073efe86b21SRichard Henderson vece = MO_16; 4074efe86b21SRichard Henderson } else if (val == dup_const(MO_32, val)) { 4075efe86b21SRichard Henderson vece = MO_32; 4076efe86b21SRichard Henderson } 4077efe86b21SRichard Henderson 4078efe86b21SRichard Henderson tcg_out_dupi_vec(s, vtype, vece, ots->reg, val); 4079efe86b21SRichard Henderson goto done; 4080efe86b21SRichard Henderson } 4081efe86b21SRichard Henderson 4082efe86b21SRichard Henderson /* If the two inputs form one 64-bit value, try dupm_vec. */ 4083*aef85402SRichard Henderson if (itsl->temp_subindex == HOST_BIG_ENDIAN && 4084*aef85402SRichard Henderson itsh->temp_subindex == !HOST_BIG_ENDIAN && 4085*aef85402SRichard Henderson itsl == itsh + (HOST_BIG_ENDIAN ? 
1 : -1)) { 4086*aef85402SRichard Henderson TCGTemp *its = itsl - HOST_BIG_ENDIAN; 4087*aef85402SRichard Henderson 4088*aef85402SRichard Henderson temp_sync(s, its + 0, s->reserved_regs, 0, 0); 4089*aef85402SRichard Henderson temp_sync(s, its + 1, s->reserved_regs, 0, 0); 4090*aef85402SRichard Henderson 4091efe86b21SRichard Henderson if (tcg_out_dupm_vec(s, vtype, MO_64, ots->reg, 4092efe86b21SRichard Henderson its->mem_base->reg, its->mem_offset)) { 4093efe86b21SRichard Henderson goto done; 4094efe86b21SRichard Henderson } 4095efe86b21SRichard Henderson } 4096efe86b21SRichard Henderson 4097efe86b21SRichard Henderson /* Fall back to generic expansion. */ 4098efe86b21SRichard Henderson return false; 4099efe86b21SRichard Henderson 4100efe86b21SRichard Henderson done: 410136f5539cSRichard Henderson ots->mem_coherent = 0; 4102efe86b21SRichard Henderson if (IS_DEAD_ARG(1)) { 4103efe86b21SRichard Henderson temp_dead(s, itsl); 4104efe86b21SRichard Henderson } 4105efe86b21SRichard Henderson if (IS_DEAD_ARG(2)) { 4106efe86b21SRichard Henderson temp_dead(s, itsh); 4107efe86b21SRichard Henderson } 4108efe86b21SRichard Henderson if (NEED_SYNC_ARG(0)) { 4109efe86b21SRichard Henderson temp_sync(s, ots, s->reserved_regs, 0, IS_DEAD_ARG(0)); 4110efe86b21SRichard Henderson } else if (IS_DEAD_ARG(0)) { 4111efe86b21SRichard Henderson temp_dead(s, ots); 4112efe86b21SRichard Henderson } 4113efe86b21SRichard Henderson return true; 4114efe86b21SRichard Henderson } 4115efe86b21SRichard Henderson 4116dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op) 4117c896fe29Sbellard { 4118cd9090aaSRichard Henderson const int nb_oargs = TCGOP_CALLO(op); 4119cd9090aaSRichard Henderson const int nb_iargs = TCGOP_CALLI(op); 4120dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 41217b7d8b2dSRichard Henderson const TCGHelperInfo *info; 4122b6638662SRichard Henderson int flags, nb_regs, i; 4123b6638662SRichard Henderson TCGReg reg; 4124cf066674SRichard 
Henderson TCGArg arg; 4125c896fe29Sbellard TCGTemp *ts; 4126d3452f1fSRichard Henderson intptr_t stack_offset; 4127d3452f1fSRichard Henderson size_t call_stack_size; 4128cf066674SRichard Henderson tcg_insn_unit *func_addr; 4129cf066674SRichard Henderson int allocate_args; 4130c896fe29Sbellard TCGRegSet allocated_regs; 4131c896fe29Sbellard 4132fa52e660SRichard Henderson func_addr = tcg_call_func(op); 41337b7d8b2dSRichard Henderson info = tcg_call_info(op); 41347b7d8b2dSRichard Henderson flags = info->flags; 4135c896fe29Sbellard 41366e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 4137c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 4138c45cb8bbSRichard Henderson nb_regs = nb_iargs; 4139cf066674SRichard Henderson } 4140c896fe29Sbellard 4141c896fe29Sbellard /* assign stack slots first */ 4142c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 4143c896fe29Sbellard call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) & 4144c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 4145b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 4146b03cce8eSbellard if (allocate_args) { 4147345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 4148345649c0SBlue Swirl preallocate call stack */ 4149345649c0SBlue Swirl tcg_abort(); 4150b03cce8eSbellard } 415139cf05d3Sbellard 415239cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 4153c45cb8bbSRichard Henderson for (i = nb_regs; i < nb_iargs; i++) { 4154dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 415539cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 415643439139SRichard Henderson ts = arg_temp(arg); 415740ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 4158b722452aSRichard Henderson s->reserved_regs, 0); 4159e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 416039cf05d3Sbellard } 416139cf05d3Sbellard stack_offset += 
sizeof(tcg_target_long); 4162c896fe29Sbellard } 4163c896fe29Sbellard 4164c896fe29Sbellard /* assign input registers */ 4165d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 4166c896fe29Sbellard for (i = 0; i < nb_regs; i++) { 4167dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 416839cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 416943439139SRichard Henderson ts = arg_temp(arg); 4170c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 417140ae5c62SRichard Henderson 4172c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 4173c896fe29Sbellard if (ts->reg != reg) { 41744250da10SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 417578113e83SRichard Henderson if (!tcg_out_mov(s, ts->type, reg, ts->reg)) { 4176240c08d0SRichard Henderson /* 4177240c08d0SRichard Henderson * Cross register class move not supported. Sync the 4178240c08d0SRichard Henderson * temp back to its slot and load from there. 4179240c08d0SRichard Henderson */ 4180240c08d0SRichard Henderson temp_sync(s, ts, allocated_regs, 0, 0); 4181240c08d0SRichard Henderson tcg_out_ld(s, ts->type, reg, 4182240c08d0SRichard Henderson ts->mem_base->reg, ts->mem_offset); 418378113e83SRichard Henderson } 4184c896fe29Sbellard } 4185c896fe29Sbellard } else { 4186ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 418740ae5c62SRichard Henderson 41884250da10SRichard Henderson tcg_reg_free(s, reg, allocated_regs); 418940ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 4190b722452aSRichard Henderson temp_load(s, ts, arg_set, allocated_regs, 0); 4191c896fe29Sbellard } 419240ae5c62SRichard Henderson 4193c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 4194c896fe29Sbellard } 419539cf05d3Sbellard } 4196c896fe29Sbellard 4197c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 4198866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 4199866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 420043439139SRichard Henderson temp_dead(s, 
arg_temp(op->args[i])); 4201c896fe29Sbellard } 4202c896fe29Sbellard } 4203c896fe29Sbellard 4204c896fe29Sbellard /* clobber call registers */ 4205c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 4206c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 4207b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 4208c896fe29Sbellard } 4209c896fe29Sbellard } 4210c896fe29Sbellard 421178505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 421278505279SAurelien Jarno they might be read. */ 421378505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 421478505279SAurelien Jarno /* Nothing to do */ 421578505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 421678505279SAurelien Jarno sync_globals(s, allocated_regs); 421778505279SAurelien Jarno } else { 4218e8996ee0Sbellard save_globals(s, allocated_regs); 4219b9c18f56Saurel32 } 4220c896fe29Sbellard 42217b7d8b2dSRichard Henderson #ifdef CONFIG_TCG_INTERPRETER 42227b7d8b2dSRichard Henderson { 42237b7d8b2dSRichard Henderson gpointer hash = (gpointer)(uintptr_t)info->typemask; 42247b7d8b2dSRichard Henderson ffi_cif *cif = g_hash_table_lookup(ffi_table, hash); 42257b7d8b2dSRichard Henderson assert(cif != NULL); 42267b7d8b2dSRichard Henderson tcg_out_call(s, func_addr, cif); 42277b7d8b2dSRichard Henderson } 42287b7d8b2dSRichard Henderson #else 4229cf066674SRichard Henderson tcg_out_call(s, func_addr); 42307b7d8b2dSRichard Henderson #endif 4231c896fe29Sbellard 4232c896fe29Sbellard /* assign output registers and emit moves if needed */ 4233c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 4234dd186292SRichard Henderson arg = op->args[i]; 423543439139SRichard Henderson ts = arg_temp(arg); 4236d63e3b6eSRichard Henderson 4237d63e3b6eSRichard Henderson /* ENV should not be modified. 
*/ 4238e01fa97dSRichard Henderson tcg_debug_assert(!temp_readonly(ts)); 4239d63e3b6eSRichard Henderson 4240c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 4241098859f1SRichard Henderson set_temp_val_reg(s, ts, reg); 4242c896fe29Sbellard ts->mem_coherent = 0; 4243ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 424498b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, IS_DEAD_ARG(i)); 424559d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 4246f8bf00f1SRichard Henderson temp_dead(s, ts); 4247c896fe29Sbellard } 4248c896fe29Sbellard } 42498c11ad25SAurelien Jarno } 4250c896fe29Sbellard 4251c896fe29Sbellard #ifdef CONFIG_PROFILER 4252c896fe29Sbellard 4253c3fac113SEmilio G. Cota /* avoid copy/paste errors */ 4254c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field) \ 4255c3fac113SEmilio G. Cota do { \ 4256d73415a3SStefan Hajnoczi (to)->field += qatomic_read(&((from)->field)); \ 4257c3fac113SEmilio G. Cota } while (0) 4258c896fe29Sbellard 4259c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field) \ 4260c3fac113SEmilio G. Cota do { \ 4261d73415a3SStefan Hajnoczi typeof((from)->field) val__ = qatomic_read(&((from)->field)); \ 4262c3fac113SEmilio G. Cota if (val__ > (to)->field) { \ 4263c3fac113SEmilio G. Cota (to)->field = val__; \ 4264c3fac113SEmilio G. Cota } \ 4265c3fac113SEmilio G. Cota } while (0) 4266c3fac113SEmilio G. Cota 4267c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */ 4268c3fac113SEmilio G. Cota static inline 4269c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table) 4270c896fe29Sbellard { 42710e2d61cfSRichard Henderson unsigned int n_ctxs = qatomic_read(&tcg_cur_ctxs); 4272c3fac113SEmilio G. Cota unsigned int i; 4273c3fac113SEmilio G. Cota 42743468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 4275d73415a3SStefan Hajnoczi TCGContext *s = qatomic_read(&tcg_ctxs[i]); 42763468b59eSEmilio G. Cota const TCGProfile *orig = &s->prof; 4277c3fac113SEmilio G. Cota 4278c3fac113SEmilio G. 
Cota if (counters) { 427972fd2efbSEmilio G. Cota PROF_ADD(prof, orig, cpu_exec_time); 4280c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count1); 4281c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count); 4282c3fac113SEmilio G. Cota PROF_ADD(prof, orig, op_count); 4283c3fac113SEmilio G. Cota PROF_MAX(prof, orig, op_count_max); 4284c3fac113SEmilio G. Cota PROF_ADD(prof, orig, temp_count); 4285c3fac113SEmilio G. Cota PROF_MAX(prof, orig, temp_count_max); 4286c3fac113SEmilio G. Cota PROF_ADD(prof, orig, del_op_count); 4287c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_in_len); 4288c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_out_len); 4289c3fac113SEmilio G. Cota PROF_ADD(prof, orig, search_out_len); 4290c3fac113SEmilio G. Cota PROF_ADD(prof, orig, interm_time); 4291c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_time); 4292c3fac113SEmilio G. Cota PROF_ADD(prof, orig, la_time); 4293c3fac113SEmilio G. Cota PROF_ADD(prof, orig, opt_time); 4294c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_count); 4295c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_time); 4296c3fac113SEmilio G. Cota } 4297c3fac113SEmilio G. Cota if (table) { 4298c896fe29Sbellard int i; 4299d70724ceSzhanghailiang 430015fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 4301c3fac113SEmilio G. Cota PROF_ADD(prof, orig, table_op_count[i]); 4302c3fac113SEmilio G. Cota } 4303c3fac113SEmilio G. Cota } 4304c3fac113SEmilio G. Cota } 4305c3fac113SEmilio G. Cota } 4306c3fac113SEmilio G. Cota 4307c3fac113SEmilio G. Cota #undef PROF_ADD 4308c3fac113SEmilio G. Cota #undef PROF_MAX 4309c3fac113SEmilio G. Cota 4310c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof) 4311c3fac113SEmilio G. Cota { 4312c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, true, false); 4313c3fac113SEmilio G. Cota } 4314c3fac113SEmilio G. Cota 4315c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof) 4316c3fac113SEmilio G. Cota { 4317c3fac113SEmilio G. 
Cota tcg_profile_snapshot(prof, false, true); 4318c3fac113SEmilio G. Cota } 4319c3fac113SEmilio G. Cota 4320b6a7f3e0SDaniel P. Berrangé void tcg_dump_op_count(GString *buf) 4321c3fac113SEmilio G. Cota { 4322c3fac113SEmilio G. Cota TCGProfile prof = {}; 4323c3fac113SEmilio G. Cota int i; 4324c3fac113SEmilio G. Cota 4325c3fac113SEmilio G. Cota tcg_profile_snapshot_table(&prof); 4326c3fac113SEmilio G. Cota for (i = 0; i < NB_OPS; i++) { 4327b6a7f3e0SDaniel P. Berrangé g_string_append_printf(buf, "%s %" PRId64 "\n", tcg_op_defs[i].name, 4328c3fac113SEmilio G. Cota prof.table_op_count[i]); 4329c896fe29Sbellard } 4330c896fe29Sbellard } 433172fd2efbSEmilio G. Cota 433272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 433372fd2efbSEmilio G. Cota { 43340e2d61cfSRichard Henderson unsigned int n_ctxs = qatomic_read(&tcg_cur_ctxs); 433572fd2efbSEmilio G. Cota unsigned int i; 433672fd2efbSEmilio G. Cota int64_t ret = 0; 433772fd2efbSEmilio G. Cota 433872fd2efbSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 4339d73415a3SStefan Hajnoczi const TCGContext *s = qatomic_read(&tcg_ctxs[i]); 434072fd2efbSEmilio G. Cota const TCGProfile *prof = &s->prof; 434172fd2efbSEmilio G. Cota 4342d73415a3SStefan Hajnoczi ret += qatomic_read(&prof->cpu_exec_time); 434372fd2efbSEmilio G. Cota } 434472fd2efbSEmilio G. Cota return ret; 434572fd2efbSEmilio G. Cota } 4346246ae24dSMax Filippov #else 4347b6a7f3e0SDaniel P. Berrangé void tcg_dump_op_count(GString *buf) 4348246ae24dSMax Filippov { 4349b6a7f3e0SDaniel P. Berrangé g_string_append_printf(buf, "[TCG profiler not compiled]\n"); 4350246ae24dSMax Filippov } 435172fd2efbSEmilio G. Cota 435272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 435372fd2efbSEmilio G. Cota { 435472fd2efbSEmilio G. Cota error_report("%s: TCG profiler not compiled", __func__); 435572fd2efbSEmilio G. Cota exit(EXIT_FAILURE); 435672fd2efbSEmilio G. 
Cota } 4357c896fe29Sbellard #endif 4358c896fe29Sbellard 4359c896fe29Sbellard 4360fbf59aadSRichard Henderson int tcg_gen_code(TCGContext *s, TranslationBlock *tb, target_ulong pc_start) 4361c896fe29Sbellard { 4362c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER 4363c3fac113SEmilio G. Cota TCGProfile *prof = &s->prof; 4364c3fac113SEmilio G. Cota #endif 436515fa08f8SRichard Henderson int i, num_insns; 436615fa08f8SRichard Henderson TCGOp *op; 4367c896fe29Sbellard 436804fe6400SRichard Henderson #ifdef CONFIG_PROFILER 436904fe6400SRichard Henderson { 4370c1f543b7SEmilio G. Cota int n = 0; 437104fe6400SRichard Henderson 437215fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 437315fa08f8SRichard Henderson n++; 437415fa08f8SRichard Henderson } 4375d73415a3SStefan Hajnoczi qatomic_set(&prof->op_count, prof->op_count + n); 4376c3fac113SEmilio G. Cota if (n > prof->op_count_max) { 4377d73415a3SStefan Hajnoczi qatomic_set(&prof->op_count_max, n); 437804fe6400SRichard Henderson } 437904fe6400SRichard Henderson 438004fe6400SRichard Henderson n = s->nb_temps; 4381d73415a3SStefan Hajnoczi qatomic_set(&prof->temp_count, prof->temp_count + n); 4382c3fac113SEmilio G. 
Cota if (n > prof->temp_count_max) { 4383d73415a3SStefan Hajnoczi qatomic_set(&prof->temp_count_max, n); 438404fe6400SRichard Henderson } 438504fe6400SRichard Henderson } 438604fe6400SRichard Henderson #endif 438704fe6400SRichard Henderson 4388c896fe29Sbellard #ifdef DEBUG_DISAS 4389d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 4390fbf59aadSRichard Henderson && qemu_log_in_addr_range(pc_start))) { 4391c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 439278b54858SRichard Henderson if (logfile) { 439378b54858SRichard Henderson fprintf(logfile, "OP:\n"); 4394b7a83ff8SRichard Henderson tcg_dump_ops(s, logfile, false); 439578b54858SRichard Henderson fprintf(logfile, "\n"); 4396fc59d2d8SRobert Foley qemu_log_unlock(logfile); 4397c896fe29Sbellard } 439878b54858SRichard Henderson } 4399c896fe29Sbellard #endif 4400c896fe29Sbellard 4401bef16ab4SRichard Henderson #ifdef CONFIG_DEBUG_TCG 4402bef16ab4SRichard Henderson /* Ensure all labels referenced have been emitted. 
*/ 4403bef16ab4SRichard Henderson { 4404bef16ab4SRichard Henderson TCGLabel *l; 4405bef16ab4SRichard Henderson bool error = false; 4406bef16ab4SRichard Henderson 4407bef16ab4SRichard Henderson QSIMPLEQ_FOREACH(l, &s->labels, next) { 4408bef16ab4SRichard Henderson if (unlikely(!l->present) && l->refs) { 4409bef16ab4SRichard Henderson qemu_log_mask(CPU_LOG_TB_OP, 4410bef16ab4SRichard Henderson "$L%d referenced but not present.\n", l->id); 4411bef16ab4SRichard Henderson error = true; 4412bef16ab4SRichard Henderson } 4413bef16ab4SRichard Henderson } 4414bef16ab4SRichard Henderson assert(!error); 4415bef16ab4SRichard Henderson } 4416bef16ab4SRichard Henderson #endif 4417bef16ab4SRichard Henderson 4418c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 4419d73415a3SStefan Hajnoczi qatomic_set(&prof->opt_time, prof->opt_time - profile_getclock()); 4420c5cc28ffSAurelien Jarno #endif 4421c5cc28ffSAurelien Jarno 44228f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 4423c45cb8bbSRichard Henderson tcg_optimize(s); 44248f2e8c07SKirill Batuzov #endif 44258f2e8c07SKirill Batuzov 4426a23a9ec6Sbellard #ifdef CONFIG_PROFILER 4427d73415a3SStefan Hajnoczi qatomic_set(&prof->opt_time, prof->opt_time + profile_getclock()); 4428d73415a3SStefan Hajnoczi qatomic_set(&prof->la_time, prof->la_time - profile_getclock()); 4429a23a9ec6Sbellard #endif 4430c5cc28ffSAurelien Jarno 4431b4fc67c7SRichard Henderson reachable_code_pass(s); 4432b83eabeaSRichard Henderson liveness_pass_1(s); 44335a18407fSRichard Henderson 44345a18407fSRichard Henderson if (s->nb_indirects > 0) { 44355a18407fSRichard Henderson #ifdef DEBUG_DISAS 44365a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 4437fbf59aadSRichard Henderson && qemu_log_in_addr_range(pc_start))) { 4438c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 443978b54858SRichard Henderson if (logfile) { 444078b54858SRichard Henderson fprintf(logfile, "OP before indirect lowering:\n"); 4441b7a83ff8SRichard Henderson 
tcg_dump_ops(s, logfile, false); 444278b54858SRichard Henderson fprintf(logfile, "\n"); 4443fc59d2d8SRobert Foley qemu_log_unlock(logfile); 44445a18407fSRichard Henderson } 444578b54858SRichard Henderson } 44465a18407fSRichard Henderson #endif 44475a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 4448b83eabeaSRichard Henderson if (liveness_pass_2(s)) { 44495a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 4450b83eabeaSRichard Henderson liveness_pass_1(s); 44515a18407fSRichard Henderson } 44525a18407fSRichard Henderson } 4453c5cc28ffSAurelien Jarno 4454a23a9ec6Sbellard #ifdef CONFIG_PROFILER 4455d73415a3SStefan Hajnoczi qatomic_set(&prof->la_time, prof->la_time + profile_getclock()); 4456a23a9ec6Sbellard #endif 4457c896fe29Sbellard 4458c896fe29Sbellard #ifdef DEBUG_DISAS 4459d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 4460fbf59aadSRichard Henderson && qemu_log_in_addr_range(pc_start))) { 4461c60f599bSRichard Henderson FILE *logfile = qemu_log_trylock(); 446278b54858SRichard Henderson if (logfile) { 446378b54858SRichard Henderson fprintf(logfile, "OP after optimization and liveness analysis:\n"); 4464b7a83ff8SRichard Henderson tcg_dump_ops(s, logfile, true); 446578b54858SRichard Henderson fprintf(logfile, "\n"); 4466fc59d2d8SRobert Foley qemu_log_unlock(logfile); 4467c896fe29Sbellard } 446878b54858SRichard Henderson } 4469c896fe29Sbellard #endif 4470c896fe29Sbellard 447135abb009SRichard Henderson /* Initialize goto_tb jump offsets. 
*/ 447235abb009SRichard Henderson tb->jmp_reset_offset[0] = TB_JMP_RESET_OFFSET_INVALID; 447335abb009SRichard Henderson tb->jmp_reset_offset[1] = TB_JMP_RESET_OFFSET_INVALID; 447435abb009SRichard Henderson tcg_ctx->tb_jmp_reset_offset = tb->jmp_reset_offset; 447535abb009SRichard Henderson if (TCG_TARGET_HAS_direct_jump) { 447635abb009SRichard Henderson tcg_ctx->tb_jmp_insn_offset = tb->jmp_target_arg; 447735abb009SRichard Henderson tcg_ctx->tb_jmp_target_addr = NULL; 447835abb009SRichard Henderson } else { 447935abb009SRichard Henderson tcg_ctx->tb_jmp_insn_offset = NULL; 448035abb009SRichard Henderson tcg_ctx->tb_jmp_target_addr = tb->jmp_target_arg; 448135abb009SRichard Henderson } 448235abb009SRichard Henderson 4483c896fe29Sbellard tcg_reg_alloc_start(s); 4484c896fe29Sbellard 4485db0c51a3SRichard Henderson /* 4486db0c51a3SRichard Henderson * Reset the buffer pointers when restarting after overflow. 4487db0c51a3SRichard Henderson * TODO: Move this into translate-all.c with the rest of the 4488db0c51a3SRichard Henderson * buffer management. Having only this done here is confusing. 
4489db0c51a3SRichard Henderson */ 4490db0c51a3SRichard Henderson s->code_buf = tcg_splitwx_to_rw(tb->tc.ptr); 4491db0c51a3SRichard Henderson s->code_ptr = s->code_buf; 4492c896fe29Sbellard 4493659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 44946001f772SLaurent Vivier QSIMPLEQ_INIT(&s->ldst_labels); 4495659ef5cbSRichard Henderson #endif 449657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 449757a26946SRichard Henderson s->pool_labels = NULL; 449857a26946SRichard Henderson #endif 44999ecefc84SRichard Henderson 4500fca8a500SRichard Henderson num_insns = -1; 450115fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 4502c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 4503b3db8758Sblueswir1 4504c896fe29Sbellard #ifdef CONFIG_PROFILER 4505d73415a3SStefan Hajnoczi qatomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1); 4506c896fe29Sbellard #endif 4507c45cb8bbSRichard Henderson 4508c896fe29Sbellard switch (opc) { 4509c896fe29Sbellard case INDEX_op_mov_i32: 4510c896fe29Sbellard case INDEX_op_mov_i64: 4511d2fd745fSRichard Henderson case INDEX_op_mov_vec: 4512dd186292SRichard Henderson tcg_reg_alloc_mov(s, op); 4513c896fe29Sbellard break; 4514bab1671fSRichard Henderson case INDEX_op_dup_vec: 4515bab1671fSRichard Henderson tcg_reg_alloc_dup(s, op); 4516bab1671fSRichard Henderson break; 4517765b842aSRichard Henderson case INDEX_op_insn_start: 4518fca8a500SRichard Henderson if (num_insns >= 0) { 45199f754620SRichard Henderson size_t off = tcg_current_code_size(s); 45209f754620SRichard Henderson s->gen_insn_end_off[num_insns] = off; 45219f754620SRichard Henderson /* Assert that we do not overflow our stored offset. 
*/ 45229f754620SRichard Henderson assert(s->gen_insn_end_off[num_insns] == off); 4523fca8a500SRichard Henderson } 4524fca8a500SRichard Henderson num_insns++; 4525bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 4526bad729e2SRichard Henderson target_ulong a; 4527bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 4528efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 4529bad729e2SRichard Henderson #else 4530efee3746SRichard Henderson a = op->args[i]; 4531bad729e2SRichard Henderson #endif 4532fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 4533bad729e2SRichard Henderson } 4534c896fe29Sbellard break; 45355ff9d6a4Sbellard case INDEX_op_discard: 453643439139SRichard Henderson temp_dead(s, arg_temp(op->args[0])); 45375ff9d6a4Sbellard break; 4538c896fe29Sbellard case INDEX_op_set_label: 4539e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 454092ab8e7dSRichard Henderson tcg_out_label(s, arg_label(op->args[0])); 4541c896fe29Sbellard break; 4542c896fe29Sbellard case INDEX_op_call: 4543dd186292SRichard Henderson tcg_reg_alloc_call(s, op); 4544c45cb8bbSRichard Henderson break; 4545efe86b21SRichard Henderson case INDEX_op_dup2_vec: 4546efe86b21SRichard Henderson if (tcg_reg_alloc_dup2(s, op)) { 4547efe86b21SRichard Henderson break; 4548efe86b21SRichard Henderson } 4549efe86b21SRichard Henderson /* fall through */ 4550c896fe29Sbellard default: 455125c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. 
*/ 4552be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 4553c896fe29Sbellard /* Note: in order to speed up the code, it would be much 4554c896fe29Sbellard faster to have specialized register allocator functions for 4555c896fe29Sbellard some common argument patterns */ 4556dd186292SRichard Henderson tcg_reg_alloc_op(s, op); 4557c896fe29Sbellard break; 4558c896fe29Sbellard } 4559b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. The assumption is that any 4560b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 4561b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 4562b125f9dcSRichard Henderson generating code without having to check during generation. */ 4563644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 4564b125f9dcSRichard Henderson return -1; 4565b125f9dcSRichard Henderson } 45666e6c4efeSRichard Henderson /* Test for TB overflow, as seen by gen_insn_end_off. 
*/ 45676e6c4efeSRichard Henderson if (unlikely(tcg_current_code_size(s) > UINT16_MAX)) { 45686e6c4efeSRichard Henderson return -2; 45696e6c4efeSRichard Henderson } 4570c896fe29Sbellard } 4571fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 4572fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 4573c45cb8bbSRichard Henderson 4574b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 4575659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 4576aeee05f5SRichard Henderson i = tcg_out_ldst_finalize(s); 4577aeee05f5SRichard Henderson if (i < 0) { 4578aeee05f5SRichard Henderson return i; 457923dceda6SRichard Henderson } 4580659ef5cbSRichard Henderson #endif 458157a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 45821768987bSRichard Henderson i = tcg_out_pool_finalize(s); 45831768987bSRichard Henderson if (i < 0) { 45841768987bSRichard Henderson return i; 458557a26946SRichard Henderson } 458657a26946SRichard Henderson #endif 45877ecd02a0SRichard Henderson if (!tcg_resolve_relocs(s)) { 45887ecd02a0SRichard Henderson return -2; 45897ecd02a0SRichard Henderson } 4590c896fe29Sbellard 4591df5d2b16SRichard Henderson #ifndef CONFIG_TCG_INTERPRETER 4592c896fe29Sbellard /* flush instruction cache */ 4593db0c51a3SRichard Henderson flush_idcache_range((uintptr_t)tcg_splitwx_to_rx(s->code_buf), 4594db0c51a3SRichard Henderson (uintptr_t)s->code_buf, 45951da8de39SRichard Henderson tcg_ptr_byte_diff(s->code_ptr, s->code_buf)); 4596df5d2b16SRichard Henderson #endif 45972aeabc08SStefan Weil 45981813e175SRichard Henderson return tcg_current_code_size(s); 4599c896fe29Sbellard } 4600c896fe29Sbellard 4601a23a9ec6Sbellard #ifdef CONFIG_PROFILER 46023a841ab5SDaniel P. Berrangé void tcg_dump_info(GString *buf) 4603a23a9ec6Sbellard { 4604c3fac113SEmilio G. Cota TCGProfile prof = {}; 4605c3fac113SEmilio G. Cota const TCGProfile *s; 4606c3fac113SEmilio G. Cota int64_t tb_count; 4607c3fac113SEmilio G. 
Cota int64_t tb_div_count; 4608c3fac113SEmilio G. Cota int64_t tot; 4609c3fac113SEmilio G. Cota 4610c3fac113SEmilio G. Cota tcg_profile_snapshot_counters(&prof); 4611c3fac113SEmilio G. Cota s = &prof; 4612c3fac113SEmilio G. Cota tb_count = s->tb_count; 4613c3fac113SEmilio G. Cota tb_div_count = tb_count ? tb_count : 1; 4614c3fac113SEmilio G. Cota tot = s->interm_time + s->code_time; 4615a23a9ec6Sbellard 46163a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "JIT cycles %" PRId64 46173a841ab5SDaniel P. Berrangé " (%0.3f s at 2.4 GHz)\n", 4618a23a9ec6Sbellard tot, tot / 2.4e9); 46193a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "translated TBs %" PRId64 46203a841ab5SDaniel P. Berrangé " (aborted=%" PRId64 " %0.1f%%)\n", 4621fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 4622fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 4623fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 46243a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg ops/TB %0.1f max=%d\n", 4625fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 46263a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "deleted ops/TB %0.2f\n", 4627fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 46283a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg temps/TB %0.2f max=%d\n", 46293a841ab5SDaniel P. Berrangé (double)s->temp_count / tb_div_count, 46303a841ab5SDaniel P. Berrangé s->temp_count_max); 46313a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg host code/TB %0.1f\n", 4632fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 46333a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "avg search data/TB %0.1f\n", 4634fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 4635a23a9ec6Sbellard 46363a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/op %0.1f\n", 4637a23a9ec6Sbellard s->op_count ? 
(double)tot / s->op_count : 0); 46383a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/in byte %0.1f\n", 4639a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 46403a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/out byte %0.1f\n", 4641a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 46423a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cycles/search byte %0.1f\n", 46433a841ab5SDaniel P. Berrangé s->search_out_len ? 46443a841ab5SDaniel P. Berrangé (double)tot / s->search_out_len : 0); 4645fca8a500SRichard Henderson if (tot == 0) { 4646a23a9ec6Sbellard tot = 1; 4647fca8a500SRichard Henderson } 46483a841ab5SDaniel P. Berrangé g_string_append_printf(buf, " gen_interm time %0.1f%%\n", 4649a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 46503a841ab5SDaniel P. Berrangé g_string_append_printf(buf, " gen_code time %0.1f%%\n", 4651a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 46523a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "optim./code time %0.1f%%\n", 46533a841ab5SDaniel P. Berrangé (double)s->opt_time / (s->code_time ? 46543a841ab5SDaniel P. Berrangé s->code_time : 1) 4655c5cc28ffSAurelien Jarno * 100.0); 46563a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "liveness/code time %0.1f%%\n", 46573a841ab5SDaniel P. Berrangé (double)s->la_time / (s->code_time ? 46583a841ab5SDaniel P. Berrangé s->code_time : 1) * 100.0); 46593a841ab5SDaniel P. Berrangé g_string_append_printf(buf, "cpu_restore count %" PRId64 "\n", 4660a23a9ec6Sbellard s->restore_count); 46613a841ab5SDaniel P. Berrangé g_string_append_printf(buf, " avg cycles %0.1f\n", 46623a841ab5SDaniel P. Berrangé s->restore_count ? 46633a841ab5SDaniel P. Berrangé (double)s->restore_time / s->restore_count : 0); 4664a23a9ec6Sbellard } 4665a23a9ec6Sbellard #else 46663a841ab5SDaniel P. Berrangé void tcg_dump_info(GString *buf) 4667a23a9ec6Sbellard { 46683a841ab5SDaniel P. 
Berrangé g_string_append_printf(buf, "[TCG profiler not compiled]\n"); 4669a23a9ec6Sbellard } 4670a23a9ec6Sbellard #endif 4671813da627SRichard Henderson 4672813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 46735872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 46745872bbf2SRichard Henderson 46755872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 46765872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 46775872bbf2SRichard Henderson 46785872bbf2SRichard Henderson (2) Define tcg_register_jit. This should create a buffer containing 46795872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 46805872bbf2SRichard Henderson prologue unwind info for the tcg machine. 46815872bbf2SRichard Henderson 46825872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 46835872bbf2SRichard Henderson */ 4684813da627SRichard Henderson 4685813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. 
*/
/* Values stored in jit_descriptor.action_flag. */
typedef enum {
    JIT_NOACTION = 0,
    JIT_REGISTER_FN,
    JIT_UNREGISTER_FN
} jit_actions_t;

/* One registered symbol file: a list node pointing at an in-memory image. */
struct jit_code_entry {
    struct jit_code_entry *next_entry;
    struct jit_code_entry *prev_entry;
    const void *symfile_addr;   /* start of the in-memory symbol file */
    uint64_t symfile_size;      /* its size in bytes */
};

/* Descriptor through which entries are published to the debugger. */
struct jit_descriptor {
    uint32_t version;
    uint32_t action_flag;                   /* a jit_actions_t value */
    struct jit_code_entry *relevant_entry;  /* entry the action refers to */
    struct jit_code_entry *first_entry;     /* head of the entry list */
};

/*
 * Deliberately empty, out-of-line function, called after the descriptor
 * has been updated.  NOTE(review): presumably the debugger hooks this
 * symbol to notice registrations -- confirm against the GDB JIT docs.
 * The empty asm keeps the body from being treated as a no-op.
 */
void __jit_debug_register_code(void) __attribute__((noinline));
void __jit_debug_register_code(void)
{
    asm("");
}

/* Must statically initialize the version, because GDB may check
   the version before we can set it.  */
struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 };

/* End GDB interface.
*/ 4717813da627SRichard Henderson 4718813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 4719813da627SRichard Henderson { 4720813da627SRichard Henderson const char *p = strtab + 1; 4721813da627SRichard Henderson 4722813da627SRichard Henderson while (1) { 4723813da627SRichard Henderson if (strcmp(p, str) == 0) { 4724813da627SRichard Henderson return p - strtab; 4725813da627SRichard Henderson } 4726813da627SRichard Henderson p += strlen(p) + 1; 4727813da627SRichard Henderson } 4728813da627SRichard Henderson } 4729813da627SRichard Henderson 4730755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf_ptr, size_t buf_size, 47312c90784aSRichard Henderson const void *debug_frame, 47322c90784aSRichard Henderson size_t debug_frame_size) 4733813da627SRichard Henderson { 47345872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 47355872bbf2SRichard Henderson uint32_t len; 47365872bbf2SRichard Henderson uint16_t version; 47375872bbf2SRichard Henderson uint32_t abbrev; 47385872bbf2SRichard Henderson uint8_t ptr_size; 47395872bbf2SRichard Henderson uint8_t cu_die; 47405872bbf2SRichard Henderson uint16_t cu_lang; 47415872bbf2SRichard Henderson uintptr_t cu_low_pc; 47425872bbf2SRichard Henderson uintptr_t cu_high_pc; 47435872bbf2SRichard Henderson uint8_t fn_die; 47445872bbf2SRichard Henderson char fn_name[16]; 47455872bbf2SRichard Henderson uintptr_t fn_low_pc; 47465872bbf2SRichard Henderson uintptr_t fn_high_pc; 47475872bbf2SRichard Henderson uint8_t cu_eoc; 47485872bbf2SRichard Henderson }; 4749813da627SRichard Henderson 4750813da627SRichard Henderson struct ElfImage { 4751813da627SRichard Henderson ElfW(Ehdr) ehdr; 4752813da627SRichard Henderson ElfW(Phdr) phdr; 47535872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 47545872bbf2SRichard Henderson ElfW(Sym) sym[2]; 47555872bbf2SRichard Henderson struct DebugInfo di; 47565872bbf2SRichard Henderson uint8_t da[24]; 47575872bbf2SRichard Henderson char str[80]; 
47585872bbf2SRichard Henderson }; 47595872bbf2SRichard Henderson 47605872bbf2SRichard Henderson struct ElfImage *img; 47615872bbf2SRichard Henderson 47625872bbf2SRichard Henderson static const struct ElfImage img_template = { 47635872bbf2SRichard Henderson .ehdr = { 47645872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 47655872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 47665872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 47675872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 47685872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 47695872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 47705872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 47715872bbf2SRichard Henderson .e_type = ET_EXEC, 47725872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 47735872bbf2SRichard Henderson .e_version = EV_CURRENT, 47745872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 47755872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 47765872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 47775872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 47785872bbf2SRichard Henderson .e_phnum = 1, 47795872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 47805872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 47815872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 4782abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 4783abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 4784abbb3eaeSRichard Henderson #endif 4785abbb3eaeSRichard Henderson #ifdef ELF_OSABI 4786abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 4787abbb3eaeSRichard Henderson #endif 47885872bbf2SRichard Henderson }, 47895872bbf2SRichard Henderson .phdr = { 47905872bbf2SRichard Henderson .p_type = PT_LOAD, 47915872bbf2SRichard Henderson .p_flags = PF_X, 47925872bbf2SRichard Henderson }, 47935872bbf2SRichard Henderson .shdr = { 47945872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 
47955872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 47965872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 47975872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 47985872bbf2SRichard Henderson will not look for contents. We can record any address. */ 47995872bbf2SRichard Henderson [1] = { /* .text */ 48005872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 48015872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 48025872bbf2SRichard Henderson }, 48035872bbf2SRichard Henderson [2] = { /* .debug_info */ 48045872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 48055872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 48065872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 48075872bbf2SRichard Henderson }, 48085872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 48095872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 48105872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 48115872bbf2SRichard Henderson .sh_size = sizeof(img->da), 48125872bbf2SRichard Henderson }, 48135872bbf2SRichard Henderson [4] = { /* .debug_frame */ 48145872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 48155872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 48165872bbf2SRichard Henderson }, 48175872bbf2SRichard Henderson [5] = { /* .symtab */ 48185872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 48195872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 48205872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 48215872bbf2SRichard Henderson .sh_info = 1, 48225872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 48235872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 48245872bbf2SRichard Henderson }, 48255872bbf2SRichard Henderson [6] = { /* .strtab */ 48265872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 48275872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, 
str), 48285872bbf2SRichard Henderson .sh_size = sizeof(img->str), 48295872bbf2SRichard Henderson } 48305872bbf2SRichard Henderson }, 48315872bbf2SRichard Henderson .sym = { 48325872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 48335872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 48345872bbf2SRichard Henderson .st_shndx = 1, 48355872bbf2SRichard Henderson } 48365872bbf2SRichard Henderson }, 48375872bbf2SRichard Henderson .di = { 48385872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 48395872bbf2SRichard Henderson .version = 2, 48405872bbf2SRichard Henderson .ptr_size = sizeof(void *), 48415872bbf2SRichard Henderson .cu_die = 1, 48425872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 48435872bbf2SRichard Henderson .fn_die = 2, 48445872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 48455872bbf2SRichard Henderson }, 48465872bbf2SRichard Henderson .da = { 48475872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 48485872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 48495872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 48505872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 48515872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 48525872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 48535872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 48545872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 48555872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 48565872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 48575872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 48585872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 48595872bbf2SRichard Henderson 0 /* no more abbrev */ 48605872bbf2SRichard Henderson }, 48615872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 48625872bbf2SRichard Henderson 
".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 4863813da627SRichard Henderson }; 4864813da627SRichard Henderson 4865813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 4866813da627SRichard Henderson static struct jit_code_entry one_entry; 4867813da627SRichard Henderson 48685872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 4869813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 48702c90784aSRichard Henderson DebugFrameHeader *dfh; 4871813da627SRichard Henderson 48725872bbf2SRichard Henderson img = g_malloc(img_size); 48735872bbf2SRichard Henderson *img = img_template; 4874813da627SRichard Henderson 48755872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 48765872bbf2SRichard Henderson img->phdr.p_paddr = buf; 48775872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 4878813da627SRichard Henderson 48795872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 48805872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 48815872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 4882813da627SRichard Henderson 48835872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 48845872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 48855872bbf2SRichard Henderson 48865872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 48875872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 48885872bbf2SRichard Henderson 48895872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 48905872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 48915872bbf2SRichard Henderson 48925872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 48935872bbf2SRichard Henderson img->sym[1].st_value = buf; 48945872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 
48955872bbf2SRichard Henderson 48965872bbf2SRichard Henderson img->di.cu_low_pc = buf; 489745aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 48985872bbf2SRichard Henderson img->di.fn_low_pc = buf; 489945aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 4900813da627SRichard Henderson 49012c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 49022c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 49032c90784aSRichard Henderson dfh->fde.func_start = buf; 49042c90784aSRichard Henderson dfh->fde.func_len = buf_size; 49052c90784aSRichard Henderson 4906813da627SRichard Henderson #ifdef DEBUG_JIT 4907813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 4908813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 4909813da627SRichard Henderson { 4910eb6b2edfSBin Meng g_autofree char *jit = g_strdup_printf("%s/qemu.jit", g_get_tmp_dir()); 4911eb6b2edfSBin Meng FILE *f = fopen(jit, "w+b"); 4912813da627SRichard Henderson if (f) { 49135872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 4914813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. 
*/ 4915813da627SRichard Henderson } 4916813da627SRichard Henderson fclose(f); 4917813da627SRichard Henderson } 4918813da627SRichard Henderson } 4919813da627SRichard Henderson #endif 4920813da627SRichard Henderson 4921813da627SRichard Henderson one_entry.symfile_addr = img; 4922813da627SRichard Henderson one_entry.symfile_size = img_size; 4923813da627SRichard Henderson 4924813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 4925813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 4926813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 4927813da627SRichard Henderson __jit_debug_register_code(); 4928813da627SRichard Henderson } 4929813da627SRichard Henderson #else 49305872bbf2SRichard Henderson /* No support for the feature. Provide the entry point expected by exec.c, 49315872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 4932813da627SRichard Henderson 4933755bf9e5SRichard Henderson static void tcg_register_jit_int(const void *buf, size_t size, 49342c90784aSRichard Henderson const void *debug_frame, 49352c90784aSRichard Henderson size_t debug_frame_size) 4936813da627SRichard Henderson { 4937813da627SRichard Henderson } 4938813da627SRichard Henderson 4939755bf9e5SRichard Henderson void tcg_register_jit(const void *buf, size_t buf_size) 4940813da627SRichard Henderson { 4941813da627SRichard Henderson } 4942813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 4943db432672SRichard Henderson 4944db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec 4945db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...) 4946db432672SRichard Henderson { 4947db432672SRichard Henderson g_assert_not_reached(); 4948db432672SRichard Henderson } 4949db432672SRichard Henderson #endif 4950