1c896fe29Sbellard /* 2c896fe29Sbellard * Tiny Code Generator for QEMU 3c896fe29Sbellard * 4c896fe29Sbellard * Copyright (c) 2008 Fabrice Bellard 5c896fe29Sbellard * 6c896fe29Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7c896fe29Sbellard * of this software and associated documentation files (the "Software"), to deal 8c896fe29Sbellard * in the Software without restriction, including without limitation the rights 9c896fe29Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10c896fe29Sbellard * copies of the Software, and to permit persons to whom the Software is 11c896fe29Sbellard * furnished to do so, subject to the following conditions: 12c896fe29Sbellard * 13c896fe29Sbellard * The above copyright notice and this permission notice shall be included in 14c896fe29Sbellard * all copies or substantial portions of the Software. 15c896fe29Sbellard * 16c896fe29Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17c896fe29Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18c896fe29Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19c896fe29Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20c896fe29Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21c896fe29Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22c896fe29Sbellard * THE SOFTWARE. 23c896fe29Sbellard */ 24c896fe29Sbellard 25c896fe29Sbellard /* define it to use liveness analysis (better code) */ 268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS 27c896fe29Sbellard 28757e725bSPeter Maydell #include "qemu/osdep.h" 29cca82982Saurel32 30813da627SRichard Henderson /* Define to jump the ELF file used to communicate with GDB. */ 31813da627SRichard Henderson #undef DEBUG_JIT 32813da627SRichard Henderson 33f348b6d1SVeronia Bahaa #include "qemu/cutils.h" 341de7afc9SPaolo Bonzini #include "qemu/host-utils.h" 351de7afc9SPaolo Bonzini #include "qemu/timer.h" 36c896fe29Sbellard 37c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU 38c896fe29Sbellard CPU definitions. Currently they are used for qemu_ld/st 39c896fe29Sbellard instructions */ 40c896fe29Sbellard #define NO_CPU_IO_DEFS 41c896fe29Sbellard #include "cpu.h" 42c896fe29Sbellard 4363c91552SPaolo Bonzini #include "exec/cpu-common.h" 4463c91552SPaolo Bonzini #include "exec/exec-all.h" 4563c91552SPaolo Bonzini 46c896fe29Sbellard #include "tcg-op.h" 47813da627SRichard Henderson 48edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX 49813da627SRichard Henderson # define ELF_CLASS ELFCLASS32 50edee2579SRichard Henderson #else 51edee2579SRichard Henderson # define ELF_CLASS ELFCLASS64 52813da627SRichard Henderson #endif 53813da627SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 54813da627SRichard Henderson # define ELF_DATA ELFDATA2MSB 55813da627SRichard Henderson #else 56813da627SRichard Henderson # define ELF_DATA ELFDATA2LSB 57813da627SRichard Henderson #endif 58813da627SRichard Henderson 59c896fe29Sbellard #include "elf.h" 60508127e2SPaolo Bonzini #include "exec/log.h" 61c896fe29Sbellard 62ce151109SPeter Maydell /* Forward declarations for functions declared in tcg-target.inc.c and 63ce151109SPeter Maydell used here. */ 64e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s); 65f69d277eSRichard Henderson static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode); 66e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s); 671813e175SRichard Henderson static void patch_reloc(tcg_insn_unit *code_ptr, int type, 682ba7fae2SRichard Henderson intptr_t value, intptr_t addend); 69c896fe29Sbellard 70497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts. */ 71497a22ebSRichard Henderson typedef struct { 72497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 73497a22ebSRichard Henderson uint32_t id; 74497a22ebSRichard Henderson uint8_t version; 75497a22ebSRichard Henderson char augmentation[1]; 76497a22ebSRichard Henderson uint8_t code_align; 77497a22ebSRichard Henderson uint8_t data_align; 78497a22ebSRichard Henderson uint8_t return_column; 79497a22ebSRichard Henderson } DebugFrameCIE; 80497a22ebSRichard Henderson 81497a22ebSRichard Henderson typedef struct QEMU_PACKED { 82497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 83497a22ebSRichard Henderson uint32_t cie_offset; 84edee2579SRichard Henderson uintptr_t func_start; 85edee2579SRichard Henderson uintptr_t func_len; 86497a22ebSRichard Henderson } DebugFrameFDEHeader; 87497a22ebSRichard Henderson 882c90784aSRichard Henderson typedef struct QEMU_PACKED { 892c90784aSRichard Henderson DebugFrameCIE cie; 902c90784aSRichard Henderson DebugFrameFDEHeader fde; 912c90784aSRichard Henderson } DebugFrameHeader; 922c90784aSRichard Henderson 93813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 942c90784aSRichard Henderson const void *debug_frame, 952c90784aSRichard Henderson size_t debug_frame_size) 96813da627SRichard Henderson __attribute__((unused)); 97813da627SRichard Henderson 98ce151109SPeter Maydell /* Forward declarations for functions declared and used in tcg-target.inc.c. */ 99069ea736SRichard Henderson static const char *target_parse_constraint(TCGArgConstraint *ct, 100069ea736SRichard Henderson const char *ct_str, TCGType type); 1012a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1, 102a05b5b9bSRichard Henderson intptr_t arg2); 1032a534affSRichard Henderson static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg); 104c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type, 1052a534affSRichard Henderson TCGReg ret, tcg_target_long arg); 106c0ad3001SStefan Weil static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args, 107c0ad3001SStefan Weil const int *const_args); 1082a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, 109a05b5b9bSRichard Henderson intptr_t arg2); 11059d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val, 11159d7c14eSRichard Henderson TCGReg base, intptr_t ofs); 112cf066674SRichard Henderson static void tcg_out_call(TCGContext *s, tcg_insn_unit *target); 113f6c6afc1SRichard Henderson static int tcg_target_const_match(tcg_target_long val, TCGType type, 114c0ad3001SStefan Weil const TCGArgConstraint *arg_ct); 115659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 116659ef5cbSRichard Henderson static bool tcg_out_ldst_finalize(TCGContext *s); 117659ef5cbSRichard Henderson #endif 118c896fe29Sbellard 119b1d8e52eSblueswir1 static TCGRegSet tcg_target_available_regs[2]; 120b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 121c896fe29Sbellard 1221813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1234196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 124c896fe29Sbellard { 125c896fe29Sbellard *s->code_ptr++ = v; 126c896fe29Sbellard } 127c896fe29Sbellard 1284196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1294196dca6SPeter Maydell uint8_t v) 1305c53bb81SPeter Maydell { 1311813e175SRichard Henderson *p = v; 1325c53bb81SPeter Maydell } 1331813e175SRichard Henderson #endif 1345c53bb81SPeter Maydell 1351813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1364196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 137c896fe29Sbellard { 1381813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1391813e175SRichard Henderson *s->code_ptr++ = v; 1401813e175SRichard Henderson } else { 1411813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1424387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1431813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 1441813e175SRichard Henderson } 145c896fe29Sbellard } 146c896fe29Sbellard 1474196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 1484196dca6SPeter Maydell uint16_t v) 1495c53bb81SPeter Maydell { 1501813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1511813e175SRichard Henderson *p = v; 1521813e175SRichard Henderson } else { 1535c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 1545c53bb81SPeter Maydell } 1551813e175SRichard Henderson } 1561813e175SRichard Henderson #endif 1575c53bb81SPeter Maydell 1581813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 1594196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 160c896fe29Sbellard { 1611813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 1621813e175SRichard Henderson *s->code_ptr++ = v; 1631813e175SRichard Henderson } else { 1641813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1654387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1661813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 1671813e175SRichard Henderson } 168c896fe29Sbellard } 169c896fe29Sbellard 1704196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 1714196dca6SPeter Maydell uint32_t v) 1725c53bb81SPeter Maydell { 1731813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 1741813e175SRichard Henderson *p = v; 1751813e175SRichard Henderson } else { 1765c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 1775c53bb81SPeter Maydell } 1781813e175SRichard Henderson } 1791813e175SRichard Henderson #endif 1805c53bb81SPeter Maydell 1811813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 1824196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 183ac26eb69SRichard Henderson { 1841813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 1851813e175SRichard Henderson *s->code_ptr++ = v; 1861813e175SRichard Henderson } else { 1871813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1884387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1891813e175SRichard Henderson s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE); 1901813e175SRichard Henderson } 191ac26eb69SRichard Henderson } 192ac26eb69SRichard Henderson 1934196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 1944196dca6SPeter Maydell uint64_t v) 1955c53bb81SPeter Maydell { 1961813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 1971813e175SRichard Henderson *p = v; 1981813e175SRichard Henderson } else { 1995c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2005c53bb81SPeter Maydell } 2011813e175SRichard Henderson } 2021813e175SRichard Henderson #endif 2035c53bb81SPeter Maydell 204c896fe29Sbellard /* label relocation processing */ 205c896fe29Sbellard 2061813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 207bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 208c896fe29Sbellard { 209c896fe29Sbellard TCGRelocation *r; 210c896fe29Sbellard 211c896fe29Sbellard if (l->has_value) { 212623e265cSpbrook /* FIXME: This may break relocations on RISC targets that 213623e265cSpbrook modify instruction fields in place. The caller may not have 214623e265cSpbrook written the initial value. */ 215f54b3f92Saurel32 patch_reloc(code_ptr, type, l->u.value, addend); 216c896fe29Sbellard } else { 217c896fe29Sbellard /* add a new relocation entry */ 218c896fe29Sbellard r = tcg_malloc(sizeof(TCGRelocation)); 219c896fe29Sbellard r->type = type; 220c896fe29Sbellard r->ptr = code_ptr; 221c896fe29Sbellard r->addend = addend; 222c896fe29Sbellard r->next = l->u.first_reloc; 223c896fe29Sbellard l->u.first_reloc = r; 224c896fe29Sbellard } 225c896fe29Sbellard } 226c896fe29Sbellard 227bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr) 228c896fe29Sbellard { 2292ba7fae2SRichard Henderson intptr_t value = (intptr_t)ptr; 2301813e175SRichard Henderson TCGRelocation *r; 231c896fe29Sbellard 232eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 2331813e175SRichard Henderson 2341813e175SRichard Henderson for (r = l->u.first_reloc; r != NULL; r = r->next) { 235f54b3f92Saurel32 patch_reloc(r->ptr, r->type, value, r->addend); 236c896fe29Sbellard } 2371813e175SRichard Henderson 238c896fe29Sbellard l->has_value = 1; 2391813e175SRichard Henderson l->u.value_ptr = ptr; 240c896fe29Sbellard } 241c896fe29Sbellard 24242a268c2SRichard Henderson TCGLabel *gen_new_label(void) 243c896fe29Sbellard { 244c896fe29Sbellard TCGContext *s = &tcg_ctx; 24551e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 246c896fe29Sbellard 24751e3972cSRichard Henderson *l = (TCGLabel){ 24851e3972cSRichard Henderson .id = s->nb_labels++ 24951e3972cSRichard Henderson }; 25042a268c2SRichard Henderson 25142a268c2SRichard Henderson return l; 252c896fe29Sbellard } 253c896fe29Sbellard 254ce151109SPeter Maydell #include "tcg-target.inc.c" 255c896fe29Sbellard 256c896fe29Sbellard /* pool based memory allocation */ 257c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 258c896fe29Sbellard { 259c896fe29Sbellard TCGPool *p; 260c896fe29Sbellard int pool_size; 261c896fe29Sbellard 262c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 263c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 2647267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 265c896fe29Sbellard p->size = size; 2664055299eSKirill Batuzov p->next = s->pool_first_large; 2674055299eSKirill Batuzov s->pool_first_large = p; 2684055299eSKirill Batuzov return p->data; 269c896fe29Sbellard } else { 270c896fe29Sbellard p = s->pool_current; 271c896fe29Sbellard if (!p) { 272c896fe29Sbellard p = s->pool_first; 273c896fe29Sbellard if (!p) 274c896fe29Sbellard goto new_pool; 275c896fe29Sbellard } else { 276c896fe29Sbellard if (!p->next) { 277c896fe29Sbellard new_pool: 278c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 2797267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 280c896fe29Sbellard p->size = pool_size; 281c896fe29Sbellard p->next = NULL; 282c896fe29Sbellard if (s->pool_current) 283c896fe29Sbellard s->pool_current->next = p; 284c896fe29Sbellard else 285c896fe29Sbellard s->pool_first = p; 286c896fe29Sbellard } else { 287c896fe29Sbellard p = p->next; 288c896fe29Sbellard } 289c896fe29Sbellard } 290c896fe29Sbellard } 291c896fe29Sbellard s->pool_current = p; 292c896fe29Sbellard s->pool_cur = p->data + size; 293c896fe29Sbellard s->pool_end = p->data + p->size; 294c896fe29Sbellard return p->data; 295c896fe29Sbellard } 296c896fe29Sbellard 297c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 298c896fe29Sbellard { 2994055299eSKirill Batuzov TCGPool *p, *t; 3004055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 3014055299eSKirill Batuzov t = p->next; 3024055299eSKirill Batuzov g_free(p); 3034055299eSKirill Batuzov } 3044055299eSKirill Batuzov s->pool_first_large = NULL; 305c896fe29Sbellard s->pool_cur = s->pool_end = NULL; 306c896fe29Sbellard s->pool_current = NULL; 307c896fe29Sbellard } 308c896fe29Sbellard 309100b5e01SRichard Henderson typedef struct TCGHelperInfo { 310100b5e01SRichard Henderson void *func; 311100b5e01SRichard Henderson const char *name; 312afb49896SRichard Henderson unsigned flags; 313afb49896SRichard Henderson unsigned sizemask; 314100b5e01SRichard Henderson } TCGHelperInfo; 315100b5e01SRichard Henderson 3162ef6175aSRichard Henderson #include "exec/helper-proto.h" 3172ef6175aSRichard Henderson 318100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 3192ef6175aSRichard Henderson #include "exec/helper-tcg.h" 320100b5e01SRichard Henderson }; 321100b5e01SRichard Henderson 32291478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 323f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 32491478cefSRichard Henderson 325c896fe29Sbellard void tcg_context_init(TCGContext *s) 326c896fe29Sbellard { 327100b5e01SRichard Henderson int op, total_args, n, i; 328c896fe29Sbellard TCGOpDef *def; 329c896fe29Sbellard TCGArgConstraint *args_ct; 330c896fe29Sbellard int *sorted_args; 33184fd9dd3SRichard Henderson GHashTable *helper_table; 332c896fe29Sbellard 333c896fe29Sbellard memset(s, 0, sizeof(*s)); 334c896fe29Sbellard s->nb_globals = 0; 335c896fe29Sbellard 336c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 337c896fe29Sbellard space */ 338c896fe29Sbellard total_args = 0; 339c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 340c896fe29Sbellard def = &tcg_op_defs[op]; 341c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 342c896fe29Sbellard total_args += n; 343c896fe29Sbellard } 344c896fe29Sbellard 3457267c094SAnthony Liguori args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args); 3467267c094SAnthony Liguori sorted_args = g_malloc(sizeof(int) * total_args); 347c896fe29Sbellard 348c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 349c896fe29Sbellard def = &tcg_op_defs[op]; 350c896fe29Sbellard def->args_ct = args_ct; 351c896fe29Sbellard def->sorted_args = sorted_args; 352c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 353c896fe29Sbellard sorted_args += n; 354c896fe29Sbellard args_ct += n; 355c896fe29Sbellard } 356c896fe29Sbellard 3575cd8f621SRichard Henderson /* Register helpers. */ 35884fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 35984fd9dd3SRichard Henderson s->helpers = helper_table = g_hash_table_new(NULL, NULL); 36084fd9dd3SRichard Henderson 361100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 36284fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 36372866e82SRichard Henderson (gpointer)&all_helpers[i]); 364100b5e01SRichard Henderson } 3655cd8f621SRichard Henderson 366c896fe29Sbellard tcg_target_init(s); 367f69d277eSRichard Henderson process_op_defs(s); 36891478cefSRichard Henderson 36991478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 37091478cefSRichard Henderson the start of tcg_target_reg_alloc_order. */ 37191478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 37291478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 37391478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 37491478cefSRichard Henderson break; 37591478cefSRichard Henderson } 37691478cefSRichard Henderson } 37791478cefSRichard Henderson for (i = 0; i < n; ++i) { 37891478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 37991478cefSRichard Henderson } 38091478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 38191478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 38291478cefSRichard Henderson } 3839002ec79SRichard Henderson } 384b03cce8eSbellard 3856e3b2bfdSEmilio G. Cota /* 3866e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 3876e3b2bfdSEmilio G. Cota * sure that TBs and code are on different cache lines. 3886e3b2bfdSEmilio G. Cota */ 3896e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 3906e3b2bfdSEmilio G. Cota { 3916e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 3926e3b2bfdSEmilio G. Cota TranslationBlock *tb; 3936e3b2bfdSEmilio G. Cota void *next; 3946e3b2bfdSEmilio G. Cota 3956e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 3966e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 3976e3b2bfdSEmilio G. Cota 3986e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 3996e3b2bfdSEmilio G. Cota return NULL; 4006e3b2bfdSEmilio G. Cota } 4016e3b2bfdSEmilio G. Cota s->code_gen_ptr = next; 40257a26946SRichard Henderson s->data_gen_ptr = NULL; 4036e3b2bfdSEmilio G. Cota return tb; 4046e3b2bfdSEmilio G. Cota } 4056e3b2bfdSEmilio G. Cota 4069002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 4079002ec79SRichard Henderson { 4088163b749SRichard Henderson size_t prologue_size, total_size; 4098163b749SRichard Henderson void *buf0, *buf1; 4108163b749SRichard Henderson 4118163b749SRichard Henderson /* Put the prologue at the beginning of code_gen_buffer. */ 4128163b749SRichard Henderson buf0 = s->code_gen_buffer; 4138163b749SRichard Henderson s->code_ptr = buf0; 4148163b749SRichard Henderson s->code_buf = buf0; 4158163b749SRichard Henderson s->code_gen_prologue = buf0; 4168163b749SRichard Henderson 4178163b749SRichard Henderson /* Generate the prologue. */ 418b03cce8eSbellard tcg_target_qemu_prologue(s); 4198163b749SRichard Henderson buf1 = s->code_ptr; 4208163b749SRichard Henderson flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1); 4218163b749SRichard Henderson 4228163b749SRichard Henderson /* Deduct the prologue from the buffer. */ 4238163b749SRichard Henderson prologue_size = tcg_current_code_size(s); 4248163b749SRichard Henderson s->code_gen_ptr = buf1; 4258163b749SRichard Henderson s->code_gen_buffer = buf1; 4268163b749SRichard Henderson s->code_buf = buf1; 4278163b749SRichard Henderson total_size = s->code_gen_buffer_size - prologue_size; 4288163b749SRichard Henderson s->code_gen_buffer_size = total_size; 4298163b749SRichard Henderson 430b125f9dcSRichard Henderson /* Compute a high-water mark, at which we voluntarily flush the buffer 431b125f9dcSRichard Henderson and start over. The size here is arbitrary, significantly larger 432b125f9dcSRichard Henderson than we expect the code generation for any one opcode to require. */ 43323dceda6SRichard Henderson s->code_gen_highwater = s->code_gen_buffer + (total_size - 1024); 4348163b749SRichard Henderson 4358163b749SRichard Henderson tcg_register_jit(s->code_gen_buffer, total_size); 436d6b64b2bSRichard Henderson 437d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 438d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 4391ee73216SRichard Henderson qemu_log_lock(); 4408163b749SRichard Henderson qemu_log("PROLOGUE: [size=%zu]\n", prologue_size); 4418163b749SRichard Henderson log_disas(buf0, prologue_size); 442d6b64b2bSRichard Henderson qemu_log("\n"); 443d6b64b2bSRichard Henderson qemu_log_flush(); 4441ee73216SRichard Henderson qemu_log_unlock(); 445d6b64b2bSRichard Henderson } 446d6b64b2bSRichard Henderson #endif 447cedbcb01SEmilio G. Cota 448cedbcb01SEmilio G. Cota /* Assert that goto_ptr is implemented completely. */ 449cedbcb01SEmilio G. Cota if (TCG_TARGET_HAS_goto_ptr) { 450cedbcb01SEmilio G. Cota tcg_debug_assert(s->code_gen_epilogue != NULL); 451cedbcb01SEmilio G. Cota } 452c896fe29Sbellard } 453c896fe29Sbellard 454c896fe29Sbellard void tcg_func_start(TCGContext *s) 455c896fe29Sbellard { 456c896fe29Sbellard tcg_pool_reset(s); 457c896fe29Sbellard s->nb_temps = s->nb_globals; 4580ec9eabcSRichard Henderson 4590ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. */ 4600ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 4610ec9eabcSRichard Henderson 462c896fe29Sbellard s->nb_labels = 0; 463c896fe29Sbellard s->current_frame_offset = s->frame_start; 464c896fe29Sbellard 4650a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 4660a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 4670a209d4bSRichard Henderson #endif 4680a209d4bSRichard Henderson 469dcb8e758SRichard Henderson s->gen_op_buf[0].next = 1; 470dcb8e758SRichard Henderson s->gen_op_buf[0].prev = 0; 471dcb8e758SRichard Henderson s->gen_next_op_idx = 1; 472c45cb8bbSRichard Henderson s->gen_next_parm_idx = 0; 473c896fe29Sbellard } 474c896fe29Sbellard 4757ca4b752SRichard Henderson static inline int temp_idx(TCGContext *s, TCGTemp *ts) 476c896fe29Sbellard { 4777ca4b752SRichard Henderson ptrdiff_t n = ts - s->temps; 4787ca4b752SRichard Henderson tcg_debug_assert(n >= 0 && n < s->nb_temps); 4797ca4b752SRichard Henderson return n; 4807ca4b752SRichard Henderson } 4817ca4b752SRichard Henderson 4827ca4b752SRichard Henderson static inline TCGTemp *tcg_temp_alloc(TCGContext *s) 4837ca4b752SRichard Henderson { 4847ca4b752SRichard Henderson int n = s->nb_temps++; 4857ca4b752SRichard Henderson tcg_debug_assert(n < TCG_MAX_TEMPS); 4867ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 4877ca4b752SRichard Henderson } 4887ca4b752SRichard Henderson 4897ca4b752SRichard Henderson static inline TCGTemp *tcg_global_alloc(TCGContext *s) 4907ca4b752SRichard Henderson { 4917ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 4927ca4b752SRichard Henderson s->nb_globals++; 4937ca4b752SRichard Henderson return tcg_temp_alloc(s); 494c896fe29Sbellard } 495c896fe29Sbellard 496b3a62939SRichard Henderson static int tcg_global_reg_new_internal(TCGContext *s, TCGType type, 497b6638662SRichard Henderson TCGReg reg, const char *name) 498c896fe29Sbellard { 499c896fe29Sbellard TCGTemp *ts; 500c896fe29Sbellard 501b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 502c896fe29Sbellard tcg_abort(); 503b3a62939SRichard Henderson } 5047ca4b752SRichard Henderson 5057ca4b752SRichard Henderson ts = tcg_global_alloc(s); 506c896fe29Sbellard ts->base_type = type; 507c896fe29Sbellard ts->type = type; 508c896fe29Sbellard ts->fixed_reg = 1; 509c896fe29Sbellard ts->reg = reg; 510c896fe29Sbellard ts->name = name; 511c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 5127ca4b752SRichard Henderson 5137ca4b752SRichard Henderson return temp_idx(s, ts); 514a7812ae4Spbrook } 515a7812ae4Spbrook 516b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 517a7812ae4Spbrook { 518a7812ae4Spbrook int idx; 519b3a62939SRichard Henderson s->frame_start = start; 520b3a62939SRichard Henderson s->frame_end = start + size; 521b3a62939SRichard Henderson idx = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 522b3a62939SRichard Henderson s->frame_temp = &s->temps[idx]; 523b3a62939SRichard Henderson } 524a7812ae4Spbrook 525b6638662SRichard Henderson TCGv_i32 tcg_global_reg_new_i32(TCGReg reg, const char *name) 526b3a62939SRichard Henderson { 527b3a62939SRichard Henderson TCGContext *s = &tcg_ctx; 528b3a62939SRichard Henderson int idx; 529b3a62939SRichard Henderson 530b3a62939SRichard Henderson if (tcg_regset_test_reg(s->reserved_regs, reg)) { 531b3a62939SRichard Henderson tcg_abort(); 532b3a62939SRichard Henderson } 533b3a62939SRichard Henderson idx = tcg_global_reg_new_internal(s, TCG_TYPE_I32, reg, name); 534a7812ae4Spbrook return MAKE_TCGV_I32(idx); 535a7812ae4Spbrook } 536a7812ae4Spbrook 537b6638662SRichard Henderson TCGv_i64 tcg_global_reg_new_i64(TCGReg reg, const char *name) 538a7812ae4Spbrook { 539b3a62939SRichard Henderson TCGContext *s = &tcg_ctx; 540a7812ae4Spbrook int idx; 541a7812ae4Spbrook 542b3a62939SRichard Henderson if (tcg_regset_test_reg(s->reserved_regs, reg)) { 543b3a62939SRichard Henderson tcg_abort(); 544b3a62939SRichard Henderson } 545b3a62939SRichard Henderson idx = tcg_global_reg_new_internal(s, TCG_TYPE_I64, reg, name); 546a7812ae4Spbrook return MAKE_TCGV_I64(idx); 547c896fe29Sbellard } 548c896fe29Sbellard 549e1ccc054SRichard Henderson int tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 550e1ccc054SRichard Henderson intptr_t offset, const char *name) 551c896fe29Sbellard { 552c896fe29Sbellard TCGContext *s = &tcg_ctx; 5537ca4b752SRichard Henderson TCGTemp *base_ts = &s->temps[GET_TCGV_PTR(base)]; 5547ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 555b3915dbbSRichard Henderson int indirect_reg = 0, bigendian = 0; 5567ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 5577ca4b752SRichard Henderson bigendian = 1; 5587ca4b752SRichard Henderson #endif 559c896fe29Sbellard 560b3915dbbSRichard Henderson if (!base_ts->fixed_reg) { 5615a18407fSRichard Henderson /* We do not support double-indirect registers. */ 5625a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 563b3915dbbSRichard Henderson base_ts->indirect_base = 1; 5645a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 5655a18407fSRichard Henderson ? 2 : 1); 5665a18407fSRichard Henderson indirect_reg = 1; 567b3915dbbSRichard Henderson } 568b3915dbbSRichard Henderson 5697ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 5707ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 571c896fe29Sbellard char buf[64]; 5727ca4b752SRichard Henderson 5737ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 574c896fe29Sbellard ts->type = TCG_TYPE_I32; 575b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 576c896fe29Sbellard ts->mem_allocated = 1; 577b3a62939SRichard Henderson ts->mem_base = base_ts; 5787ca4b752SRichard Henderson ts->mem_offset = offset + bigendian * 4; 579c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 580c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 581c896fe29Sbellard ts->name = strdup(buf); 582c896fe29Sbellard 5837ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 5847ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 5857ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 586b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 5877ca4b752SRichard Henderson ts2->mem_allocated = 1; 5887ca4b752SRichard Henderson ts2->mem_base = base_ts; 5897ca4b752SRichard Henderson ts2->mem_offset = offset + (1 - bigendian) * 4; 590c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 591c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 592120c1084SRichard Henderson ts2->name = strdup(buf); 5937ca4b752SRichard Henderson } else { 594c896fe29Sbellard ts->base_type = type; 595c896fe29Sbellard ts->type = type; 596b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 597c896fe29Sbellard ts->mem_allocated = 1; 598b3a62939SRichard Henderson ts->mem_base = base_ts; 599c896fe29Sbellard ts->mem_offset = offset; 600c896fe29Sbellard ts->name = name; 601c896fe29Sbellard } 6027ca4b752SRichard Henderson return temp_idx(s, ts); 603c896fe29Sbellard } 604c896fe29Sbellard 6057ca4b752SRichard Henderson static int tcg_temp_new_internal(TCGType type, int temp_local) 606c896fe29Sbellard { 607c896fe29Sbellard TCGContext *s = &tcg_ctx; 608c896fe29Sbellard TCGTemp *ts; 609641d5fbeSbellard int idx, k; 610c896fe29Sbellard 6110ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 6120ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 6130ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 6140ec9eabcSRichard Henderson /* There is already an available temp with the right type. */ 6150ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 6160ec9eabcSRichard Henderson 617e8996ee0Sbellard ts = &s->temps[idx]; 618e8996ee0Sbellard ts->temp_allocated = 1; 6197ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 6207ca4b752SRichard Henderson tcg_debug_assert(ts->temp_local == temp_local); 621e8996ee0Sbellard } else { 6227ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 6237ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 6247ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 6257ca4b752SRichard Henderson 626c896fe29Sbellard ts->base_type = type; 627c896fe29Sbellard ts->type = TCG_TYPE_I32; 628e8996ee0Sbellard ts->temp_allocated = 1; 629641d5fbeSbellard ts->temp_local = temp_local; 6307ca4b752SRichard Henderson 6317ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 6327ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 6337ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 6347ca4b752SRichard Henderson ts2->temp_allocated = 1; 6357ca4b752SRichard Henderson ts2->temp_local = temp_local; 6367ca4b752SRichard Henderson } else { 637c896fe29Sbellard ts->base_type = type; 638c896fe29Sbellard ts->type = type; 639e8996ee0Sbellard ts->temp_allocated = 1; 640641d5fbeSbellard ts->temp_local = temp_local; 641c896fe29Sbellard } 6427ca4b752SRichard Henderson idx = temp_idx(s, ts); 643e8996ee0Sbellard } 64427bfd83cSPeter Maydell 64527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 64627bfd83cSPeter Maydell s->temps_in_use++; 64727bfd83cSPeter Maydell #endif 648a7812ae4Spbrook return idx; 649c896fe29Sbellard } 650c896fe29Sbellard 651a7812ae4Spbrook TCGv_i32 tcg_temp_new_internal_i32(int temp_local) 652a7812ae4Spbrook { 653a7812ae4Spbrook int idx; 654a7812ae4Spbrook 655a7812ae4Spbrook idx = tcg_temp_new_internal(TCG_TYPE_I32, temp_local); 656a7812ae4Spbrook return MAKE_TCGV_I32(idx); 657a7812ae4Spbrook } 658a7812ae4Spbrook 659a7812ae4Spbrook TCGv_i64 tcg_temp_new_internal_i64(int temp_local) 660a7812ae4Spbrook { 661a7812ae4Spbrook int idx; 662a7812ae4Spbrook 663a7812ae4Spbrook idx = tcg_temp_new_internal(TCG_TYPE_I64, temp_local); 664a7812ae4Spbrook return MAKE_TCGV_I64(idx); 665a7812ae4Spbrook } 666a7812ae4Spbrook 6670ec9eabcSRichard Henderson static void tcg_temp_free_internal(int idx) 668c896fe29Sbellard { 669c896fe29Sbellard TCGContext *s = &tcg_ctx; 670c896fe29Sbellard TCGTemp *ts; 671641d5fbeSbellard int k; 672c896fe29Sbellard 67327bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 67427bfd83cSPeter Maydell s->temps_in_use--; 67527bfd83cSPeter Maydell if (s->temps_in_use < 0) { 67627bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 67727bfd83cSPeter Maydell } 67827bfd83cSPeter Maydell #endif 67927bfd83cSPeter Maydell 680eabb7b91SAurelien Jarno tcg_debug_assert(idx >= s->nb_globals && idx < s->nb_temps); 681c896fe29Sbellard ts = &s->temps[idx]; 682eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 683e8996ee0Sbellard ts->temp_allocated = 0; 6840ec9eabcSRichard Henderson 68518d13fa2SAlexander Graf k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0); 6860ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 687e8996ee0Sbellard } 688e8996ee0Sbellard 689a7812ae4Spbrook void tcg_temp_free_i32(TCGv_i32 arg) 690e8996ee0Sbellard { 691a7812ae4Spbrook tcg_temp_free_internal(GET_TCGV_I32(arg)); 692a7812ae4Spbrook } 693a7812ae4Spbrook 694a7812ae4Spbrook void tcg_temp_free_i64(TCGv_i64 arg) 695a7812ae4Spbrook { 696a7812ae4Spbrook tcg_temp_free_internal(GET_TCGV_I64(arg)); 697a7812ae4Spbrook } 698a7812ae4Spbrook 699a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 700a7812ae4Spbrook { 701a7812ae4Spbrook TCGv_i32 t0; 702a7812ae4Spbrook t0 = tcg_temp_new_i32(); 703e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 704e8996ee0Sbellard return t0; 705c896fe29Sbellard } 706c896fe29Sbellard 707a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 708c896fe29Sbellard { 709a7812ae4Spbrook TCGv_i64 t0; 710a7812ae4Spbrook t0 = tcg_temp_new_i64(); 711e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 712e8996ee0Sbellard return t0; 713c896fe29Sbellard } 714c896fe29Sbellard 715a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 716bdffd4a9Saurel32 { 717a7812ae4Spbrook TCGv_i32 t0; 718a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 719bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 720bdffd4a9Saurel32 return t0; 721bdffd4a9Saurel32 } 722bdffd4a9Saurel32 723a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 724bdffd4a9Saurel32 { 725a7812ae4Spbrook TCGv_i64 t0; 726a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 727bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 728bdffd4a9Saurel32 return t0; 729bdffd4a9Saurel32 } 730bdffd4a9Saurel32 73127bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 73227bfd83cSPeter Maydell void tcg_clear_temp_count(void) 73327bfd83cSPeter Maydell { 73427bfd83cSPeter Maydell TCGContext *s = &tcg_ctx; 73527bfd83cSPeter Maydell s->temps_in_use = 0; 73627bfd83cSPeter Maydell } 73727bfd83cSPeter Maydell 73827bfd83cSPeter Maydell int tcg_check_temp_count(void) 73927bfd83cSPeter Maydell { 74027bfd83cSPeter Maydell TCGContext *s = &tcg_ctx; 74127bfd83cSPeter Maydell if (s->temps_in_use) { 74227bfd83cSPeter Maydell /* Clear the count so that we don't give another 74327bfd83cSPeter Maydell * warning immediately next time around. 74427bfd83cSPeter Maydell */ 74527bfd83cSPeter Maydell s->temps_in_use = 0; 74627bfd83cSPeter Maydell return 1; 74727bfd83cSPeter Maydell } 74827bfd83cSPeter Maydell return 0; 74927bfd83cSPeter Maydell } 75027bfd83cSPeter Maydell #endif 75127bfd83cSPeter Maydell 752be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream. 753be0f34b5SRichard Henderson Test the runtime variable that controls each opcode. */ 754be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 755be0f34b5SRichard Henderson { 756be0f34b5SRichard Henderson switch (op) { 757be0f34b5SRichard Henderson case INDEX_op_discard: 758be0f34b5SRichard Henderson case INDEX_op_set_label: 759be0f34b5SRichard Henderson case INDEX_op_call: 760be0f34b5SRichard Henderson case INDEX_op_br: 761be0f34b5SRichard Henderson case INDEX_op_mb: 762be0f34b5SRichard Henderson case INDEX_op_insn_start: 763be0f34b5SRichard Henderson case INDEX_op_exit_tb: 764be0f34b5SRichard Henderson case INDEX_op_goto_tb: 765be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 766be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 767be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 768be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 769be0f34b5SRichard Henderson return true; 770be0f34b5SRichard Henderson 771be0f34b5SRichard Henderson case INDEX_op_goto_ptr: 772be0f34b5SRichard Henderson return TCG_TARGET_HAS_goto_ptr; 773be0f34b5SRichard Henderson 774be0f34b5SRichard Henderson case INDEX_op_mov_i32: 775be0f34b5SRichard Henderson case INDEX_op_movi_i32: 776be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 777be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 778be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 779be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 780be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 781be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 782be0f34b5SRichard Henderson case INDEX_op_ld_i32: 783be0f34b5SRichard Henderson case INDEX_op_st8_i32: 784be0f34b5SRichard Henderson case INDEX_op_st16_i32: 785be0f34b5SRichard Henderson case INDEX_op_st_i32: 786be0f34b5SRichard Henderson case INDEX_op_add_i32: 787be0f34b5SRichard Henderson case INDEX_op_sub_i32: 788be0f34b5SRichard Henderson case INDEX_op_mul_i32: 789be0f34b5SRichard Henderson case INDEX_op_and_i32: 790be0f34b5SRichard Henderson case INDEX_op_or_i32: 791be0f34b5SRichard Henderson case INDEX_op_xor_i32: 792be0f34b5SRichard Henderson case INDEX_op_shl_i32: 793be0f34b5SRichard Henderson case INDEX_op_shr_i32: 794be0f34b5SRichard Henderson case INDEX_op_sar_i32: 795be0f34b5SRichard Henderson return true; 796be0f34b5SRichard Henderson 797be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 798be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 799be0f34b5SRichard Henderson case INDEX_op_div_i32: 800be0f34b5SRichard Henderson case INDEX_op_divu_i32: 801be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 802be0f34b5SRichard Henderson case INDEX_op_rem_i32: 803be0f34b5SRichard Henderson case INDEX_op_remu_i32: 804be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 805be0f34b5SRichard Henderson case INDEX_op_div2_i32: 806be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 807be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 808be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 809be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 810be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 811be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 812be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 813be0f34b5SRichard Henderson case INDEX_op_extract_i32: 814be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 815be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 816be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 817be0f34b5SRichard Henderson case INDEX_op_add2_i32: 818be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 819be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 820be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 821be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 822be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 823be0f34b5SRichard Henderson case INDEX_op_muls2_i32: 824be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 825be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 826be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 827be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 828be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 829be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 830be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 831be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 832be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 833be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 834be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 835be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 836be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 837be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 838be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 839be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 840be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 841be0f34b5SRichard Henderson case INDEX_op_not_i32: 842be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 843be0f34b5SRichard Henderson case INDEX_op_neg_i32: 844be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 845be0f34b5SRichard Henderson case INDEX_op_andc_i32: 846be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 847be0f34b5SRichard Henderson case INDEX_op_orc_i32: 848be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 849be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 850be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 851be0f34b5SRichard Henderson case INDEX_op_nand_i32: 852be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 853be0f34b5SRichard Henderson case INDEX_op_nor_i32: 854be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 855be0f34b5SRichard Henderson case INDEX_op_clz_i32: 856be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i32; 857be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 858be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 859be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 860be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 861be0f34b5SRichard Henderson 862be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 863be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 864be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 865be0f34b5SRichard Henderson 866be0f34b5SRichard Henderson case INDEX_op_mov_i64: 867be0f34b5SRichard Henderson case INDEX_op_movi_i64: 868be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 869be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 870be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 871be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 872be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 873be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 874be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 875be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 876be0f34b5SRichard Henderson case INDEX_op_ld_i64: 877be0f34b5SRichard Henderson case INDEX_op_st8_i64: 878be0f34b5SRichard Henderson case INDEX_op_st16_i64: 879be0f34b5SRichard Henderson case INDEX_op_st32_i64: 880be0f34b5SRichard Henderson case INDEX_op_st_i64: 881be0f34b5SRichard Henderson case INDEX_op_add_i64: 882be0f34b5SRichard Henderson case INDEX_op_sub_i64: 883be0f34b5SRichard Henderson case INDEX_op_mul_i64: 884be0f34b5SRichard Henderson case INDEX_op_and_i64: 885be0f34b5SRichard Henderson case INDEX_op_or_i64: 886be0f34b5SRichard Henderson case INDEX_op_xor_i64: 887be0f34b5SRichard Henderson case INDEX_op_shl_i64: 888be0f34b5SRichard Henderson case INDEX_op_shr_i64: 889be0f34b5SRichard Henderson case INDEX_op_sar_i64: 890be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 891be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 892be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 893be0f34b5SRichard Henderson 894be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 895be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 896be0f34b5SRichard Henderson case INDEX_op_div_i64: 897be0f34b5SRichard Henderson case INDEX_op_divu_i64: 898be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 899be0f34b5SRichard Henderson case INDEX_op_rem_i64: 900be0f34b5SRichard Henderson case INDEX_op_remu_i64: 901be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 902be0f34b5SRichard Henderson case INDEX_op_div2_i64: 903be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 904be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 905be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 906be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 907be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 908be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 909be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 910be0f34b5SRichard Henderson case INDEX_op_extract_i64: 911be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 912be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 913be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 914be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 915be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 916be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 917be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 918be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 919be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 920be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 921be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i64; 922be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 923be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 924be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 925be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 926be0f34b5SRichard Henderson case INDEX_op_ext16u_i64: 927be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 928be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 929be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 930be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 931be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 932be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 933be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 934be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 935be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 936be0f34b5SRichard Henderson case INDEX_op_not_i64: 937be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 938be0f34b5SRichard Henderson case INDEX_op_neg_i64: 939be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 940be0f34b5SRichard Henderson case INDEX_op_andc_i64: 941be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 942be0f34b5SRichard Henderson case INDEX_op_orc_i64: 943be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 944be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 945be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 946be0f34b5SRichard Henderson case INDEX_op_nand_i64: 947be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 948be0f34b5SRichard Henderson case INDEX_op_nor_i64: 949be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 950be0f34b5SRichard Henderson case INDEX_op_clz_i64: 951be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 952be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 953be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 954be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 955be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 956be0f34b5SRichard Henderson case INDEX_op_add2_i64: 957be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 958be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 959be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 960be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 961be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 962be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 963be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 964be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 965be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 966be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 967be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 968be0f34b5SRichard Henderson 969be0f34b5SRichard Henderson case NB_OPS: 970be0f34b5SRichard Henderson break; 971be0f34b5SRichard Henderson } 972be0f34b5SRichard Henderson g_assert_not_reached(); 973be0f34b5SRichard Henderson } 974be0f34b5SRichard Henderson 97539cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 97639cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 97739cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 978bbb8a1b4SRichard Henderson void tcg_gen_callN(TCGContext *s, void *func, TCGArg ret, 979bbb8a1b4SRichard Henderson int nargs, TCGArg *args) 980c896fe29Sbellard { 981c45cb8bbSRichard Henderson int i, real_args, nb_rets, pi, pi_first; 982bbb8a1b4SRichard Henderson unsigned sizemask, flags; 983afb49896SRichard Henderson TCGHelperInfo *info; 984afb49896SRichard Henderson 985afb49896SRichard Henderson info = g_hash_table_lookup(s->helpers, (gpointer)func); 986bbb8a1b4SRichard Henderson flags = info->flags; 987bbb8a1b4SRichard Henderson sizemask = info->sizemask; 9882bece2c8SRichard Henderson 98934b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 99034b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 99134b1a49cSRichard Henderson /* We have 64-bit values in one register, but need to pass as two 99234b1a49cSRichard Henderson separate parameters. Split them. */ 99334b1a49cSRichard Henderson int orig_sizemask = sizemask; 99434b1a49cSRichard Henderson int orig_nargs = nargs; 99534b1a49cSRichard Henderson TCGv_i64 retl, reth; 99634b1a49cSRichard Henderson 99734b1a49cSRichard Henderson TCGV_UNUSED_I64(retl); 99834b1a49cSRichard Henderson TCGV_UNUSED_I64(reth); 99934b1a49cSRichard Henderson if (sizemask != 0) { 100034b1a49cSRichard Henderson TCGArg *split_args = __builtin_alloca(sizeof(TCGArg) * nargs * 2); 100134b1a49cSRichard Henderson for (i = real_args = 0; i < nargs; ++i) { 100234b1a49cSRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 100334b1a49cSRichard Henderson if (is_64bit) { 100434b1a49cSRichard Henderson TCGv_i64 orig = MAKE_TCGV_I64(args[i]); 100534b1a49cSRichard Henderson TCGv_i32 h = tcg_temp_new_i32(); 100634b1a49cSRichard Henderson TCGv_i32 l = tcg_temp_new_i32(); 100734b1a49cSRichard Henderson tcg_gen_extr_i64_i32(l, h, orig); 100834b1a49cSRichard Henderson split_args[real_args++] = GET_TCGV_I32(h); 100934b1a49cSRichard Henderson split_args[real_args++] = GET_TCGV_I32(l); 101034b1a49cSRichard Henderson } else { 101134b1a49cSRichard Henderson split_args[real_args++] = args[i]; 101234b1a49cSRichard Henderson } 101334b1a49cSRichard Henderson } 101434b1a49cSRichard Henderson nargs = real_args; 101534b1a49cSRichard Henderson args = split_args; 101634b1a49cSRichard Henderson sizemask = 0; 101734b1a49cSRichard Henderson } 101834b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 10192bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 10202bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 10212bece2c8SRichard Henderson int is_signed = sizemask & (2 << (i+1)*2); 10222bece2c8SRichard Henderson if (!is_64bit) { 10232bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 10242bece2c8SRichard Henderson TCGv_i64 orig = MAKE_TCGV_I64(args[i]); 10252bece2c8SRichard Henderson if (is_signed) { 10262bece2c8SRichard Henderson tcg_gen_ext32s_i64(temp, orig); 10272bece2c8SRichard Henderson } else { 10282bece2c8SRichard Henderson tcg_gen_ext32u_i64(temp, orig); 10292bece2c8SRichard Henderson } 10302bece2c8SRichard Henderson args[i] = GET_TCGV_I64(temp); 10312bece2c8SRichard Henderson } 10322bece2c8SRichard Henderson } 10332bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 10342bece2c8SRichard Henderson 1035c45cb8bbSRichard Henderson pi_first = pi = s->gen_next_parm_idx; 1036a7812ae4Spbrook if (ret != TCG_CALL_DUMMY_ARG) { 103734b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 103834b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 103934b1a49cSRichard Henderson if (orig_sizemask & 1) { 104034b1a49cSRichard Henderson /* The 32-bit ABI is going to return the 64-bit value in 104134b1a49cSRichard Henderson the %o0/%o1 register pair. Prepare for this by using 104234b1a49cSRichard Henderson two return temporaries, and reassemble below. */ 104334b1a49cSRichard Henderson retl = tcg_temp_new_i64(); 104434b1a49cSRichard Henderson reth = tcg_temp_new_i64(); 1045c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = GET_TCGV_I64(reth); 1046c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = GET_TCGV_I64(retl); 104734b1a49cSRichard Henderson nb_rets = 2; 104834b1a49cSRichard Henderson } else { 1049c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 105034b1a49cSRichard Henderson nb_rets = 1; 105134b1a49cSRichard Henderson } 105234b1a49cSRichard Henderson #else 105334b1a49cSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) { 105402eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 1055c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret + 1; 1056c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 1057a7812ae4Spbrook #else 1058c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 1059c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret + 1; 1060a7812ae4Spbrook #endif 1061a7812ae4Spbrook nb_rets = 2; 106234b1a49cSRichard Henderson } else { 1063c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 1064a7812ae4Spbrook nb_rets = 1; 1065a7812ae4Spbrook } 106634b1a49cSRichard Henderson #endif 1067a7812ae4Spbrook } else { 1068a7812ae4Spbrook nb_rets = 0; 1069a7812ae4Spbrook } 1070a7812ae4Spbrook real_args = 0; 1071a7812ae4Spbrook for (i = 0; i < nargs; i++) { 10722bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 1073bbb8a1b4SRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 107439cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS 107539cf05d3Sbellard /* some targets want aligned 64 bit args */ 1076ebd486d5Smalc if (real_args & 1) { 1077c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = TCG_CALL_DUMMY_ARG; 1078ebd486d5Smalc real_args++; 107939cf05d3Sbellard } 108039cf05d3Sbellard #endif 10813f90f252SRichard Henderson /* If stack grows up, then we will be placing successive 10823f90f252SRichard Henderson arguments at lower addresses, which means we need to 10833f90f252SRichard Henderson reverse the order compared to how we would normally 10843f90f252SRichard Henderson treat either big or little-endian. For those arguments 10853f90f252SRichard Henderson that will wind up in registers, this still works for 10863f90f252SRichard Henderson HPPA (the only current STACK_GROWSUP target) since the 10873f90f252SRichard Henderson argument registers are *also* allocated in decreasing 10883f90f252SRichard Henderson order. If another such target is added, this logic may 10893f90f252SRichard Henderson have to get more complicated to differentiate between 10903f90f252SRichard Henderson stack arguments and register arguments. */ 109102eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP) 1092c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i] + 1; 1093c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i]; 1094c896fe29Sbellard #else 1095c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i]; 1096c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i] + 1; 1097c896fe29Sbellard #endif 1098a7812ae4Spbrook real_args += 2; 10992bece2c8SRichard Henderson continue; 11002bece2c8SRichard Henderson } 11012bece2c8SRichard Henderson 1102c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i]; 1103a7812ae4Spbrook real_args++; 1104c896fe29Sbellard } 1105c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = (uintptr_t)func; 1106c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = flags; 1107a7812ae4Spbrook 1108c45cb8bbSRichard Henderson i = s->gen_next_op_idx; 1109c45cb8bbSRichard Henderson tcg_debug_assert(i < OPC_BUF_SIZE); 1110c45cb8bbSRichard Henderson tcg_debug_assert(pi <= OPPARAM_BUF_SIZE); 1111a7812ae4Spbrook 1112c45cb8bbSRichard Henderson /* Set links for sequential allocation during translation. */ 1113c45cb8bbSRichard Henderson s->gen_op_buf[i] = (TCGOp){ 1114c45cb8bbSRichard Henderson .opc = INDEX_op_call, 1115c45cb8bbSRichard Henderson .callo = nb_rets, 1116c45cb8bbSRichard Henderson .calli = real_args, 1117c45cb8bbSRichard Henderson .args = pi_first, 1118c45cb8bbSRichard Henderson .prev = i - 1, 1119c45cb8bbSRichard Henderson .next = i + 1 1120c45cb8bbSRichard Henderson }; 1121c45cb8bbSRichard Henderson 1122c45cb8bbSRichard Henderson /* Make sure the calli field didn't overflow. */ 1123c45cb8bbSRichard Henderson tcg_debug_assert(s->gen_op_buf[i].calli == real_args); 1124c45cb8bbSRichard Henderson 1125dcb8e758SRichard Henderson s->gen_op_buf[0].prev = i; 1126c45cb8bbSRichard Henderson s->gen_next_op_idx = i + 1; 1127c45cb8bbSRichard Henderson s->gen_next_parm_idx = pi; 11282bece2c8SRichard Henderson 112934b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 113034b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 113134b1a49cSRichard Henderson /* Free all of the parts we allocated above. */ 113234b1a49cSRichard Henderson for (i = real_args = 0; i < orig_nargs; ++i) { 113334b1a49cSRichard Henderson int is_64bit = orig_sizemask & (1 << (i+1)*2); 113434b1a49cSRichard Henderson if (is_64bit) { 113534b1a49cSRichard Henderson TCGv_i32 h = MAKE_TCGV_I32(args[real_args++]); 113634b1a49cSRichard Henderson TCGv_i32 l = MAKE_TCGV_I32(args[real_args++]); 113734b1a49cSRichard Henderson tcg_temp_free_i32(h); 113834b1a49cSRichard Henderson tcg_temp_free_i32(l); 113934b1a49cSRichard Henderson } else { 114034b1a49cSRichard Henderson real_args++; 114134b1a49cSRichard Henderson } 114234b1a49cSRichard Henderson } 114334b1a49cSRichard Henderson if (orig_sizemask & 1) { 114434b1a49cSRichard Henderson /* The 32-bit ABI returned two 32-bit pieces. Re-assemble them. 114534b1a49cSRichard Henderson Note that describing these as TCGv_i64 eliminates an unnecessary 114634b1a49cSRichard Henderson zero-extension that tcg_gen_concat_i32_i64 would create. */ 114734b1a49cSRichard Henderson tcg_gen_concat32_i64(MAKE_TCGV_I64(ret), retl, reth); 114834b1a49cSRichard Henderson tcg_temp_free_i64(retl); 114934b1a49cSRichard Henderson tcg_temp_free_i64(reth); 115034b1a49cSRichard Henderson } 115134b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 11522bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 11532bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 11542bece2c8SRichard Henderson if (!is_64bit) { 11552bece2c8SRichard Henderson TCGv_i64 temp = MAKE_TCGV_I64(args[i]); 11562bece2c8SRichard Henderson tcg_temp_free_i64(temp); 11572bece2c8SRichard Henderson } 11582bece2c8SRichard Henderson } 11592bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1160a7812ae4Spbrook } 1161c896fe29Sbellard 11628fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1163c896fe29Sbellard { 1164c896fe29Sbellard int i; 1165c896fe29Sbellard TCGTemp *ts; 1166c896fe29Sbellard for(i = 0; i < s->nb_globals; i++) { 1167c896fe29Sbellard ts = &s->temps[i]; 1168c896fe29Sbellard if (ts->fixed_reg) { 1169c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 1170c896fe29Sbellard } else { 1171c896fe29Sbellard ts->val_type = TEMP_VAL_MEM; 1172c896fe29Sbellard } 1173c896fe29Sbellard } 1174e8996ee0Sbellard for(i = s->nb_globals; i < s->nb_temps; i++) { 1175e8996ee0Sbellard ts = &s->temps[i]; 11767dfd8c6aSAurelien Jarno if (ts->temp_local) { 11777dfd8c6aSAurelien Jarno ts->val_type = TEMP_VAL_MEM; 11787dfd8c6aSAurelien Jarno } else { 1179e8996ee0Sbellard ts->val_type = TEMP_VAL_DEAD; 11807dfd8c6aSAurelien Jarno } 1181e8996ee0Sbellard ts->mem_allocated = 0; 1182e8996ee0Sbellard ts->fixed_reg = 0; 1183e8996ee0Sbellard } 1184f8b2f202SRichard Henderson 1185f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1186c896fe29Sbellard } 1187c896fe29Sbellard 1188f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1189f8b2f202SRichard Henderson TCGTemp *ts) 1190c896fe29Sbellard { 1191f8b2f202SRichard Henderson int idx = temp_idx(s, ts); 1192ac56dd48Spbrook 1193ac56dd48Spbrook if (idx < s->nb_globals) { 1194ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1195f8b2f202SRichard Henderson } else if (ts->temp_local) { 1196641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1197f8b2f202SRichard Henderson } else { 1198ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1199c896fe29Sbellard } 1200c896fe29Sbellard return buf; 1201c896fe29Sbellard } 1202c896fe29Sbellard 1203f8b2f202SRichard Henderson static char *tcg_get_arg_str_idx(TCGContext *s, char *buf, 1204f8b2f202SRichard Henderson int buf_size, int idx) 1205f8b2f202SRichard Henderson { 1206eabb7b91SAurelien Jarno tcg_debug_assert(idx >= 0 && idx < s->nb_temps); 1207f8b2f202SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, &s->temps[idx]); 1208f8b2f202SRichard Henderson } 1209f8b2f202SRichard Henderson 12106e085f72SRichard Henderson /* Find helper name. */ 12116e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val) 1212e8996ee0Sbellard { 12136e085f72SRichard Henderson const char *ret = NULL; 12146e085f72SRichard Henderson if (s->helpers) { 121572866e82SRichard Henderson TCGHelperInfo *info = g_hash_table_lookup(s->helpers, (gpointer)val); 121672866e82SRichard Henderson if (info) { 121772866e82SRichard Henderson ret = info->name; 121872866e82SRichard Henderson } 1219e8996ee0Sbellard } 12206e085f72SRichard Henderson return ret; 12214dc81f28Sbellard } 12224dc81f28Sbellard 1223f48f3edeSblueswir1 static const char * const cond_name[] = 1224f48f3edeSblueswir1 { 12250aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 12260aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1227f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1228f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1229f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1230f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1231f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1232f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1233f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1234f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1235f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1236f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1237f48f3edeSblueswir1 }; 1238f48f3edeSblueswir1 1239f713d6adSRichard Henderson static const char * const ldst_name[] = 1240f713d6adSRichard Henderson { 1241f713d6adSRichard Henderson [MO_UB] = "ub", 1242f713d6adSRichard Henderson [MO_SB] = "sb", 1243f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1244f713d6adSRichard Henderson [MO_LESW] = "lesw", 1245f713d6adSRichard Henderson [MO_LEUL] = "leul", 1246f713d6adSRichard Henderson [MO_LESL] = "lesl", 1247f713d6adSRichard Henderson [MO_LEQ] = "leq", 1248f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1249f713d6adSRichard Henderson [MO_BESW] = "besw", 1250f713d6adSRichard Henderson [MO_BEUL] = "beul", 1251f713d6adSRichard Henderson [MO_BESL] = "besl", 1252f713d6adSRichard Henderson [MO_BEQ] = "beq", 1253f713d6adSRichard Henderson }; 1254f713d6adSRichard Henderson 12551f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 12561f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY 12571f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "un+", 12581f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 12591f00b27fSSergey Sorokin #else 12601f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 12611f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 12621f00b27fSSergey Sorokin #endif 12631f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 12641f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 12651f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 12661f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 12671f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 12681f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 12691f00b27fSSergey Sorokin }; 12701f00b27fSSergey Sorokin 1271eeacee4dSBlue Swirl void tcg_dump_ops(TCGContext *s) 1272c896fe29Sbellard { 1273c896fe29Sbellard char buf[128]; 1274c45cb8bbSRichard Henderson TCGOp *op; 1275c45cb8bbSRichard Henderson int oi; 1276c896fe29Sbellard 1277dcb8e758SRichard Henderson for (oi = s->gen_op_buf[0].next; oi != 0; oi = op->next) { 1278c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1279c45cb8bbSRichard Henderson const TCGOpDef *def; 1280c45cb8bbSRichard Henderson const TCGArg *args; 1281c45cb8bbSRichard Henderson TCGOpcode c; 1282bdfb460eSRichard Henderson int col = 0; 1283c45cb8bbSRichard Henderson 1284c45cb8bbSRichard Henderson op = &s->gen_op_buf[oi]; 1285c45cb8bbSRichard Henderson c = op->opc; 1286c896fe29Sbellard def = &tcg_op_defs[c]; 1287c45cb8bbSRichard Henderson args = &s->gen_opparam_buf[op->args]; 1288c45cb8bbSRichard Henderson 1289765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 1290bdfb460eSRichard Henderson col += qemu_log("%s ----", oi != s->gen_op_buf[0].next ? "\n" : ""); 12919aef40edSRichard Henderson 12929aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 12939aef40edSRichard Henderson target_ulong a; 12947e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 12959aef40edSRichard Henderson a = ((target_ulong)args[i * 2 + 1] << 32) | args[i * 2]; 12967e4597d7Sbellard #else 12979aef40edSRichard Henderson a = args[i]; 12987e4597d7Sbellard #endif 1299bdfb460eSRichard Henderson col += qemu_log(" " TARGET_FMT_lx, a); 1300eeacee4dSBlue Swirl } 13017e4597d7Sbellard } else if (c == INDEX_op_call) { 1302c896fe29Sbellard /* variable number of arguments */ 1303c45cb8bbSRichard Henderson nb_oargs = op->callo; 1304c45cb8bbSRichard Henderson nb_iargs = op->calli; 1305c896fe29Sbellard nb_cargs = def->nb_cargs; 1306b03cce8eSbellard 1307cf066674SRichard Henderson /* function name, flags, out args */ 1308bdfb460eSRichard Henderson col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name, 1309cf066674SRichard Henderson tcg_find_helper(s, args[nb_oargs + nb_iargs]), 1310cf066674SRichard Henderson args[nb_oargs + nb_iargs + 1], nb_oargs); 1311b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 1312bdfb460eSRichard Henderson col += qemu_log(",%s", tcg_get_arg_str_idx(s, buf, sizeof(buf), 1313eeacee4dSBlue Swirl args[i])); 1314b03cce8eSbellard } 1315cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1316cf066674SRichard Henderson TCGArg arg = args[nb_oargs + i]; 1317cf066674SRichard Henderson const char *t = "<dummy>"; 1318cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 1319cf066674SRichard Henderson t = tcg_get_arg_str_idx(s, buf, sizeof(buf), arg); 1320b03cce8eSbellard } 1321bdfb460eSRichard Henderson col += qemu_log(",%s", t); 1322e8996ee0Sbellard } 1323b03cce8eSbellard } else { 1324bdfb460eSRichard Henderson col += qemu_log(" %s ", def->name); 1325c45cb8bbSRichard Henderson 1326c896fe29Sbellard nb_oargs = def->nb_oargs; 1327c896fe29Sbellard nb_iargs = def->nb_iargs; 1328c896fe29Sbellard nb_cargs = def->nb_cargs; 1329c896fe29Sbellard 1330c896fe29Sbellard k = 0; 1331c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1332eeacee4dSBlue Swirl if (k != 0) { 1333bdfb460eSRichard Henderson col += qemu_log(","); 1334eeacee4dSBlue Swirl } 1335bdfb460eSRichard Henderson col += qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf), 1336eeacee4dSBlue Swirl args[k++])); 1337c896fe29Sbellard } 1338c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1339eeacee4dSBlue Swirl if (k != 0) { 1340bdfb460eSRichard Henderson col += qemu_log(","); 1341eeacee4dSBlue Swirl } 1342bdfb460eSRichard Henderson col += qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf), 1343eeacee4dSBlue Swirl args[k++])); 1344c896fe29Sbellard } 1345be210acbSRichard Henderson switch (c) { 1346be210acbSRichard Henderson case INDEX_op_brcond_i32: 1347ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1348ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1349be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1350be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1351ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1352be210acbSRichard Henderson case INDEX_op_setcond_i64: 1353ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1354eeacee4dSBlue Swirl if (args[k] < ARRAY_SIZE(cond_name) && cond_name[args[k]]) { 1355bdfb460eSRichard Henderson col += qemu_log(",%s", cond_name[args[k++]]); 1356eeacee4dSBlue Swirl } else { 1357bdfb460eSRichard Henderson col += qemu_log(",$0x%" TCG_PRIlx, args[k++]); 1358eeacee4dSBlue Swirl } 1359f48f3edeSblueswir1 i = 1; 1360be210acbSRichard Henderson break; 1361f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1362f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 1363f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 1364f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 136559227d5dSRichard Henderson { 136659227d5dSRichard Henderson TCGMemOpIdx oi = args[k++]; 136759227d5dSRichard Henderson TCGMemOp op = get_memop(oi); 136859227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 136959227d5dSRichard Henderson 137059c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 1371bdfb460eSRichard Henderson col += qemu_log(",$0x%x,%u", op, ix); 137259c4b7e8SRichard Henderson } else { 13731f00b27fSSergey Sorokin const char *s_al, *s_op; 13741f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 137559c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 1376bdfb460eSRichard Henderson col += qemu_log(",%s%s,%u", s_al, s_op, ix); 1377f713d6adSRichard Henderson } 1378f713d6adSRichard Henderson i = 1; 137959227d5dSRichard Henderson } 1380f713d6adSRichard Henderson break; 1381be210acbSRichard Henderson default: 1382f48f3edeSblueswir1 i = 0; 1383be210acbSRichard Henderson break; 1384be210acbSRichard Henderson } 138551e3972cSRichard Henderson switch (c) { 138651e3972cSRichard Henderson case INDEX_op_set_label: 138751e3972cSRichard Henderson case INDEX_op_br: 138851e3972cSRichard Henderson case INDEX_op_brcond_i32: 138951e3972cSRichard Henderson case INDEX_op_brcond_i64: 139051e3972cSRichard Henderson case INDEX_op_brcond2_i32: 1391bdfb460eSRichard Henderson col += qemu_log("%s$L%d", k ? "," : "", arg_label(args[k])->id); 139251e3972cSRichard Henderson i++, k++; 139351e3972cSRichard Henderson break; 139451e3972cSRichard Henderson default: 139551e3972cSRichard Henderson break; 1396eeacee4dSBlue Swirl } 139751e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 1398bdfb460eSRichard Henderson col += qemu_log("%s$0x%" TCG_PRIlx, k ? "," : "", args[k]); 1399bdfb460eSRichard Henderson } 1400bdfb460eSRichard Henderson } 1401bdfb460eSRichard Henderson if (op->life) { 1402bdfb460eSRichard Henderson unsigned life = op->life; 1403bdfb460eSRichard Henderson 1404bdfb460eSRichard Henderson for (; col < 48; ++col) { 1405bdfb460eSRichard Henderson putc(' ', qemu_logfile); 1406bdfb460eSRichard Henderson } 1407bdfb460eSRichard Henderson 1408bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 1409bdfb460eSRichard Henderson qemu_log(" sync:"); 1410bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 1411bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 1412bdfb460eSRichard Henderson qemu_log(" %d", i); 1413bdfb460eSRichard Henderson } 1414bdfb460eSRichard Henderson } 1415bdfb460eSRichard Henderson } 1416bdfb460eSRichard Henderson life /= DEAD_ARG; 1417bdfb460eSRichard Henderson if (life) { 1418bdfb460eSRichard Henderson qemu_log(" dead:"); 1419bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 1420bdfb460eSRichard Henderson if (life & 1) { 1421bdfb460eSRichard Henderson qemu_log(" %d", i); 1422bdfb460eSRichard Henderson } 1423bdfb460eSRichard Henderson } 1424c896fe29Sbellard } 1425b03cce8eSbellard } 1426eeacee4dSBlue Swirl qemu_log("\n"); 1427c896fe29Sbellard } 1428c896fe29Sbellard } 1429c896fe29Sbellard 1430c896fe29Sbellard /* we give more priority to constraints with less registers */ 1431c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 1432c896fe29Sbellard { 1433c896fe29Sbellard const TCGArgConstraint *arg_ct; 1434c896fe29Sbellard 1435c896fe29Sbellard int i, n; 1436c896fe29Sbellard arg_ct = &def->args_ct[k]; 1437c896fe29Sbellard if (arg_ct->ct & TCG_CT_ALIAS) { 1438c896fe29Sbellard /* an alias is equivalent to a single register */ 1439c896fe29Sbellard n = 1; 1440c896fe29Sbellard } else { 1441c896fe29Sbellard if (!(arg_ct->ct & TCG_CT_REG)) 1442c896fe29Sbellard return 0; 1443c896fe29Sbellard n = 0; 1444c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 1445c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, i)) 1446c896fe29Sbellard n++; 1447c896fe29Sbellard } 1448c896fe29Sbellard } 1449c896fe29Sbellard return TCG_TARGET_NB_REGS - n + 1; 1450c896fe29Sbellard } 1451c896fe29Sbellard 1452c896fe29Sbellard /* sort from highest priority to lowest */ 1453c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 1454c896fe29Sbellard { 1455c896fe29Sbellard int i, j, p1, p2, tmp; 1456c896fe29Sbellard 1457c896fe29Sbellard for(i = 0; i < n; i++) 1458c896fe29Sbellard def->sorted_args[start + i] = start + i; 1459c896fe29Sbellard if (n <= 1) 1460c896fe29Sbellard return; 1461c896fe29Sbellard for(i = 0; i < n - 1; i++) { 1462c896fe29Sbellard for(j = i + 1; j < n; j++) { 1463c896fe29Sbellard p1 = get_constraint_priority(def, def->sorted_args[start + i]); 1464c896fe29Sbellard p2 = get_constraint_priority(def, def->sorted_args[start + j]); 1465c896fe29Sbellard if (p1 < p2) { 1466c896fe29Sbellard tmp = def->sorted_args[start + i]; 1467c896fe29Sbellard def->sorted_args[start + i] = def->sorted_args[start + j]; 1468c896fe29Sbellard def->sorted_args[start + j] = tmp; 1469c896fe29Sbellard } 1470c896fe29Sbellard } 1471c896fe29Sbellard } 1472c896fe29Sbellard } 1473c896fe29Sbellard 1474f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 1475c896fe29Sbellard { 1476a9751609SRichard Henderson TCGOpcode op; 1477c896fe29Sbellard 1478f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 1479f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 1480f69d277eSRichard Henderson const TCGTargetOpDef *tdefs; 1481069ea736SRichard Henderson TCGType type; 1482069ea736SRichard Henderson int i, nb_args; 1483f69d277eSRichard Henderson 1484f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 1485f69d277eSRichard Henderson continue; 1486f69d277eSRichard Henderson } 1487f69d277eSRichard Henderson 1488c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 1489f69d277eSRichard Henderson if (nb_args == 0) { 1490f69d277eSRichard Henderson continue; 1491f69d277eSRichard Henderson } 1492f69d277eSRichard Henderson 1493f69d277eSRichard Henderson tdefs = tcg_target_op_def(op); 1494f69d277eSRichard Henderson /* Missing TCGTargetOpDef entry. */ 1495f69d277eSRichard Henderson tcg_debug_assert(tdefs != NULL); 1496f69d277eSRichard Henderson 1497069ea736SRichard Henderson type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32); 1498c896fe29Sbellard for (i = 0; i < nb_args; i++) { 1499f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 1500f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 1501eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 1502f69d277eSRichard Henderson 1503*ccb1bb66SRichard Henderson def->args_ct[i].u.regs = 0; 1504c896fe29Sbellard def->args_ct[i].ct = 0; 150517280ff4SRichard Henderson while (*ct_str != '\0') { 150617280ff4SRichard Henderson switch(*ct_str) { 150717280ff4SRichard Henderson case '0' ... '9': 150817280ff4SRichard Henderson { 150917280ff4SRichard Henderson int oarg = *ct_str - '0'; 151017280ff4SRichard Henderson tcg_debug_assert(ct_str == tdefs->args_ct_str[i]); 1511eabb7b91SAurelien Jarno tcg_debug_assert(oarg < def->nb_oargs); 1512eabb7b91SAurelien Jarno tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG); 151317280ff4SRichard Henderson /* TCG_CT_ALIAS is for the output arguments. 151417280ff4SRichard Henderson The input is tagged with TCG_CT_IALIAS. */ 1515c896fe29Sbellard def->args_ct[i] = def->args_ct[oarg]; 151617280ff4SRichard Henderson def->args_ct[oarg].ct |= TCG_CT_ALIAS; 15175ff9d6a4Sbellard def->args_ct[oarg].alias_index = i; 1518c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_IALIAS; 15195ff9d6a4Sbellard def->args_ct[i].alias_index = oarg; 152017280ff4SRichard Henderson } 152117280ff4SRichard Henderson ct_str++; 1522c896fe29Sbellard break; 152382790a87SRichard Henderson case '&': 152482790a87SRichard Henderson def->args_ct[i].ct |= TCG_CT_NEWREG; 152582790a87SRichard Henderson ct_str++; 152682790a87SRichard Henderson break; 1527c896fe29Sbellard case 'i': 1528c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 1529c896fe29Sbellard ct_str++; 1530c896fe29Sbellard break; 1531c896fe29Sbellard default: 1532069ea736SRichard Henderson ct_str = target_parse_constraint(&def->args_ct[i], 1533069ea736SRichard Henderson ct_str, type); 1534f69d277eSRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 1535069ea736SRichard Henderson tcg_debug_assert(ct_str != NULL); 1536c896fe29Sbellard } 1537c896fe29Sbellard } 1538c896fe29Sbellard } 1539c896fe29Sbellard 1540c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? */ 1541eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 1542c68aaa18SStefan Weil 1543c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 1544c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 1545c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 1546c896fe29Sbellard } 1547c896fe29Sbellard } 1548c896fe29Sbellard 15490c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 15500c627cdcSRichard Henderson { 15510c627cdcSRichard Henderson int next = op->next; 15520c627cdcSRichard Henderson int prev = op->prev; 15530c627cdcSRichard Henderson 1554dcb8e758SRichard Henderson /* We should never attempt to remove the list terminator. */ 1555dcb8e758SRichard Henderson tcg_debug_assert(op != &s->gen_op_buf[0]); 15560c627cdcSRichard Henderson 1557dcb8e758SRichard Henderson s->gen_op_buf[next].prev = prev; 1558dcb8e758SRichard Henderson s->gen_op_buf[prev].next = next; 1559dcb8e758SRichard Henderson 1560dcb8e758SRichard Henderson memset(op, 0, sizeof(*op)); 15610c627cdcSRichard Henderson 15620c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 15630c627cdcSRichard Henderson s->del_op_count++; 15640c627cdcSRichard Henderson #endif 15650c627cdcSRichard Henderson } 15660c627cdcSRichard Henderson 15675a18407fSRichard Henderson TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, 15685a18407fSRichard Henderson TCGOpcode opc, int nargs) 15695a18407fSRichard Henderson { 15705a18407fSRichard Henderson int oi = s->gen_next_op_idx; 15715a18407fSRichard Henderson int pi = s->gen_next_parm_idx; 15725a18407fSRichard Henderson int prev = old_op->prev; 15735a18407fSRichard Henderson int next = old_op - s->gen_op_buf; 15745a18407fSRichard Henderson TCGOp *new_op; 15755a18407fSRichard Henderson 15765a18407fSRichard Henderson tcg_debug_assert(oi < OPC_BUF_SIZE); 15775a18407fSRichard Henderson tcg_debug_assert(pi + nargs <= OPPARAM_BUF_SIZE); 15785a18407fSRichard Henderson s->gen_next_op_idx = oi + 1; 15795a18407fSRichard Henderson s->gen_next_parm_idx = pi + nargs; 15805a18407fSRichard Henderson 15815a18407fSRichard Henderson new_op = &s->gen_op_buf[oi]; 15825a18407fSRichard Henderson *new_op = (TCGOp){ 15835a18407fSRichard Henderson .opc = opc, 15845a18407fSRichard Henderson .args = pi, 15855a18407fSRichard Henderson .prev = prev, 15865a18407fSRichard Henderson .next = next 15875a18407fSRichard Henderson }; 15885a18407fSRichard Henderson s->gen_op_buf[prev].next = oi; 15895a18407fSRichard Henderson old_op->prev = oi; 15905a18407fSRichard Henderson 15915a18407fSRichard Henderson return new_op; 15925a18407fSRichard Henderson } 15935a18407fSRichard Henderson 15945a18407fSRichard Henderson TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, 15955a18407fSRichard Henderson TCGOpcode opc, int nargs) 15965a18407fSRichard Henderson { 15975a18407fSRichard Henderson int oi = s->gen_next_op_idx; 15985a18407fSRichard Henderson int pi = s->gen_next_parm_idx; 15995a18407fSRichard Henderson int prev = old_op - s->gen_op_buf; 16005a18407fSRichard Henderson int next = old_op->next; 16015a18407fSRichard Henderson TCGOp *new_op; 16025a18407fSRichard Henderson 16035a18407fSRichard Henderson tcg_debug_assert(oi < OPC_BUF_SIZE); 16045a18407fSRichard Henderson tcg_debug_assert(pi + nargs <= OPPARAM_BUF_SIZE); 16055a18407fSRichard Henderson s->gen_next_op_idx = oi + 1; 16065a18407fSRichard Henderson s->gen_next_parm_idx = pi + nargs; 16075a18407fSRichard Henderson 16085a18407fSRichard Henderson new_op = &s->gen_op_buf[oi]; 16095a18407fSRichard Henderson *new_op = (TCGOp){ 16105a18407fSRichard Henderson .opc = opc, 16115a18407fSRichard Henderson .args = pi, 16125a18407fSRichard Henderson .prev = prev, 16135a18407fSRichard Henderson .next = next 16145a18407fSRichard Henderson }; 16155a18407fSRichard Henderson s->gen_op_buf[next].prev = oi; 16165a18407fSRichard Henderson old_op->next = oi; 16175a18407fSRichard Henderson 16185a18407fSRichard Henderson return new_op; 16195a18407fSRichard Henderson } 16205a18407fSRichard Henderson 1621c70fbf0aSRichard Henderson #define TS_DEAD 1 1622c70fbf0aSRichard Henderson #define TS_MEM 2 1623c70fbf0aSRichard Henderson 16245a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 16255a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 16265a18407fSRichard Henderson 16279c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 16289c43b68dSAurelien Jarno should be in memory. */ 1629c70fbf0aSRichard Henderson static inline void tcg_la_func_end(TCGContext *s, uint8_t *temp_state) 1630c896fe29Sbellard { 1631c70fbf0aSRichard Henderson memset(temp_state, TS_DEAD | TS_MEM, s->nb_globals); 1632c70fbf0aSRichard Henderson memset(temp_state + s->nb_globals, TS_DEAD, s->nb_temps - s->nb_globals); 1633c896fe29Sbellard } 1634c896fe29Sbellard 16359c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 16369c43b68dSAurelien Jarno and local temps should be in memory. */ 1637c70fbf0aSRichard Henderson static inline void tcg_la_bb_end(TCGContext *s, uint8_t *temp_state) 1638641d5fbeSbellard { 1639c70fbf0aSRichard Henderson int i, n; 1640641d5fbeSbellard 1641c70fbf0aSRichard Henderson tcg_la_func_end(s, temp_state); 1642c70fbf0aSRichard Henderson for (i = s->nb_globals, n = s->nb_temps; i < n; i++) { 1643c70fbf0aSRichard Henderson if (s->temps[i].temp_local) { 1644c70fbf0aSRichard Henderson temp_state[i] |= TS_MEM; 1645c70fbf0aSRichard Henderson } 1646641d5fbeSbellard } 1647641d5fbeSbellard } 1648641d5fbeSbellard 1649a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 1650c896fe29Sbellard given input arguments is dead. Instructions updating dead 1651c896fe29Sbellard temporaries are removed. */ 16525a18407fSRichard Henderson static void liveness_pass_1(TCGContext *s, uint8_t *temp_state) 1653c896fe29Sbellard { 1654c70fbf0aSRichard Henderson int nb_globals = s->nb_globals; 16555a18407fSRichard Henderson int oi, oi_prev; 1656c896fe29Sbellard 1657c70fbf0aSRichard Henderson tcg_la_func_end(s, temp_state); 1658c896fe29Sbellard 1659dcb8e758SRichard Henderson for (oi = s->gen_op_buf[0].prev; oi != 0; oi = oi_prev) { 1660c45cb8bbSRichard Henderson int i, nb_iargs, nb_oargs; 1661c45cb8bbSRichard Henderson TCGOpcode opc_new, opc_new2; 1662c45cb8bbSRichard Henderson bool have_opc_new2; 1663a1b3c48dSRichard Henderson TCGLifeData arg_life = 0; 1664c45cb8bbSRichard Henderson TCGArg arg; 1665c45cb8bbSRichard Henderson 1666c45cb8bbSRichard Henderson TCGOp * const op = &s->gen_op_buf[oi]; 1667c45cb8bbSRichard Henderson TCGArg * const args = &s->gen_opparam_buf[op->args]; 1668c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 1669c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 1670c45cb8bbSRichard Henderson 1671c45cb8bbSRichard Henderson oi_prev = op->prev; 1672c45cb8bbSRichard Henderson 1673c45cb8bbSRichard Henderson switch (opc) { 1674c896fe29Sbellard case INDEX_op_call: 1675c6e113f5Sbellard { 1676c6e113f5Sbellard int call_flags; 1677c6e113f5Sbellard 1678c45cb8bbSRichard Henderson nb_oargs = op->callo; 1679c45cb8bbSRichard Henderson nb_iargs = op->calli; 1680cf066674SRichard Henderson call_flags = args[nb_oargs + nb_iargs + 1]; 1681c6e113f5Sbellard 1682c45cb8bbSRichard Henderson /* pure functions can be removed if their result is unused */ 168378505279SAurelien Jarno if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) { 1684c6e113f5Sbellard for (i = 0; i < nb_oargs; i++) { 1685c6e113f5Sbellard arg = args[i]; 1686c70fbf0aSRichard Henderson if (temp_state[arg] != TS_DEAD) { 1687c6e113f5Sbellard goto do_not_remove_call; 1688c6e113f5Sbellard } 16899c43b68dSAurelien Jarno } 1690c45cb8bbSRichard Henderson goto do_remove; 1691c6e113f5Sbellard } else { 1692c6e113f5Sbellard do_not_remove_call: 1693c896fe29Sbellard 1694c896fe29Sbellard /* output args are dead */ 1695c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1696c896fe29Sbellard arg = args[i]; 1697c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1698a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 16996b64b624SAurelien Jarno } 1700c70fbf0aSRichard Henderson if (temp_state[arg] & TS_MEM) { 1701a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 17029c43b68dSAurelien Jarno } 1703c70fbf0aSRichard Henderson temp_state[arg] = TS_DEAD; 1704c896fe29Sbellard } 1705c896fe29Sbellard 170678505279SAurelien Jarno if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS | 170778505279SAurelien Jarno TCG_CALL_NO_READ_GLOBALS))) { 17089c43b68dSAurelien Jarno /* globals should go back to memory */ 1709c70fbf0aSRichard Henderson memset(temp_state, TS_DEAD | TS_MEM, nb_globals); 1710c70fbf0aSRichard Henderson } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) { 1711c70fbf0aSRichard Henderson /* globals should be synced to memory */ 1712c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 1713c70fbf0aSRichard Henderson temp_state[i] |= TS_MEM; 1714c70fbf0aSRichard Henderson } 1715b9c18f56Saurel32 } 1716c896fe29Sbellard 1717c19f47bfSAurelien Jarno /* record arguments that die in this helper */ 1718866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 1719866cb6cbSAurelien Jarno arg = args[i]; 172039cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 1721c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1722a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 1723c896fe29Sbellard } 1724c896fe29Sbellard } 172539cf05d3Sbellard } 172667cc32ebSVeres Lajos /* input arguments are live for preceding opcodes */ 1727c70fbf0aSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 1728c19f47bfSAurelien Jarno arg = args[i]; 1729c70fbf0aSRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 1730c70fbf0aSRichard Henderson temp_state[arg] &= ~TS_DEAD; 1731c70fbf0aSRichard Henderson } 1732c19f47bfSAurelien Jarno } 1733c6e113f5Sbellard } 1734c6e113f5Sbellard } 1735c896fe29Sbellard break; 1736765b842aSRichard Henderson case INDEX_op_insn_start: 1737c896fe29Sbellard break; 17385ff9d6a4Sbellard case INDEX_op_discard: 17395ff9d6a4Sbellard /* mark the temporary as dead */ 1740c70fbf0aSRichard Henderson temp_state[args[0]] = TS_DEAD; 17415ff9d6a4Sbellard break; 17421305c451SRichard Henderson 17431305c451SRichard Henderson case INDEX_op_add2_i32: 1744c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i32; 1745f1fae40cSRichard Henderson goto do_addsub2; 17461305c451SRichard Henderson case INDEX_op_sub2_i32: 1747c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i32; 1748f1fae40cSRichard Henderson goto do_addsub2; 1749f1fae40cSRichard Henderson case INDEX_op_add2_i64: 1750c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i64; 1751f1fae40cSRichard Henderson goto do_addsub2; 1752f1fae40cSRichard Henderson case INDEX_op_sub2_i64: 1753c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i64; 1754f1fae40cSRichard Henderson do_addsub2: 17551305c451SRichard Henderson nb_iargs = 4; 17561305c451SRichard Henderson nb_oargs = 2; 17571305c451SRichard Henderson /* Test if the high part of the operation is dead, but not 17581305c451SRichard Henderson the low part. The result can be optimized to a simple 17591305c451SRichard Henderson add or sub. This happens often for x86_64 guest when the 17601305c451SRichard Henderson cpu mode is set to 32 bit. */ 1761c70fbf0aSRichard Henderson if (temp_state[args[1]] == TS_DEAD) { 1762c70fbf0aSRichard Henderson if (temp_state[args[0]] == TS_DEAD) { 17631305c451SRichard Henderson goto do_remove; 17641305c451SRichard Henderson } 1765c45cb8bbSRichard Henderson /* Replace the opcode and adjust the args in place, 1766c45cb8bbSRichard Henderson leaving 3 unused args at the end. */ 1767c45cb8bbSRichard Henderson op->opc = opc = opc_new; 17681305c451SRichard Henderson args[1] = args[2]; 17691305c451SRichard Henderson args[2] = args[4]; 17701305c451SRichard Henderson /* Fall through and mark the single-word operation live. */ 17711305c451SRichard Henderson nb_iargs = 2; 17721305c451SRichard Henderson nb_oargs = 1; 17731305c451SRichard Henderson } 17741305c451SRichard Henderson goto do_not_remove; 17751305c451SRichard Henderson 17761414968aSRichard Henderson case INDEX_op_mulu2_i32: 1777c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 1778c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i32; 1779c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i32; 178003271524SRichard Henderson goto do_mul2; 1781f1fae40cSRichard Henderson case INDEX_op_muls2_i32: 1782c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 1783c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i32; 1784c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i32; 1785f1fae40cSRichard Henderson goto do_mul2; 1786f1fae40cSRichard Henderson case INDEX_op_mulu2_i64: 1787c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 1788c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i64; 1789c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i64; 179003271524SRichard Henderson goto do_mul2; 1791f1fae40cSRichard Henderson case INDEX_op_muls2_i64: 1792c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 1793c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i64; 1794c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i64; 179503271524SRichard Henderson goto do_mul2; 1796f1fae40cSRichard Henderson do_mul2: 17971414968aSRichard Henderson nb_iargs = 2; 17981414968aSRichard Henderson nb_oargs = 2; 1799c70fbf0aSRichard Henderson if (temp_state[args[1]] == TS_DEAD) { 1800c70fbf0aSRichard Henderson if (temp_state[args[0]] == TS_DEAD) { 180103271524SRichard Henderson /* Both parts of the operation are dead. */ 18021414968aSRichard Henderson goto do_remove; 18031414968aSRichard Henderson } 180403271524SRichard Henderson /* The high part of the operation is dead; generate the low. */ 1805c45cb8bbSRichard Henderson op->opc = opc = opc_new; 18061414968aSRichard Henderson args[1] = args[2]; 18071414968aSRichard Henderson args[2] = args[3]; 1808c70fbf0aSRichard Henderson } else if (temp_state[args[0]] == TS_DEAD && have_opc_new2) { 180903271524SRichard Henderson /* The low part of the operation is dead; generate the high. */ 1810c45cb8bbSRichard Henderson op->opc = opc = opc_new2; 181103271524SRichard Henderson args[0] = args[1]; 181203271524SRichard Henderson args[1] = args[2]; 181303271524SRichard Henderson args[2] = args[3]; 181403271524SRichard Henderson } else { 181503271524SRichard Henderson goto do_not_remove; 181603271524SRichard Henderson } 181703271524SRichard Henderson /* Mark the single-word operation live. */ 18181414968aSRichard Henderson nb_oargs = 1; 18191414968aSRichard Henderson goto do_not_remove; 18201414968aSRichard Henderson 1821c896fe29Sbellard default: 18221305c451SRichard Henderson /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */ 1823c896fe29Sbellard nb_iargs = def->nb_iargs; 1824c896fe29Sbellard nb_oargs = def->nb_oargs; 1825c896fe29Sbellard 1826c896fe29Sbellard /* Test if the operation can be removed because all 18275ff9d6a4Sbellard its outputs are dead. We assume that nb_oargs == 0 18285ff9d6a4Sbellard implies side effects */ 18295ff9d6a4Sbellard if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) { 1830c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1831c70fbf0aSRichard Henderson if (temp_state[args[i]] != TS_DEAD) { 1832c896fe29Sbellard goto do_not_remove; 1833c896fe29Sbellard } 18349c43b68dSAurelien Jarno } 18351305c451SRichard Henderson do_remove: 18360c627cdcSRichard Henderson tcg_op_remove(s, op); 1837c896fe29Sbellard } else { 1838c896fe29Sbellard do_not_remove: 1839c896fe29Sbellard /* output args are dead */ 1840c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1841c896fe29Sbellard arg = args[i]; 1842c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1843a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 18446b64b624SAurelien Jarno } 1845c70fbf0aSRichard Henderson if (temp_state[arg] & TS_MEM) { 1846a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 18479c43b68dSAurelien Jarno } 1848c70fbf0aSRichard Henderson temp_state[arg] = TS_DEAD; 1849c896fe29Sbellard } 1850c896fe29Sbellard 1851c896fe29Sbellard /* if end of basic block, update */ 1852c896fe29Sbellard if (def->flags & TCG_OPF_BB_END) { 1853c70fbf0aSRichard Henderson tcg_la_bb_end(s, temp_state); 18543d5c5f87SAurelien Jarno } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 18553d5c5f87SAurelien Jarno /* globals should be synced to memory */ 1856c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 1857c70fbf0aSRichard Henderson temp_state[i] |= TS_MEM; 1858c70fbf0aSRichard Henderson } 1859c896fe29Sbellard } 1860c896fe29Sbellard 1861c19f47bfSAurelien Jarno /* record arguments that die in this opcode */ 1862866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 1863866cb6cbSAurelien Jarno arg = args[i]; 1864c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1865a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 1866c896fe29Sbellard } 1867c19f47bfSAurelien Jarno } 186867cc32ebSVeres Lajos /* input arguments are live for preceding opcodes */ 1869c19f47bfSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 1870c70fbf0aSRichard Henderson temp_state[args[i]] &= ~TS_DEAD; 1871c896fe29Sbellard } 1872c896fe29Sbellard } 1873c896fe29Sbellard break; 1874c896fe29Sbellard } 1875bee158cbSRichard Henderson op->life = arg_life; 1876c896fe29Sbellard } 18771ff0a2c5SEvgeny Voevodin } 1878c896fe29Sbellard 18795a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries. */ 18805a18407fSRichard Henderson static bool liveness_pass_2(TCGContext *s, uint8_t *temp_state) 18815a18407fSRichard Henderson { 18825a18407fSRichard Henderson int nb_globals = s->nb_globals; 18835a18407fSRichard Henderson int16_t *dir_temps; 18845a18407fSRichard Henderson int i, oi, oi_next; 18855a18407fSRichard Henderson bool changes = false; 18865a18407fSRichard Henderson 18875a18407fSRichard Henderson dir_temps = tcg_malloc(nb_globals * sizeof(int16_t)); 18885a18407fSRichard Henderson memset(dir_temps, 0, nb_globals * sizeof(int16_t)); 18895a18407fSRichard Henderson 18905a18407fSRichard Henderson /* Create a temporary for each indirect global. */ 18915a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 18925a18407fSRichard Henderson TCGTemp *its = &s->temps[i]; 18935a18407fSRichard Henderson if (its->indirect_reg) { 18945a18407fSRichard Henderson TCGTemp *dts = tcg_temp_alloc(s); 18955a18407fSRichard Henderson dts->type = its->type; 18965a18407fSRichard Henderson dts->base_type = its->base_type; 18975a18407fSRichard Henderson dir_temps[i] = temp_idx(s, dts); 18985a18407fSRichard Henderson } 18995a18407fSRichard Henderson } 19005a18407fSRichard Henderson 19015a18407fSRichard Henderson memset(temp_state, TS_DEAD, nb_globals); 19025a18407fSRichard Henderson 19035a18407fSRichard Henderson for (oi = s->gen_op_buf[0].next; oi != 0; oi = oi_next) { 19045a18407fSRichard Henderson TCGOp *op = &s->gen_op_buf[oi]; 19055a18407fSRichard Henderson TCGArg *args = &s->gen_opparam_buf[op->args]; 19065a18407fSRichard Henderson TCGOpcode opc = op->opc; 19075a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 19085a18407fSRichard Henderson TCGLifeData arg_life = op->life; 19095a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 19105a18407fSRichard Henderson TCGArg arg, dir; 19115a18407fSRichard Henderson 19125a18407fSRichard Henderson oi_next = op->next; 19135a18407fSRichard Henderson 19145a18407fSRichard Henderson if (opc == INDEX_op_call) { 19155a18407fSRichard Henderson nb_oargs = op->callo; 19165a18407fSRichard Henderson nb_iargs = op->calli; 19175a18407fSRichard Henderson call_flags = args[nb_oargs + nb_iargs + 1]; 19185a18407fSRichard Henderson } else { 19195a18407fSRichard Henderson nb_iargs = def->nb_iargs; 19205a18407fSRichard Henderson nb_oargs = def->nb_oargs; 19215a18407fSRichard Henderson 19225a18407fSRichard Henderson /* Set flags similar to how calls require. */ 19235a18407fSRichard Henderson if (def->flags & TCG_OPF_BB_END) { 19245a18407fSRichard Henderson /* Like writing globals: save_globals */ 19255a18407fSRichard Henderson call_flags = 0; 19265a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 19275a18407fSRichard Henderson /* Like reading globals: sync_globals */ 19285a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 19295a18407fSRichard Henderson } else { 19305a18407fSRichard Henderson /* No effect on globals. */ 19315a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 19325a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 19335a18407fSRichard Henderson } 19345a18407fSRichard Henderson } 19355a18407fSRichard Henderson 19365a18407fSRichard Henderson /* Make sure that input arguments are available. */ 19375a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 19385a18407fSRichard Henderson arg = args[i]; 19395a18407fSRichard Henderson /* Note this unsigned test catches TCG_CALL_ARG_DUMMY too. */ 19405a18407fSRichard Henderson if (arg < nb_globals) { 19415a18407fSRichard Henderson dir = dir_temps[arg]; 19425a18407fSRichard Henderson if (dir != 0 && temp_state[arg] == TS_DEAD) { 19435a18407fSRichard Henderson TCGTemp *its = &s->temps[arg]; 19445a18407fSRichard Henderson TCGOpcode lopc = (its->type == TCG_TYPE_I32 19455a18407fSRichard Henderson ? INDEX_op_ld_i32 19465a18407fSRichard Henderson : INDEX_op_ld_i64); 19475a18407fSRichard Henderson TCGOp *lop = tcg_op_insert_before(s, op, lopc, 3); 19485a18407fSRichard Henderson TCGArg *largs = &s->gen_opparam_buf[lop->args]; 19495a18407fSRichard Henderson 19505a18407fSRichard Henderson largs[0] = dir; 19515a18407fSRichard Henderson largs[1] = temp_idx(s, its->mem_base); 19525a18407fSRichard Henderson largs[2] = its->mem_offset; 19535a18407fSRichard Henderson 19545a18407fSRichard Henderson /* Loaded, but synced with memory. */ 19555a18407fSRichard Henderson temp_state[arg] = TS_MEM; 19565a18407fSRichard Henderson } 19575a18407fSRichard Henderson } 19585a18407fSRichard Henderson } 19595a18407fSRichard Henderson 19605a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 19615a18407fSRichard Henderson No action is required except keeping temp_state up to date 19625a18407fSRichard Henderson so that we reload when needed. */ 19635a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 19645a18407fSRichard Henderson arg = args[i]; 19655a18407fSRichard Henderson if (arg < nb_globals) { 19665a18407fSRichard Henderson dir = dir_temps[arg]; 19675a18407fSRichard Henderson if (dir != 0) { 19685a18407fSRichard Henderson args[i] = dir; 19695a18407fSRichard Henderson changes = true; 19705a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 19715a18407fSRichard Henderson temp_state[arg] = TS_DEAD; 19725a18407fSRichard Henderson } 19735a18407fSRichard Henderson } 19745a18407fSRichard Henderson } 19755a18407fSRichard Henderson } 19765a18407fSRichard Henderson 19775a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 19785a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 19795a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 19805a18407fSRichard Henderson /* Nothing to do */ 19815a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 19825a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 19835a18407fSRichard Henderson /* Liveness should see that globals are synced back, 19845a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. */ 19855a18407fSRichard Henderson tcg_debug_assert(dir_temps[i] == 0 19865a18407fSRichard Henderson || temp_state[i] != 0); 19875a18407fSRichard Henderson } 19885a18407fSRichard Henderson } else { 19895a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 19905a18407fSRichard Henderson /* Liveness should see that globals are saved back, 19915a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. */ 19925a18407fSRichard Henderson tcg_debug_assert(dir_temps[i] == 0 19935a18407fSRichard Henderson || temp_state[i] == TS_DEAD); 19945a18407fSRichard Henderson } 19955a18407fSRichard Henderson } 19965a18407fSRichard Henderson 19975a18407fSRichard Henderson /* Outputs become available. */ 19985a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 19995a18407fSRichard Henderson arg = args[i]; 20005a18407fSRichard Henderson if (arg >= nb_globals) { 20015a18407fSRichard Henderson continue; 20025a18407fSRichard Henderson } 20035a18407fSRichard Henderson dir = dir_temps[arg]; 20045a18407fSRichard Henderson if (dir == 0) { 20055a18407fSRichard Henderson continue; 20065a18407fSRichard Henderson } 20075a18407fSRichard Henderson args[i] = dir; 20085a18407fSRichard Henderson changes = true; 20095a18407fSRichard Henderson 20105a18407fSRichard Henderson /* The output is now live and modified. */ 20115a18407fSRichard Henderson temp_state[arg] = 0; 20125a18407fSRichard Henderson 20135a18407fSRichard Henderson /* Sync outputs upon their last write. */ 20145a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 20155a18407fSRichard Henderson TCGTemp *its = &s->temps[arg]; 20165a18407fSRichard Henderson TCGOpcode sopc = (its->type == TCG_TYPE_I32 20175a18407fSRichard Henderson ? INDEX_op_st_i32 20185a18407fSRichard Henderson : INDEX_op_st_i64); 20195a18407fSRichard Henderson TCGOp *sop = tcg_op_insert_after(s, op, sopc, 3); 20205a18407fSRichard Henderson TCGArg *sargs = &s->gen_opparam_buf[sop->args]; 20215a18407fSRichard Henderson 20225a18407fSRichard Henderson sargs[0] = dir; 20235a18407fSRichard Henderson sargs[1] = temp_idx(s, its->mem_base); 20245a18407fSRichard Henderson sargs[2] = its->mem_offset; 20255a18407fSRichard Henderson 20265a18407fSRichard Henderson temp_state[arg] = TS_MEM; 20275a18407fSRichard Henderson } 20285a18407fSRichard Henderson /* Drop outputs that are dead. */ 20295a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 20305a18407fSRichard Henderson temp_state[arg] = TS_DEAD; 20315a18407fSRichard Henderson } 20325a18407fSRichard Henderson } 20335a18407fSRichard Henderson } 20345a18407fSRichard Henderson 20355a18407fSRichard Henderson return changes; 20365a18407fSRichard Henderson } 20375a18407fSRichard Henderson 20388d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2039c896fe29Sbellard static void dump_regs(TCGContext *s) 2040c896fe29Sbellard { 2041c896fe29Sbellard TCGTemp *ts; 2042c896fe29Sbellard int i; 2043c896fe29Sbellard char buf[64]; 2044c896fe29Sbellard 2045c896fe29Sbellard for(i = 0; i < s->nb_temps; i++) { 2046c896fe29Sbellard ts = &s->temps[i]; 2047ac56dd48Spbrook printf(" %10s: ", tcg_get_arg_str_idx(s, buf, sizeof(buf), i)); 2048c896fe29Sbellard switch(ts->val_type) { 2049c896fe29Sbellard case TEMP_VAL_REG: 2050c896fe29Sbellard printf("%s", tcg_target_reg_names[ts->reg]); 2051c896fe29Sbellard break; 2052c896fe29Sbellard case TEMP_VAL_MEM: 2053b3a62939SRichard Henderson printf("%d(%s)", (int)ts->mem_offset, 2054b3a62939SRichard Henderson tcg_target_reg_names[ts->mem_base->reg]); 2055c896fe29Sbellard break; 2056c896fe29Sbellard case TEMP_VAL_CONST: 2057c896fe29Sbellard printf("$0x%" TCG_PRIlx, ts->val); 2058c896fe29Sbellard break; 2059c896fe29Sbellard case TEMP_VAL_DEAD: 2060c896fe29Sbellard printf("D"); 2061c896fe29Sbellard break; 2062c896fe29Sbellard default: 2063c896fe29Sbellard printf("???"); 2064c896fe29Sbellard break; 2065c896fe29Sbellard } 2066c896fe29Sbellard printf("\n"); 2067c896fe29Sbellard } 2068c896fe29Sbellard 2069c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2070f8b2f202SRichard Henderson if (s->reg_to_temp[i] != NULL) { 2071c896fe29Sbellard printf("%s: %s\n", 2072c896fe29Sbellard tcg_target_reg_names[i], 2073f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i])); 2074c896fe29Sbellard } 2075c896fe29Sbellard } 2076c896fe29Sbellard } 2077c896fe29Sbellard 2078c896fe29Sbellard static void check_regs(TCGContext *s) 2079c896fe29Sbellard { 2080869938aeSRichard Henderson int reg; 2081b6638662SRichard Henderson int k; 2082c896fe29Sbellard TCGTemp *ts; 2083c896fe29Sbellard char buf[64]; 2084c896fe29Sbellard 2085c896fe29Sbellard for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) { 2086f8b2f202SRichard Henderson ts = s->reg_to_temp[reg]; 2087f8b2f202SRichard Henderson if (ts != NULL) { 2088f8b2f202SRichard Henderson if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) { 2089c896fe29Sbellard printf("Inconsistency for register %s:\n", 2090c896fe29Sbellard tcg_target_reg_names[reg]); 2091b03cce8eSbellard goto fail; 2092c896fe29Sbellard } 2093c896fe29Sbellard } 2094c896fe29Sbellard } 2095c896fe29Sbellard for (k = 0; k < s->nb_temps; k++) { 2096c896fe29Sbellard ts = &s->temps[k]; 2097f8b2f202SRichard Henderson if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg 2098f8b2f202SRichard Henderson && s->reg_to_temp[ts->reg] != ts) { 2099c896fe29Sbellard printf("Inconsistency for temp %s:\n", 2100f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2101b03cce8eSbellard fail: 2102c896fe29Sbellard printf("reg state:\n"); 2103c896fe29Sbellard dump_regs(s); 2104c896fe29Sbellard tcg_abort(); 2105c896fe29Sbellard } 2106c896fe29Sbellard } 2107c896fe29Sbellard } 2108c896fe29Sbellard #endif 2109c896fe29Sbellard 2110c896fe29Sbellard static void temp_allocate_frame(TCGContext *s, int temp) 2111c896fe29Sbellard { 2112c896fe29Sbellard TCGTemp *ts; 2113c896fe29Sbellard ts = &s->temps[temp]; 21149b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64) 21159b9c37c3SRichard Henderson /* Sparc64 stack is accessed with offset of 2047 */ 2116b591dc59SBlue Swirl s->current_frame_offset = (s->current_frame_offset + 2117b591dc59SBlue Swirl (tcg_target_long)sizeof(tcg_target_long) - 1) & 2118b591dc59SBlue Swirl ~(sizeof(tcg_target_long) - 1); 2119f44c9960SBlue Swirl #endif 2120b591dc59SBlue Swirl if (s->current_frame_offset + (tcg_target_long)sizeof(tcg_target_long) > 2121b591dc59SBlue Swirl s->frame_end) { 21225ff9d6a4Sbellard tcg_abort(); 2123b591dc59SBlue Swirl } 2124c896fe29Sbellard ts->mem_offset = s->current_frame_offset; 2125b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 2126c896fe29Sbellard ts->mem_allocated = 1; 2127e2c6d1b4SRichard Henderson s->current_frame_offset += sizeof(tcg_target_long); 2128c896fe29Sbellard } 2129c896fe29Sbellard 2130b3915dbbSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet); 2131b3915dbbSRichard Henderson 213259d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 213359d7c14eSRichard Henderson mark it free; otherwise mark it dead. */ 213459d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 2135c896fe29Sbellard { 213659d7c14eSRichard Henderson if (ts->fixed_reg) { 213759d7c14eSRichard Henderson return; 213859d7c14eSRichard Henderson } 213959d7c14eSRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 214059d7c14eSRichard Henderson s->reg_to_temp[ts->reg] = NULL; 214159d7c14eSRichard Henderson } 214259d7c14eSRichard Henderson ts->val_type = (free_or_dead < 0 214359d7c14eSRichard Henderson || ts->temp_local 214459d7c14eSRichard Henderson || temp_idx(s, ts) < s->nb_globals 214559d7c14eSRichard Henderson ? TEMP_VAL_MEM : TEMP_VAL_DEAD); 214659d7c14eSRichard Henderson } 2147c896fe29Sbellard 214859d7c14eSRichard Henderson /* Mark a temporary as dead. */ 214959d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 215059d7c14eSRichard Henderson { 215159d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 215259d7c14eSRichard Henderson } 215359d7c14eSRichard Henderson 215459d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 215559d7c14eSRichard Henderson registers needs to be allocated to store a constant. If 'free_or_dead' 215659d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 215759d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. */ 215859d7c14eSRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, 215959d7c14eSRichard Henderson TCGRegSet allocated_regs, int free_or_dead) 216059d7c14eSRichard Henderson { 216159d7c14eSRichard Henderson if (ts->fixed_reg) { 216259d7c14eSRichard Henderson return; 216359d7c14eSRichard Henderson } 216459d7c14eSRichard Henderson if (!ts->mem_coherent) { 21657f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 2166f8b2f202SRichard Henderson temp_allocate_frame(s, temp_idx(s, ts)); 216759d7c14eSRichard Henderson } 216859d7c14eSRichard Henderson switch (ts->val_type) { 216959d7c14eSRichard Henderson case TEMP_VAL_CONST: 217059d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 217159d7c14eSRichard Henderson require it later in a register, so attempt to store the 217259d7c14eSRichard Henderson constant to memory directly. */ 217359d7c14eSRichard Henderson if (free_or_dead 217459d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 217559d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 217659d7c14eSRichard Henderson break; 217759d7c14eSRichard Henderson } 217859d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 217959d7c14eSRichard Henderson allocated_regs); 218059d7c14eSRichard Henderson /* fallthrough */ 218159d7c14eSRichard Henderson 218259d7c14eSRichard Henderson case TEMP_VAL_REG: 218359d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 218459d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 218559d7c14eSRichard Henderson break; 218659d7c14eSRichard Henderson 218759d7c14eSRichard Henderson case TEMP_VAL_MEM: 218859d7c14eSRichard Henderson break; 218959d7c14eSRichard Henderson 219059d7c14eSRichard Henderson case TEMP_VAL_DEAD: 219159d7c14eSRichard Henderson default: 219259d7c14eSRichard Henderson tcg_abort(); 2193c896fe29Sbellard } 21947f6ceedfSAurelien Jarno ts->mem_coherent = 1; 21957f6ceedfSAurelien Jarno } 219659d7c14eSRichard Henderson if (free_or_dead) { 219759d7c14eSRichard Henderson temp_free_or_dead(s, ts, free_or_dead); 219859d7c14eSRichard Henderson } 219959d7c14eSRichard Henderson } 22007f6ceedfSAurelien Jarno 22017f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 2202b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 22037f6ceedfSAurelien Jarno { 2204f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 2205f8b2f202SRichard Henderson if (ts != NULL) { 220659d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, -1); 2207c896fe29Sbellard } 2208c896fe29Sbellard } 2209c896fe29Sbellard 2210c896fe29Sbellard /* Allocate a register belonging to reg1 & ~reg2 */ 2211b3915dbbSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet desired_regs, 221291478cefSRichard Henderson TCGRegSet allocated_regs, bool rev) 2213c896fe29Sbellard { 221491478cefSRichard Henderson int i, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 221591478cefSRichard Henderson const int *order; 2216b6638662SRichard Henderson TCGReg reg; 2217c896fe29Sbellard TCGRegSet reg_ct; 2218c896fe29Sbellard 2219b3915dbbSRichard Henderson tcg_regset_andnot(reg_ct, desired_regs, allocated_regs); 222091478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 2221c896fe29Sbellard 2222c896fe29Sbellard /* first try free registers */ 222391478cefSRichard Henderson for(i = 0; i < n; i++) { 222491478cefSRichard Henderson reg = order[i]; 2225f8b2f202SRichard Henderson if (tcg_regset_test_reg(reg_ct, reg) && s->reg_to_temp[reg] == NULL) 2226c896fe29Sbellard return reg; 2227c896fe29Sbellard } 2228c896fe29Sbellard 2229c896fe29Sbellard /* XXX: do better spill choice */ 223091478cefSRichard Henderson for(i = 0; i < n; i++) { 223191478cefSRichard Henderson reg = order[i]; 2232c896fe29Sbellard if (tcg_regset_test_reg(reg_ct, reg)) { 2233b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 2234c896fe29Sbellard return reg; 2235c896fe29Sbellard } 2236c896fe29Sbellard } 2237c896fe29Sbellard 2238c896fe29Sbellard tcg_abort(); 2239c896fe29Sbellard } 2240c896fe29Sbellard 224140ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 224240ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. */ 224340ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 224440ae5c62SRichard Henderson TCGRegSet allocated_regs) 224540ae5c62SRichard Henderson { 224640ae5c62SRichard Henderson TCGReg reg; 224740ae5c62SRichard Henderson 224840ae5c62SRichard Henderson switch (ts->val_type) { 224940ae5c62SRichard Henderson case TEMP_VAL_REG: 225040ae5c62SRichard Henderson return; 225140ae5c62SRichard Henderson case TEMP_VAL_CONST: 225291478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 225340ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 225440ae5c62SRichard Henderson ts->mem_coherent = 0; 225540ae5c62SRichard Henderson break; 225640ae5c62SRichard Henderson case TEMP_VAL_MEM: 225791478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 225840ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 225940ae5c62SRichard Henderson ts->mem_coherent = 1; 226040ae5c62SRichard Henderson break; 226140ae5c62SRichard Henderson case TEMP_VAL_DEAD: 226240ae5c62SRichard Henderson default: 226340ae5c62SRichard Henderson tcg_abort(); 226440ae5c62SRichard Henderson } 226540ae5c62SRichard Henderson ts->reg = reg; 226640ae5c62SRichard Henderson ts->val_type = TEMP_VAL_REG; 226740ae5c62SRichard Henderson s->reg_to_temp[reg] = ts; 226840ae5c62SRichard Henderson } 226940ae5c62SRichard Henderson 227059d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 2271e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 227259d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 22731ad80729SAurelien Jarno { 22742c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 2275eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. */ 2276f8bf00f1SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg); 22771ad80729SAurelien Jarno } 22781ad80729SAurelien Jarno 22799814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 2280641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 2281641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 2282641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 2283641d5fbeSbellard { 2284641d5fbeSbellard int i; 2285641d5fbeSbellard 2286641d5fbeSbellard for (i = 0; i < s->nb_globals; i++) { 2287b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 2288641d5fbeSbellard } 2289e5097dc8Sbellard } 2290e5097dc8Sbellard 22913d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 22923d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 22933d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 22943d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 22953d5c5f87SAurelien Jarno { 22963d5c5f87SAurelien Jarno int i; 22973d5c5f87SAurelien Jarno 22983d5c5f87SAurelien Jarno for (i = 0; i < s->nb_globals; i++) { 229912b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 230012b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 230112b9b11aSRichard Henderson || ts->fixed_reg 230212b9b11aSRichard Henderson || ts->mem_coherent); 23033d5c5f87SAurelien Jarno } 23043d5c5f87SAurelien Jarno } 23053d5c5f87SAurelien Jarno 2306e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 2307e8996ee0Sbellard all globals are stored at their canonical location. */ 2308e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 2309e5097dc8Sbellard { 2310e5097dc8Sbellard int i; 2311e5097dc8Sbellard 2312c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 2313b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 2314641d5fbeSbellard if (ts->temp_local) { 2315b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 2316641d5fbeSbellard } else { 23172c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 2318eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 2319eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 2320c896fe29Sbellard } 2321641d5fbeSbellard } 2322e8996ee0Sbellard 2323e8996ee0Sbellard save_globals(s, allocated_regs); 2324c896fe29Sbellard } 2325c896fe29Sbellard 23260fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 23270fe4fca4SPaolo Bonzini tcg_target_ulong val, TCGLifeData arg_life) 2328e8996ee0Sbellard { 2329e8996ee0Sbellard if (ots->fixed_reg) { 233059d7c14eSRichard Henderson /* For fixed registers, we do not do any constant propagation. */ 2331e8996ee0Sbellard tcg_out_movi(s, ots->type, ots->reg, val); 233259d7c14eSRichard Henderson return; 233359d7c14eSRichard Henderson } 233459d7c14eSRichard Henderson 233559d7c14eSRichard Henderson /* The movi is not explicitly generated here. */ 2336f8b2f202SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 2337f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 2338f8b2f202SRichard Henderson } 2339e8996ee0Sbellard ots->val_type = TEMP_VAL_CONST; 2340e8996ee0Sbellard ots->val = val; 234159d7c14eSRichard Henderson ots->mem_coherent = 0; 2342ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 234359d7c14eSRichard Henderson temp_sync(s, ots, s->reserved_regs, IS_DEAD_ARG(0)); 234459d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 2345f8bf00f1SRichard Henderson temp_dead(s, ots); 23464c4e1ab2SAurelien Jarno } 2347e8996ee0Sbellard } 2348e8996ee0Sbellard 23490fe4fca4SPaolo Bonzini static void tcg_reg_alloc_movi(TCGContext *s, const TCGArg *args, 23500fe4fca4SPaolo Bonzini TCGLifeData arg_life) 23510fe4fca4SPaolo Bonzini { 23520fe4fca4SPaolo Bonzini TCGTemp *ots = &s->temps[args[0]]; 23530fe4fca4SPaolo Bonzini tcg_target_ulong val = args[1]; 23540fe4fca4SPaolo Bonzini 23550fe4fca4SPaolo Bonzini tcg_reg_alloc_do_movi(s, ots, val, arg_life); 23560fe4fca4SPaolo Bonzini } 23570fe4fca4SPaolo Bonzini 2358c896fe29Sbellard static void tcg_reg_alloc_mov(TCGContext *s, const TCGOpDef *def, 2359a1b3c48dSRichard Henderson const TCGArg *args, TCGLifeData arg_life) 2360c896fe29Sbellard { 2361c29c1d7eSAurelien Jarno TCGRegSet allocated_regs; 2362c896fe29Sbellard TCGTemp *ts, *ots; 2363450445d5SRichard Henderson TCGType otype, itype; 2364c896fe29Sbellard 2365c29c1d7eSAurelien Jarno tcg_regset_set(allocated_regs, s->reserved_regs); 2366c896fe29Sbellard ots = &s->temps[args[0]]; 2367c896fe29Sbellard ts = &s->temps[args[1]]; 2368450445d5SRichard Henderson 2369450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. */ 2370450445d5SRichard Henderson otype = ots->type; 2371450445d5SRichard Henderson itype = ts->type; 2372c896fe29Sbellard 23730fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 23740fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 23750fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 23760fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 23770fe4fca4SPaolo Bonzini temp_dead(s, ts); 23780fe4fca4SPaolo Bonzini } 23790fe4fca4SPaolo Bonzini tcg_reg_alloc_do_movi(s, ots, val, arg_life); 23800fe4fca4SPaolo Bonzini return; 23810fe4fca4SPaolo Bonzini } 23820fe4fca4SPaolo Bonzini 23830fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 23840fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 23850fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 23860fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 23870fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 238840ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], allocated_regs); 2389c29c1d7eSAurelien Jarno } 2390c29c1d7eSAurelien Jarno 23910fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 2392c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(0) && !ots->fixed_reg) { 2393c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 2394c29c1d7eSAurelien Jarno liveness analysis disabled). */ 2395eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 2396c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 2397c29c1d7eSAurelien Jarno temp_allocate_frame(s, args[0]); 2398c29c1d7eSAurelien Jarno } 2399b3a62939SRichard Henderson tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset); 2400c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 2401f8bf00f1SRichard Henderson temp_dead(s, ts); 2402c29c1d7eSAurelien Jarno } 2403f8bf00f1SRichard Henderson temp_dead(s, ots); 2404e8996ee0Sbellard } else { 2405c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) { 2406c29c1d7eSAurelien Jarno /* the mov can be suppressed */ 2407c29c1d7eSAurelien Jarno if (ots->val_type == TEMP_VAL_REG) { 2408f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 2409c896fe29Sbellard } 2410c29c1d7eSAurelien Jarno ots->reg = ts->reg; 2411f8bf00f1SRichard Henderson temp_dead(s, ts); 2412c29c1d7eSAurelien Jarno } else { 2413c29c1d7eSAurelien Jarno if (ots->val_type != TEMP_VAL_REG) { 2414c29c1d7eSAurelien Jarno /* When allocating a new register, make sure to not spill the 2415c29c1d7eSAurelien Jarno input one. */ 2416c29c1d7eSAurelien Jarno tcg_regset_set_reg(allocated_regs, ts->reg); 2417450445d5SRichard Henderson ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 241891478cefSRichard Henderson allocated_regs, ots->indirect_base); 2419c29c1d7eSAurelien Jarno } 2420450445d5SRichard Henderson tcg_out_mov(s, otype, ots->reg, ts->reg); 2421c29c1d7eSAurelien Jarno } 2422c896fe29Sbellard ots->val_type = TEMP_VAL_REG; 2423c896fe29Sbellard ots->mem_coherent = 0; 2424f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = ots; 2425ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 242659d7c14eSRichard Henderson temp_sync(s, ots, allocated_regs, 0); 2427c29c1d7eSAurelien Jarno } 2428ec7a869dSAurelien Jarno } 2429c896fe29Sbellard } 2430c896fe29Sbellard 2431c896fe29Sbellard static void tcg_reg_alloc_op(TCGContext *s, 2432a9751609SRichard Henderson const TCGOpDef *def, TCGOpcode opc, 2433a1b3c48dSRichard Henderson const TCGArg *args, TCGLifeData arg_life) 2434c896fe29Sbellard { 243582790a87SRichard Henderson TCGRegSet i_allocated_regs; 243682790a87SRichard Henderson TCGRegSet o_allocated_regs; 2437b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 2438b6638662SRichard Henderson TCGReg reg; 2439c896fe29Sbellard TCGArg arg; 2440c896fe29Sbellard const TCGArgConstraint *arg_ct; 2441c896fe29Sbellard TCGTemp *ts; 2442c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 2443c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 2444c896fe29Sbellard 2445c896fe29Sbellard nb_oargs = def->nb_oargs; 2446c896fe29Sbellard nb_iargs = def->nb_iargs; 2447c896fe29Sbellard 2448c896fe29Sbellard /* copy constants */ 2449c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 2450c896fe29Sbellard args + nb_oargs + nb_iargs, 2451c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 2452c896fe29Sbellard 245382790a87SRichard Henderson tcg_regset_set(i_allocated_regs, s->reserved_regs); 245482790a87SRichard Henderson tcg_regset_set(o_allocated_regs, s->reserved_regs); 245582790a87SRichard Henderson 2456c896fe29Sbellard /* satisfy input constraints */ 2457c896fe29Sbellard for(k = 0; k < nb_iargs; k++) { 2458c896fe29Sbellard i = def->sorted_args[nb_oargs + k]; 2459c896fe29Sbellard arg = args[i]; 2460c896fe29Sbellard arg_ct = &def->args_ct[i]; 2461c896fe29Sbellard ts = &s->temps[arg]; 246240ae5c62SRichard Henderson 246340ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 246440ae5c62SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct)) { 2465c896fe29Sbellard /* constant is OK for instruction */ 2466c896fe29Sbellard const_args[i] = 1; 2467c896fe29Sbellard new_args[i] = ts->val; 2468c896fe29Sbellard goto iarg_end; 2469c896fe29Sbellard } 247040ae5c62SRichard Henderson 247182790a87SRichard Henderson temp_load(s, ts, arg_ct->u.regs, i_allocated_regs); 247240ae5c62SRichard Henderson 24735ff9d6a4Sbellard if (arg_ct->ct & TCG_CT_IALIAS) { 24745ff9d6a4Sbellard if (ts->fixed_reg) { 24755ff9d6a4Sbellard /* if fixed register, we must allocate a new register 24765ff9d6a4Sbellard if the alias is not the same register */ 24775ff9d6a4Sbellard if (arg != args[arg_ct->alias_index]) 24785ff9d6a4Sbellard goto allocate_in_reg; 24795ff9d6a4Sbellard } else { 2480c896fe29Sbellard /* if the input is aliased to an output and if it is 2481c896fe29Sbellard not dead after the instruction, we must allocate 2482c896fe29Sbellard a new register and move it */ 2483866cb6cbSAurelien Jarno if (!IS_DEAD_ARG(i)) { 2484c896fe29Sbellard goto allocate_in_reg; 2485c896fe29Sbellard } 24867e1df267SAurelien Jarno /* check if the current register has already been allocated 24877e1df267SAurelien Jarno for another input aliased to an output */ 24887e1df267SAurelien Jarno int k2, i2; 24897e1df267SAurelien Jarno for (k2 = 0 ; k2 < k ; k2++) { 24907e1df267SAurelien Jarno i2 = def->sorted_args[nb_oargs + k2]; 24917e1df267SAurelien Jarno if ((def->args_ct[i2].ct & TCG_CT_IALIAS) && 24927e1df267SAurelien Jarno (new_args[i2] == ts->reg)) { 24937e1df267SAurelien Jarno goto allocate_in_reg; 24947e1df267SAurelien Jarno } 24957e1df267SAurelien Jarno } 24965ff9d6a4Sbellard } 2497866cb6cbSAurelien Jarno } 2498c896fe29Sbellard reg = ts->reg; 2499c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, reg)) { 2500c896fe29Sbellard /* nothing to do : the constraint is satisfied */ 2501c896fe29Sbellard } else { 2502c896fe29Sbellard allocate_in_reg: 2503c896fe29Sbellard /* allocate a new register matching the constraint 2504c896fe29Sbellard and move the temporary register into it */ 250582790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs, 250691478cefSRichard Henderson ts->indirect_base); 25073b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 2508c896fe29Sbellard } 2509c896fe29Sbellard new_args[i] = reg; 2510c896fe29Sbellard const_args[i] = 0; 251182790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 2512c896fe29Sbellard iarg_end: ; 2513c896fe29Sbellard } 2514c896fe29Sbellard 2515c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 2516866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 2517866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 2518f8bf00f1SRichard Henderson temp_dead(s, &s->temps[args[i]]); 2519c896fe29Sbellard } 2520c896fe29Sbellard } 2521c896fe29Sbellard 2522a52ad07eSAurelien Jarno if (def->flags & TCG_OPF_BB_END) { 252382790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 2524a52ad07eSAurelien Jarno } else { 2525c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 2526b03cce8eSbellard /* XXX: permit generic clobber register list ? */ 2527c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 2528c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 252982790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 2530c896fe29Sbellard } 2531c896fe29Sbellard } 25323d5c5f87SAurelien Jarno } 25333d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 25343d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 25353d5c5f87SAurelien Jarno an exception. */ 253682790a87SRichard Henderson sync_globals(s, i_allocated_regs); 2537c896fe29Sbellard } 2538c896fe29Sbellard 2539c896fe29Sbellard /* satisfy the output constraints */ 2540c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 2541c896fe29Sbellard i = def->sorted_args[k]; 2542c896fe29Sbellard arg = args[i]; 2543c896fe29Sbellard arg_ct = &def->args_ct[i]; 2544c896fe29Sbellard ts = &s->temps[arg]; 254517280ff4SRichard Henderson if ((arg_ct->ct & TCG_CT_ALIAS) 254617280ff4SRichard Henderson && !const_args[arg_ct->alias_index]) { 25475ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 254882790a87SRichard Henderson } else if (arg_ct->ct & TCG_CT_NEWREG) { 254982790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, 255082790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 255182790a87SRichard Henderson ts->indirect_base); 2552c896fe29Sbellard } else { 2553c896fe29Sbellard /* if fixed register, we try to use it */ 2554c896fe29Sbellard reg = ts->reg; 2555c896fe29Sbellard if (ts->fixed_reg && 2556c896fe29Sbellard tcg_regset_test_reg(arg_ct->u.regs, reg)) { 2557c896fe29Sbellard goto oarg_end; 2558c896fe29Sbellard } 255982790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs, 256091478cefSRichard Henderson ts->indirect_base); 2561c896fe29Sbellard } 256282790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 2563c896fe29Sbellard /* if a fixed register is used, then a move will be done afterwards */ 2564c896fe29Sbellard if (!ts->fixed_reg) { 2565639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 2566f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 2567639368ddSAurelien Jarno } 2568c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 2569c896fe29Sbellard ts->reg = reg; 2570c896fe29Sbellard /* temp value is modified, so the value kept in memory is 2571c896fe29Sbellard potentially not the same */ 2572c896fe29Sbellard ts->mem_coherent = 0; 2573f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 2574c896fe29Sbellard } 2575c896fe29Sbellard oarg_end: 2576c896fe29Sbellard new_args[i] = reg; 2577c896fe29Sbellard } 2578e8996ee0Sbellard } 2579c896fe29Sbellard 2580c896fe29Sbellard /* emit instruction */ 2581c896fe29Sbellard tcg_out_op(s, opc, new_args, const_args); 2582c896fe29Sbellard 2583c896fe29Sbellard /* move the outputs in the correct register if needed */ 2584c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 2585c896fe29Sbellard ts = &s->temps[args[i]]; 2586c896fe29Sbellard reg = new_args[i]; 2587c896fe29Sbellard if (ts->fixed_reg && ts->reg != reg) { 25883b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 2589c896fe29Sbellard } 2590ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 259182790a87SRichard Henderson temp_sync(s, ts, o_allocated_regs, IS_DEAD_ARG(i)); 259259d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 2593f8bf00f1SRichard Henderson temp_dead(s, ts); 2594ec7a869dSAurelien Jarno } 2595c896fe29Sbellard } 2596c896fe29Sbellard } 2597c896fe29Sbellard 2598b03cce8eSbellard #ifdef TCG_TARGET_STACK_GROWSUP 2599b03cce8eSbellard #define STACK_DIR(x) (-(x)) 2600b03cce8eSbellard #else 2601b03cce8eSbellard #define STACK_DIR(x) (x) 2602b03cce8eSbellard #endif 2603b03cce8eSbellard 2604c45cb8bbSRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, int nb_oargs, int nb_iargs, 2605a1b3c48dSRichard Henderson const TCGArg * const args, TCGLifeData arg_life) 2606c896fe29Sbellard { 2607b6638662SRichard Henderson int flags, nb_regs, i; 2608b6638662SRichard Henderson TCGReg reg; 2609cf066674SRichard Henderson TCGArg arg; 2610c896fe29Sbellard TCGTemp *ts; 2611d3452f1fSRichard Henderson intptr_t stack_offset; 2612d3452f1fSRichard Henderson size_t call_stack_size; 2613cf066674SRichard Henderson tcg_insn_unit *func_addr; 2614cf066674SRichard Henderson int allocate_args; 2615c896fe29Sbellard TCGRegSet allocated_regs; 2616c896fe29Sbellard 2617cf066674SRichard Henderson func_addr = (tcg_insn_unit *)(intptr_t)args[nb_oargs + nb_iargs]; 2618cf066674SRichard Henderson flags = args[nb_oargs + nb_iargs + 1]; 2619c896fe29Sbellard 26206e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 2621c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 2622c45cb8bbSRichard Henderson nb_regs = nb_iargs; 2623cf066674SRichard Henderson } 2624c896fe29Sbellard 2625c896fe29Sbellard /* assign stack slots first */ 2626c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 2627c896fe29Sbellard call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) & 2628c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 2629b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 2630b03cce8eSbellard if (allocate_args) { 2631345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 2632345649c0SBlue Swirl preallocate call stack */ 2633345649c0SBlue Swirl tcg_abort(); 2634b03cce8eSbellard } 263539cf05d3Sbellard 263639cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 2637c45cb8bbSRichard Henderson for(i = nb_regs; i < nb_iargs; i++) { 2638c896fe29Sbellard arg = args[nb_oargs + i]; 263939cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP 264039cf05d3Sbellard stack_offset -= sizeof(tcg_target_long); 264139cf05d3Sbellard #endif 264239cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 2643c896fe29Sbellard ts = &s->temps[arg]; 264440ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 264540ae5c62SRichard Henderson s->reserved_regs); 2646e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 264739cf05d3Sbellard } 264839cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP 264939cf05d3Sbellard stack_offset += sizeof(tcg_target_long); 265039cf05d3Sbellard #endif 2651c896fe29Sbellard } 2652c896fe29Sbellard 2653c896fe29Sbellard /* assign input registers */ 2654c896fe29Sbellard tcg_regset_set(allocated_regs, s->reserved_regs); 2655c896fe29Sbellard for(i = 0; i < nb_regs; i++) { 2656c896fe29Sbellard arg = args[nb_oargs + i]; 265739cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 2658c896fe29Sbellard ts = &s->temps[arg]; 2659c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 2660b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 266140ae5c62SRichard Henderson 2662c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 2663c896fe29Sbellard if (ts->reg != reg) { 26643b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 2665c896fe29Sbellard } 2666c896fe29Sbellard } else { 2667*ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 266840ae5c62SRichard Henderson 266940ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 267040ae5c62SRichard Henderson temp_load(s, ts, arg_set, allocated_regs); 2671c896fe29Sbellard } 267240ae5c62SRichard Henderson 2673c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 2674c896fe29Sbellard } 267539cf05d3Sbellard } 2676c896fe29Sbellard 2677c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 2678866cb6cbSAurelien Jarno for(i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2679866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 2680f8bf00f1SRichard Henderson temp_dead(s, &s->temps[args[i]]); 2681c896fe29Sbellard } 2682c896fe29Sbellard } 2683c896fe29Sbellard 2684c896fe29Sbellard /* clobber call registers */ 2685c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 2686c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 2687b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 2688c896fe29Sbellard } 2689c896fe29Sbellard } 2690c896fe29Sbellard 269178505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 269278505279SAurelien Jarno they might be read. */ 269378505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 269478505279SAurelien Jarno /* Nothing to do */ 269578505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 269678505279SAurelien Jarno sync_globals(s, allocated_regs); 269778505279SAurelien Jarno } else { 2698e8996ee0Sbellard save_globals(s, allocated_regs); 2699b9c18f56Saurel32 } 2700c896fe29Sbellard 2701cf066674SRichard Henderson tcg_out_call(s, func_addr); 2702c896fe29Sbellard 2703c896fe29Sbellard /* assign output registers and emit moves if needed */ 2704c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 2705c896fe29Sbellard arg = args[i]; 2706c896fe29Sbellard ts = &s->temps[arg]; 2707c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 2708eabb7b91SAurelien Jarno tcg_debug_assert(s->reg_to_temp[reg] == NULL); 270934b1a49cSRichard Henderson 2710c896fe29Sbellard if (ts->fixed_reg) { 2711c896fe29Sbellard if (ts->reg != reg) { 27123b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 2713c896fe29Sbellard } 2714c896fe29Sbellard } else { 2715639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 2716f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 2717639368ddSAurelien Jarno } 2718c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 2719c896fe29Sbellard ts->reg = reg; 2720c896fe29Sbellard ts->mem_coherent = 0; 2721f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 2722ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 272359d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i)); 272459d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 2725f8bf00f1SRichard Henderson temp_dead(s, ts); 2726c896fe29Sbellard } 2727c896fe29Sbellard } 27288c11ad25SAurelien Jarno } 2729c896fe29Sbellard } 2730c896fe29Sbellard 2731c896fe29Sbellard #ifdef CONFIG_PROFILER 2732c896fe29Sbellard 273354604f74Saurel32 static int64_t tcg_table_op_count[NB_OPS]; 2734c896fe29Sbellard 2735246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 2736c896fe29Sbellard { 2737c896fe29Sbellard int i; 2738d70724ceSzhanghailiang 273915fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 2740246ae24dSMax Filippov cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, 2741246ae24dSMax Filippov tcg_table_op_count[i]); 2742c896fe29Sbellard } 2743c896fe29Sbellard } 2744246ae24dSMax Filippov #else 2745246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 2746246ae24dSMax Filippov { 2747246ae24dSMax Filippov cpu_fprintf(f, "[TCG profiler not compiled]\n"); 2748246ae24dSMax Filippov } 2749c896fe29Sbellard #endif 2750c896fe29Sbellard 2751c896fe29Sbellard 27525bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb) 2753c896fe29Sbellard { 2754fca8a500SRichard Henderson int i, oi, oi_next, num_insns; 2755c896fe29Sbellard 275604fe6400SRichard Henderson #ifdef CONFIG_PROFILER 275704fe6400SRichard Henderson { 275804fe6400SRichard Henderson int n; 275904fe6400SRichard Henderson 2760dcb8e758SRichard Henderson n = s->gen_op_buf[0].prev + 1; 276104fe6400SRichard Henderson s->op_count += n; 276204fe6400SRichard Henderson if (n > s->op_count_max) { 276304fe6400SRichard Henderson s->op_count_max = n; 276404fe6400SRichard Henderson } 276504fe6400SRichard Henderson 276604fe6400SRichard Henderson n = s->nb_temps; 276704fe6400SRichard Henderson s->temp_count += n; 276804fe6400SRichard Henderson if (n > s->temp_count_max) { 276904fe6400SRichard Henderson s->temp_count_max = n; 277004fe6400SRichard Henderson } 277104fe6400SRichard Henderson } 277204fe6400SRichard Henderson #endif 277304fe6400SRichard Henderson 2774c896fe29Sbellard #ifdef DEBUG_DISAS 2775d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 2776d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 27771ee73216SRichard Henderson qemu_log_lock(); 277893fcfe39Saliguori qemu_log("OP:\n"); 2779eeacee4dSBlue Swirl tcg_dump_ops(s); 278093fcfe39Saliguori qemu_log("\n"); 27811ee73216SRichard Henderson qemu_log_unlock(); 2782c896fe29Sbellard } 2783c896fe29Sbellard #endif 2784c896fe29Sbellard 2785c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 2786c5cc28ffSAurelien Jarno s->opt_time -= profile_getclock(); 2787c5cc28ffSAurelien Jarno #endif 2788c5cc28ffSAurelien Jarno 27898f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 2790c45cb8bbSRichard Henderson tcg_optimize(s); 27918f2e8c07SKirill Batuzov #endif 27928f2e8c07SKirill Batuzov 2793a23a9ec6Sbellard #ifdef CONFIG_PROFILER 2794c5cc28ffSAurelien Jarno s->opt_time += profile_getclock(); 2795a23a9ec6Sbellard s->la_time -= profile_getclock(); 2796a23a9ec6Sbellard #endif 2797c5cc28ffSAurelien Jarno 27985a18407fSRichard Henderson { 27995a18407fSRichard Henderson uint8_t *temp_state = tcg_malloc(s->nb_temps + s->nb_indirects); 28005a18407fSRichard Henderson 28015a18407fSRichard Henderson liveness_pass_1(s, temp_state); 28025a18407fSRichard Henderson 28035a18407fSRichard Henderson if (s->nb_indirects > 0) { 28045a18407fSRichard Henderson #ifdef DEBUG_DISAS 28055a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 28065a18407fSRichard Henderson && qemu_log_in_addr_range(tb->pc))) { 28071ee73216SRichard Henderson qemu_log_lock(); 28085a18407fSRichard Henderson qemu_log("OP before indirect lowering:\n"); 28095a18407fSRichard Henderson tcg_dump_ops(s); 28105a18407fSRichard Henderson qemu_log("\n"); 28111ee73216SRichard Henderson qemu_log_unlock(); 28125a18407fSRichard Henderson } 28135a18407fSRichard Henderson #endif 28145a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 28155a18407fSRichard Henderson if (liveness_pass_2(s, temp_state)) { 28165a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 28175a18407fSRichard Henderson liveness_pass_1(s, temp_state); 28185a18407fSRichard Henderson } 28195a18407fSRichard Henderson } 28205a18407fSRichard Henderson } 2821c5cc28ffSAurelien Jarno 2822a23a9ec6Sbellard #ifdef CONFIG_PROFILER 2823a23a9ec6Sbellard s->la_time += profile_getclock(); 2824a23a9ec6Sbellard #endif 2825c896fe29Sbellard 2826c896fe29Sbellard #ifdef DEBUG_DISAS 2827d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 2828d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 28291ee73216SRichard Henderson qemu_log_lock(); 2830c5cc28ffSAurelien Jarno qemu_log("OP after optimization and liveness analysis:\n"); 2831eeacee4dSBlue Swirl tcg_dump_ops(s); 283293fcfe39Saliguori qemu_log("\n"); 28331ee73216SRichard Henderson qemu_log_unlock(); 2834c896fe29Sbellard } 2835c896fe29Sbellard #endif 2836c896fe29Sbellard 2837c896fe29Sbellard tcg_reg_alloc_start(s); 2838c896fe29Sbellard 28395bd2ec3dSAlex Bennée s->code_buf = tb->tc_ptr; 28405bd2ec3dSAlex Bennée s->code_ptr = tb->tc_ptr; 2841c896fe29Sbellard 2842659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 2843659ef5cbSRichard Henderson s->ldst_labels = NULL; 2844659ef5cbSRichard Henderson #endif 284557a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 284657a26946SRichard Henderson s->pool_labels = NULL; 284757a26946SRichard Henderson #endif 28489ecefc84SRichard Henderson 2849fca8a500SRichard Henderson num_insns = -1; 2850dcb8e758SRichard Henderson for (oi = s->gen_op_buf[0].next; oi != 0; oi = oi_next) { 2851c45cb8bbSRichard Henderson TCGOp * const op = &s->gen_op_buf[oi]; 2852c45cb8bbSRichard Henderson TCGArg * const args = &s->gen_opparam_buf[op->args]; 2853c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 2854c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 2855bee158cbSRichard Henderson TCGLifeData arg_life = op->life; 2856b3db8758Sblueswir1 2857c45cb8bbSRichard Henderson oi_next = op->next; 2858c896fe29Sbellard #ifdef CONFIG_PROFILER 285954604f74Saurel32 tcg_table_op_count[opc]++; 2860c896fe29Sbellard #endif 2861c45cb8bbSRichard Henderson 2862c896fe29Sbellard switch (opc) { 2863c896fe29Sbellard case INDEX_op_mov_i32: 2864c896fe29Sbellard case INDEX_op_mov_i64: 2865a1b3c48dSRichard Henderson tcg_reg_alloc_mov(s, def, args, arg_life); 2866c896fe29Sbellard break; 2867e8996ee0Sbellard case INDEX_op_movi_i32: 2868e8996ee0Sbellard case INDEX_op_movi_i64: 2869a1b3c48dSRichard Henderson tcg_reg_alloc_movi(s, args, arg_life); 2870e8996ee0Sbellard break; 2871765b842aSRichard Henderson case INDEX_op_insn_start: 2872fca8a500SRichard Henderson if (num_insns >= 0) { 2873fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 2874fca8a500SRichard Henderson } 2875fca8a500SRichard Henderson num_insns++; 2876bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 2877bad729e2SRichard Henderson target_ulong a; 2878bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 2879bad729e2SRichard Henderson a = ((target_ulong)args[i * 2 + 1] << 32) | args[i * 2]; 2880bad729e2SRichard Henderson #else 2881bad729e2SRichard Henderson a = args[i]; 2882bad729e2SRichard Henderson #endif 2883fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 2884bad729e2SRichard Henderson } 2885c896fe29Sbellard break; 28865ff9d6a4Sbellard case INDEX_op_discard: 2887f8bf00f1SRichard Henderson temp_dead(s, &s->temps[args[0]]); 28885ff9d6a4Sbellard break; 2889c896fe29Sbellard case INDEX_op_set_label: 2890e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 2891bec16311SRichard Henderson tcg_out_label(s, arg_label(args[0]), s->code_ptr); 2892c896fe29Sbellard break; 2893c896fe29Sbellard case INDEX_op_call: 2894a1b3c48dSRichard Henderson tcg_reg_alloc_call(s, op->callo, op->calli, args, arg_life); 2895c45cb8bbSRichard Henderson break; 2896c896fe29Sbellard default: 289725c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. */ 2898be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 2899c896fe29Sbellard /* Note: in order to speed up the code, it would be much 2900c896fe29Sbellard faster to have specialized register allocator functions for 2901c896fe29Sbellard some common argument patterns */ 2902a1b3c48dSRichard Henderson tcg_reg_alloc_op(s, def, opc, args, arg_life); 2903c896fe29Sbellard break; 2904c896fe29Sbellard } 29058d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2906c896fe29Sbellard check_regs(s); 2907c896fe29Sbellard #endif 2908b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. The assumption is that any 2909b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 2910b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 2911b125f9dcSRichard Henderson generating code without having to check during generation. */ 2912644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 2913b125f9dcSRichard Henderson return -1; 2914b125f9dcSRichard Henderson } 2915c896fe29Sbellard } 2916fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 2917fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 2918c45cb8bbSRichard Henderson 2919b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 2920659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 2921659ef5cbSRichard Henderson if (!tcg_out_ldst_finalize(s)) { 292223dceda6SRichard Henderson return -1; 292323dceda6SRichard Henderson } 2924659ef5cbSRichard Henderson #endif 292557a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 292657a26946SRichard Henderson if (!tcg_out_pool_finalize(s)) { 292757a26946SRichard Henderson return -1; 292857a26946SRichard Henderson } 292957a26946SRichard Henderson #endif 2930c896fe29Sbellard 2931c896fe29Sbellard /* flush instruction cache */ 29321813e175SRichard Henderson flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr); 29332aeabc08SStefan Weil 29341813e175SRichard Henderson return tcg_current_code_size(s); 2935c896fe29Sbellard } 2936c896fe29Sbellard 2937a23a9ec6Sbellard #ifdef CONFIG_PROFILER 2938405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 2939a23a9ec6Sbellard { 2940a23a9ec6Sbellard TCGContext *s = &tcg_ctx; 2941fca8a500SRichard Henderson int64_t tb_count = s->tb_count; 2942fca8a500SRichard Henderson int64_t tb_div_count = tb_count ? tb_count : 1; 2943fca8a500SRichard Henderson int64_t tot = s->interm_time + s->code_time; 2944a23a9ec6Sbellard 2945a23a9ec6Sbellard cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n", 2946a23a9ec6Sbellard tot, tot / 2.4e9); 2947a23a9ec6Sbellard cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n", 2948fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 2949fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 2950fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 2951a23a9ec6Sbellard cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n", 2952fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 2953a23a9ec6Sbellard cpu_fprintf(f, "deleted ops/TB %0.2f\n", 2954fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 2955a23a9ec6Sbellard cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n", 2956fca8a500SRichard Henderson (double)s->temp_count / tb_div_count, s->temp_count_max); 2957fca8a500SRichard Henderson cpu_fprintf(f, "avg host code/TB %0.1f\n", 2958fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 2959fca8a500SRichard Henderson cpu_fprintf(f, "avg search data/TB %0.1f\n", 2960fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 2961a23a9ec6Sbellard 2962a23a9ec6Sbellard cpu_fprintf(f, "cycles/op %0.1f\n", 2963a23a9ec6Sbellard s->op_count ? (double)tot / s->op_count : 0); 2964a23a9ec6Sbellard cpu_fprintf(f, "cycles/in byte %0.1f\n", 2965a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 2966a23a9ec6Sbellard cpu_fprintf(f, "cycles/out byte %0.1f\n", 2967a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 2968fca8a500SRichard Henderson cpu_fprintf(f, "cycles/search byte %0.1f\n", 2969fca8a500SRichard Henderson s->search_out_len ? (double)tot / s->search_out_len : 0); 2970fca8a500SRichard Henderson if (tot == 0) { 2971a23a9ec6Sbellard tot = 1; 2972fca8a500SRichard Henderson } 2973a23a9ec6Sbellard cpu_fprintf(f, " gen_interm time %0.1f%%\n", 2974a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 2975a23a9ec6Sbellard cpu_fprintf(f, " gen_code time %0.1f%%\n", 2976a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 2977c5cc28ffSAurelien Jarno cpu_fprintf(f, "optim./code time %0.1f%%\n", 2978c5cc28ffSAurelien Jarno (double)s->opt_time / (s->code_time ? s->code_time : 1) 2979c5cc28ffSAurelien Jarno * 100.0); 2980a23a9ec6Sbellard cpu_fprintf(f, "liveness/code time %0.1f%%\n", 2981a23a9ec6Sbellard (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0); 2982a23a9ec6Sbellard cpu_fprintf(f, "cpu_restore count %" PRId64 "\n", 2983a23a9ec6Sbellard s->restore_count); 2984a23a9ec6Sbellard cpu_fprintf(f, " avg cycles %0.1f\n", 2985a23a9ec6Sbellard s->restore_count ? (double)s->restore_time / s->restore_count : 0); 2986a23a9ec6Sbellard } 2987a23a9ec6Sbellard #else 2988405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 2989a23a9ec6Sbellard { 299024bf7b3aSbellard cpu_fprintf(f, "[TCG profiler not compiled]\n"); 2991a23a9ec6Sbellard } 2992a23a9ec6Sbellard #endif 2993813da627SRichard Henderson 2994813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 29955872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 29965872bbf2SRichard Henderson 29975872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 29985872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 29995872bbf2SRichard Henderson 30005872bbf2SRichard Henderson (2) Define tcg_register_jit. This should create a buffer containing 30015872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 30025872bbf2SRichard Henderson prologue unwind info for the tcg machine. 30035872bbf2SRichard Henderson 30045872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 30055872bbf2SRichard Henderson */ 3006813da627SRichard Henderson 3007813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */ 3008813da627SRichard Henderson typedef enum { 3009813da627SRichard Henderson JIT_NOACTION = 0, 3010813da627SRichard Henderson JIT_REGISTER_FN, 3011813da627SRichard Henderson JIT_UNREGISTER_FN 3012813da627SRichard Henderson } jit_actions_t; 3013813da627SRichard Henderson 3014813da627SRichard Henderson struct jit_code_entry { 3015813da627SRichard Henderson struct jit_code_entry *next_entry; 3016813da627SRichard Henderson struct jit_code_entry *prev_entry; 3017813da627SRichard Henderson const void *symfile_addr; 3018813da627SRichard Henderson uint64_t symfile_size; 3019813da627SRichard Henderson }; 3020813da627SRichard Henderson 3021813da627SRichard Henderson struct jit_descriptor { 3022813da627SRichard Henderson uint32_t version; 3023813da627SRichard Henderson uint32_t action_flag; 3024813da627SRichard Henderson struct jit_code_entry *relevant_entry; 3025813da627SRichard Henderson struct jit_code_entry *first_entry; 3026813da627SRichard Henderson }; 3027813da627SRichard Henderson 3028813da627SRichard Henderson void __jit_debug_register_code(void) __attribute__((noinline)); 3029813da627SRichard Henderson void __jit_debug_register_code(void) 3030813da627SRichard Henderson { 3031813da627SRichard Henderson asm(""); 3032813da627SRichard Henderson } 3033813da627SRichard Henderson 3034813da627SRichard Henderson /* Must statically initialize the version, because GDB may check 3035813da627SRichard Henderson the version before we can set it. */ 3036813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 }; 3037813da627SRichard Henderson 3038813da627SRichard Henderson /* End GDB interface. */ 3039813da627SRichard Henderson 3040813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 3041813da627SRichard Henderson { 3042813da627SRichard Henderson const char *p = strtab + 1; 3043813da627SRichard Henderson 3044813da627SRichard Henderson while (1) { 3045813da627SRichard Henderson if (strcmp(p, str) == 0) { 3046813da627SRichard Henderson return p - strtab; 3047813da627SRichard Henderson } 3048813da627SRichard Henderson p += strlen(p) + 1; 3049813da627SRichard Henderson } 3050813da627SRichard Henderson } 3051813da627SRichard Henderson 30525872bbf2SRichard Henderson static void tcg_register_jit_int(void *buf_ptr, size_t buf_size, 30532c90784aSRichard Henderson const void *debug_frame, 30542c90784aSRichard Henderson size_t debug_frame_size) 3055813da627SRichard Henderson { 30565872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 30575872bbf2SRichard Henderson uint32_t len; 30585872bbf2SRichard Henderson uint16_t version; 30595872bbf2SRichard Henderson uint32_t abbrev; 30605872bbf2SRichard Henderson uint8_t ptr_size; 30615872bbf2SRichard Henderson uint8_t cu_die; 30625872bbf2SRichard Henderson uint16_t cu_lang; 30635872bbf2SRichard Henderson uintptr_t cu_low_pc; 30645872bbf2SRichard Henderson uintptr_t cu_high_pc; 30655872bbf2SRichard Henderson uint8_t fn_die; 30665872bbf2SRichard Henderson char fn_name[16]; 30675872bbf2SRichard Henderson uintptr_t fn_low_pc; 30685872bbf2SRichard Henderson uintptr_t fn_high_pc; 30695872bbf2SRichard Henderson uint8_t cu_eoc; 30705872bbf2SRichard Henderson }; 3071813da627SRichard Henderson 3072813da627SRichard Henderson struct ElfImage { 3073813da627SRichard Henderson ElfW(Ehdr) ehdr; 3074813da627SRichard Henderson ElfW(Phdr) phdr; 30755872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 30765872bbf2SRichard Henderson ElfW(Sym) sym[2]; 30775872bbf2SRichard Henderson struct DebugInfo di; 30785872bbf2SRichard Henderson uint8_t da[24]; 30795872bbf2SRichard Henderson char str[80]; 30805872bbf2SRichard Henderson }; 30815872bbf2SRichard Henderson 30825872bbf2SRichard Henderson struct ElfImage *img; 30835872bbf2SRichard Henderson 30845872bbf2SRichard Henderson static const struct ElfImage img_template = { 30855872bbf2SRichard Henderson .ehdr = { 30865872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 30875872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 30885872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 30895872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 30905872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 30915872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 30925872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 30935872bbf2SRichard Henderson .e_type = ET_EXEC, 30945872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 30955872bbf2SRichard Henderson .e_version = EV_CURRENT, 30965872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 30975872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 30985872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 30995872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 31005872bbf2SRichard Henderson .e_phnum = 1, 31015872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 31025872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 31035872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 3104abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 3105abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 3106abbb3eaeSRichard Henderson #endif 3107abbb3eaeSRichard Henderson #ifdef ELF_OSABI 3108abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 3109abbb3eaeSRichard Henderson #endif 31105872bbf2SRichard Henderson }, 31115872bbf2SRichard Henderson .phdr = { 31125872bbf2SRichard Henderson .p_type = PT_LOAD, 31135872bbf2SRichard Henderson .p_flags = PF_X, 31145872bbf2SRichard Henderson }, 31155872bbf2SRichard Henderson .shdr = { 31165872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 31175872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 31185872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 31195872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 31205872bbf2SRichard Henderson will not look for contents. We can record any address. */ 31215872bbf2SRichard Henderson [1] = { /* .text */ 31225872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 31235872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 31245872bbf2SRichard Henderson }, 31255872bbf2SRichard Henderson [2] = { /* .debug_info */ 31265872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 31275872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 31285872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 31295872bbf2SRichard Henderson }, 31305872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 31315872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 31325872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 31335872bbf2SRichard Henderson .sh_size = sizeof(img->da), 31345872bbf2SRichard Henderson }, 31355872bbf2SRichard Henderson [4] = { /* .debug_frame */ 31365872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 31375872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 31385872bbf2SRichard Henderson }, 31395872bbf2SRichard Henderson [5] = { /* .symtab */ 31405872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 31415872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 31425872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 31435872bbf2SRichard Henderson .sh_info = 1, 31445872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 31455872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 31465872bbf2SRichard Henderson }, 31475872bbf2SRichard Henderson [6] = { /* .strtab */ 31485872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 31495872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, str), 31505872bbf2SRichard Henderson .sh_size = sizeof(img->str), 31515872bbf2SRichard Henderson } 31525872bbf2SRichard Henderson }, 31535872bbf2SRichard Henderson .sym = { 31545872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 31555872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 31565872bbf2SRichard Henderson .st_shndx = 1, 31575872bbf2SRichard Henderson } 31585872bbf2SRichard Henderson }, 31595872bbf2SRichard Henderson .di = { 31605872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 31615872bbf2SRichard Henderson .version = 2, 31625872bbf2SRichard Henderson .ptr_size = sizeof(void *), 31635872bbf2SRichard Henderson .cu_die = 1, 31645872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 31655872bbf2SRichard Henderson .fn_die = 2, 31665872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 31675872bbf2SRichard Henderson }, 31685872bbf2SRichard Henderson .da = { 31695872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 31705872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 31715872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 31725872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 31735872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 31745872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 31755872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 31765872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 31775872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 31785872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 31795872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 31805872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 31815872bbf2SRichard Henderson 0 /* no more abbrev */ 31825872bbf2SRichard Henderson }, 31835872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 31845872bbf2SRichard Henderson ".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 3185813da627SRichard Henderson }; 3186813da627SRichard Henderson 3187813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 3188813da627SRichard Henderson static struct jit_code_entry one_entry; 3189813da627SRichard Henderson 31905872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 3191813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 31922c90784aSRichard Henderson DebugFrameHeader *dfh; 3193813da627SRichard Henderson 31945872bbf2SRichard Henderson img = g_malloc(img_size); 31955872bbf2SRichard Henderson *img = img_template; 3196813da627SRichard Henderson 31975872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 31985872bbf2SRichard Henderson img->phdr.p_paddr = buf; 31995872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 3200813da627SRichard Henderson 32015872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 32025872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 32035872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 3204813da627SRichard Henderson 32055872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 32065872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 32075872bbf2SRichard Henderson 32085872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 32095872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 32105872bbf2SRichard Henderson 32115872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 32125872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 32135872bbf2SRichard Henderson 32145872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 32155872bbf2SRichard Henderson img->sym[1].st_value = buf; 32165872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 32175872bbf2SRichard Henderson 32185872bbf2SRichard Henderson img->di.cu_low_pc = buf; 321945aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 32205872bbf2SRichard Henderson img->di.fn_low_pc = buf; 322145aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 3222813da627SRichard Henderson 32232c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 32242c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 32252c90784aSRichard Henderson dfh->fde.func_start = buf; 32262c90784aSRichard Henderson dfh->fde.func_len = buf_size; 32272c90784aSRichard Henderson 3228813da627SRichard Henderson #ifdef DEBUG_JIT 3229813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 3230813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 3231813da627SRichard Henderson { 3232813da627SRichard Henderson FILE *f = fopen("/tmp/qemu.jit", "w+b"); 3233813da627SRichard Henderson if (f) { 32345872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 3235813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. */ 3236813da627SRichard Henderson } 3237813da627SRichard Henderson fclose(f); 3238813da627SRichard Henderson } 3239813da627SRichard Henderson } 3240813da627SRichard Henderson #endif 3241813da627SRichard Henderson 3242813da627SRichard Henderson one_entry.symfile_addr = img; 3243813da627SRichard Henderson one_entry.symfile_size = img_size; 3244813da627SRichard Henderson 3245813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 3246813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 3247813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 3248813da627SRichard Henderson __jit_debug_register_code(); 3249813da627SRichard Henderson } 3250813da627SRichard Henderson #else 32515872bbf2SRichard Henderson /* No support for the feature. Provide the entry point expected by exec.c, 32525872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 3253813da627SRichard Henderson 3254813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 32552c90784aSRichard Henderson const void *debug_frame, 32562c90784aSRichard Henderson size_t debug_frame_size) 3257813da627SRichard Henderson { 3258813da627SRichard Henderson } 3259813da627SRichard Henderson 3260813da627SRichard Henderson void tcg_register_jit(void *buf, size_t buf_size) 3261813da627SRichard Henderson { 3262813da627SRichard Henderson } 3263813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 3264