/*
 * Tiny Code Generator for QEMU
 *
 * Copyright (c) 2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

/* define it to use liveness analysis (better code) */
#define USE_TCG_OPTIMIZATIONS

#include "qemu/osdep.h"

/* Define to dump the ELF file used to communicate with GDB.  */
#undef DEBUG_JIT

#include "qemu/cutils.h"
#include "qemu/host-utils.h"
#include "qemu/timer.h"

/* Note: the long term plan is to reduce the dependencies on the QEMU
   CPU definitions.  Currently they are used for the qemu_ld/st
   instructions.  */
#define NO_CPU_IO_DEFS
#include "cpu.h"

#include "exec/cpu-common.h"
#include "exec/exec-all.h"

#include "tcg-op.h"

/* Pick the ELF class from the host pointer width and the ELF data
   encoding from the host byte order.  */
#if UINTPTR_MAX == UINT32_MAX
# define ELF_CLASS  ELFCLASS32
#else
# define ELF_CLASS  ELFCLASS64
#endif
#ifdef HOST_WORDS_BIGENDIAN
# define ELF_DATA   ELFDATA2MSB
#else
# define ELF_DATA   ELFDATA2LSB
#endif

#include "elf.h"
#include "exec/log.h"

/* Forward declarations for functions defined in tcg-target.inc.c and
   used here.  */
static void tcg_target_init(TCGContext *s);
static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode);
static void tcg_target_qemu_prologue(TCGContext *s);
static void patch_reloc(tcg_insn_unit *code_ptr, int type,
                        intptr_t value, intptr_t addend);

/* The CIE and FDE header definitions will be common to all hosts.  */

/* CIE header.  The aligned attribute forces 'len' (and therefore the
   structure) to pointer-size alignment.  */
typedef struct {
    uint32_t len __attribute__((aligned((sizeof(void *)))));
    uint32_t id;
    uint8_t version;
    char augmentation[1];
    uint8_t code_align;
    uint8_t data_align;
    uint8_t return_column;
} DebugFrameCIE;

/* FDE header.  Packed, with 'len' again pointer-size aligned; the
   function start and length are host-pointer-sized integers.  */
typedef struct QEMU_PACKED {
    uint32_t len __attribute__((aligned((sizeof(void *)))));
    uint32_t cie_offset;
    uintptr_t func_start;
    uintptr_t func_len;
} DebugFrameFDEHeader;

/* A CIE immediately followed by an FDE header.  */
typedef struct QEMU_PACKED {
    DebugFrameCIE cie;
    DebugFrameFDEHeader fde;
} DebugFrameHeader;

/* Declared 'unused' so that no warning is raised if nothing in this
   translation unit ends up calling it.  */
static void tcg_register_jit_int(void *buf, size_t size,
                                 const void *debug_frame,
                                 size_t debug_frame_size)
    __attribute__((unused));

/* Forward declarations for functions defined and used in
   tcg-target.inc.c.  */
static const char *target_parse_constraint(TCGArgConstraint *ct,
                                           const char *ct_str, TCGType type);
static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1,
                       intptr_t arg2);
static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg);
static void tcg_out_movi(TCGContext *s, TCGType type,
                         TCGReg ret, tcg_target_long arg);
static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
                       const int *const_args);
static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1,
                       intptr_t arg2);
static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
                        TCGReg base, intptr_t ofs);
static void tcg_out_call(TCGContext *s, tcg_insn_unit *target);
static int tcg_target_const_match(tcg_target_long val, TCGType type,
                                  const TCGArgConstraint *arg_ct);
#ifdef TCG_TARGET_NEED_LDST_LABELS
static bool tcg_out_ldst_finalize(TCGContext *s);
#endif

/* Margin kept between code_gen_highwater and the end of the code
   buffer; subtracted from the buffer size in tcg_prologue_init().  */
#define TCG_HIGHWATER 1024

Cota 121b1d8e52eSblueswir1 static TCGRegSet tcg_target_available_regs[2]; 122b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 123c896fe29Sbellard 1241813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1254196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 126c896fe29Sbellard { 127c896fe29Sbellard *s->code_ptr++ = v; 128c896fe29Sbellard } 129c896fe29Sbellard 1304196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1314196dca6SPeter Maydell uint8_t v) 1325c53bb81SPeter Maydell { 1331813e175SRichard Henderson *p = v; 1345c53bb81SPeter Maydell } 1351813e175SRichard Henderson #endif 1365c53bb81SPeter Maydell 1371813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1384196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 139c896fe29Sbellard { 1401813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1411813e175SRichard Henderson *s->code_ptr++ = v; 1421813e175SRichard Henderson } else { 1431813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1444387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1451813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 1461813e175SRichard Henderson } 147c896fe29Sbellard } 148c896fe29Sbellard 1494196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 1504196dca6SPeter Maydell uint16_t v) 1515c53bb81SPeter Maydell { 1521813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1531813e175SRichard Henderson *p = v; 1541813e175SRichard Henderson } else { 1555c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 1565c53bb81SPeter Maydell } 1571813e175SRichard Henderson } 1581813e175SRichard Henderson #endif 1595c53bb81SPeter Maydell 1601813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 1614196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t 
v) 162c896fe29Sbellard { 1631813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 1641813e175SRichard Henderson *s->code_ptr++ = v; 1651813e175SRichard Henderson } else { 1661813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1674387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1681813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 1691813e175SRichard Henderson } 170c896fe29Sbellard } 171c896fe29Sbellard 1724196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 1734196dca6SPeter Maydell uint32_t v) 1745c53bb81SPeter Maydell { 1751813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 1761813e175SRichard Henderson *p = v; 1771813e175SRichard Henderson } else { 1785c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 1795c53bb81SPeter Maydell } 1801813e175SRichard Henderson } 1811813e175SRichard Henderson #endif 1825c53bb81SPeter Maydell 1831813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 1844196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 185ac26eb69SRichard Henderson { 1861813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 1871813e175SRichard Henderson *s->code_ptr++ = v; 1881813e175SRichard Henderson } else { 1891813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1904387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1911813e175SRichard Henderson s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE); 1921813e175SRichard Henderson } 193ac26eb69SRichard Henderson } 194ac26eb69SRichard Henderson 1954196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 1964196dca6SPeter Maydell uint64_t v) 1975c53bb81SPeter Maydell { 1981813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 1991813e175SRichard Henderson *p = v; 2001813e175SRichard Henderson } else { 2015c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2025c53bb81SPeter Maydell } 2031813e175SRichard 
Henderson } 2041813e175SRichard Henderson #endif 2055c53bb81SPeter Maydell 206c896fe29Sbellard /* label relocation processing */ 207c896fe29Sbellard 2081813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 209bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 210c896fe29Sbellard { 211c896fe29Sbellard TCGRelocation *r; 212c896fe29Sbellard 213c896fe29Sbellard if (l->has_value) { 214623e265cSpbrook /* FIXME: This may break relocations on RISC targets that 215623e265cSpbrook modify instruction fields in place. The caller may not have 216623e265cSpbrook written the initial value. */ 217f54b3f92Saurel32 patch_reloc(code_ptr, type, l->u.value, addend); 218c896fe29Sbellard } else { 219c896fe29Sbellard /* add a new relocation entry */ 220c896fe29Sbellard r = tcg_malloc(sizeof(TCGRelocation)); 221c896fe29Sbellard r->type = type; 222c896fe29Sbellard r->ptr = code_ptr; 223c896fe29Sbellard r->addend = addend; 224c896fe29Sbellard r->next = l->u.first_reloc; 225c896fe29Sbellard l->u.first_reloc = r; 226c896fe29Sbellard } 227c896fe29Sbellard } 228c896fe29Sbellard 229bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr) 230c896fe29Sbellard { 2312ba7fae2SRichard Henderson intptr_t value = (intptr_t)ptr; 2321813e175SRichard Henderson TCGRelocation *r; 233c896fe29Sbellard 234eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 2351813e175SRichard Henderson 2361813e175SRichard Henderson for (r = l->u.first_reloc; r != NULL; r = r->next) { 237f54b3f92Saurel32 patch_reloc(r->ptr, r->type, value, r->addend); 238c896fe29Sbellard } 2391813e175SRichard Henderson 240c896fe29Sbellard l->has_value = 1; 2411813e175SRichard Henderson l->u.value_ptr = ptr; 242c896fe29Sbellard } 243c896fe29Sbellard 24442a268c2SRichard Henderson TCGLabel *gen_new_label(void) 245c896fe29Sbellard { 246c896fe29Sbellard TCGContext *s = &tcg_ctx; 24751e3972cSRichard Henderson TCGLabel *l = 
tcg_malloc(sizeof(TCGLabel)); 248c896fe29Sbellard 24951e3972cSRichard Henderson *l = (TCGLabel){ 25051e3972cSRichard Henderson .id = s->nb_labels++ 25151e3972cSRichard Henderson }; 25242a268c2SRichard Henderson 25342a268c2SRichard Henderson return l; 254c896fe29Sbellard } 255c896fe29Sbellard 256ce151109SPeter Maydell #include "tcg-target.inc.c" 257c896fe29Sbellard 258c896fe29Sbellard /* pool based memory allocation */ 259c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 260c896fe29Sbellard { 261c896fe29Sbellard TCGPool *p; 262c896fe29Sbellard int pool_size; 263c896fe29Sbellard 264c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 265c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 2667267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 267c896fe29Sbellard p->size = size; 2684055299eSKirill Batuzov p->next = s->pool_first_large; 2694055299eSKirill Batuzov s->pool_first_large = p; 2704055299eSKirill Batuzov return p->data; 271c896fe29Sbellard } else { 272c896fe29Sbellard p = s->pool_current; 273c896fe29Sbellard if (!p) { 274c896fe29Sbellard p = s->pool_first; 275c896fe29Sbellard if (!p) 276c896fe29Sbellard goto new_pool; 277c896fe29Sbellard } else { 278c896fe29Sbellard if (!p->next) { 279c896fe29Sbellard new_pool: 280c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 2817267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 282c896fe29Sbellard p->size = pool_size; 283c896fe29Sbellard p->next = NULL; 284c896fe29Sbellard if (s->pool_current) 285c896fe29Sbellard s->pool_current->next = p; 286c896fe29Sbellard else 287c896fe29Sbellard s->pool_first = p; 288c896fe29Sbellard } else { 289c896fe29Sbellard p = p->next; 290c896fe29Sbellard } 291c896fe29Sbellard } 292c896fe29Sbellard } 293c896fe29Sbellard s->pool_current = p; 294c896fe29Sbellard s->pool_cur = p->data + size; 295c896fe29Sbellard s->pool_end = p->data + p->size; 296c896fe29Sbellard return p->data; 297c896fe29Sbellard } 298c896fe29Sbellard 
299c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 300c896fe29Sbellard { 3014055299eSKirill Batuzov TCGPool *p, *t; 3024055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 3034055299eSKirill Batuzov t = p->next; 3044055299eSKirill Batuzov g_free(p); 3054055299eSKirill Batuzov } 3064055299eSKirill Batuzov s->pool_first_large = NULL; 307c896fe29Sbellard s->pool_cur = s->pool_end = NULL; 308c896fe29Sbellard s->pool_current = NULL; 309c896fe29Sbellard } 310c896fe29Sbellard 311100b5e01SRichard Henderson typedef struct TCGHelperInfo { 312100b5e01SRichard Henderson void *func; 313100b5e01SRichard Henderson const char *name; 314afb49896SRichard Henderson unsigned flags; 315afb49896SRichard Henderson unsigned sizemask; 316100b5e01SRichard Henderson } TCGHelperInfo; 317100b5e01SRichard Henderson 3182ef6175aSRichard Henderson #include "exec/helper-proto.h" 3192ef6175aSRichard Henderson 320100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 3212ef6175aSRichard Henderson #include "exec/helper-tcg.h" 322100b5e01SRichard Henderson }; 323619205fdSEmilio G. 
Cota static GHashTable *helper_table; 324100b5e01SRichard Henderson 32591478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 326f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 32791478cefSRichard Henderson 328c896fe29Sbellard void tcg_context_init(TCGContext *s) 329c896fe29Sbellard { 330100b5e01SRichard Henderson int op, total_args, n, i; 331c896fe29Sbellard TCGOpDef *def; 332c896fe29Sbellard TCGArgConstraint *args_ct; 333c896fe29Sbellard int *sorted_args; 334c896fe29Sbellard 335c896fe29Sbellard memset(s, 0, sizeof(*s)); 336c896fe29Sbellard s->nb_globals = 0; 337c896fe29Sbellard 338c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 339c896fe29Sbellard space */ 340c896fe29Sbellard total_args = 0; 341c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 342c896fe29Sbellard def = &tcg_op_defs[op]; 343c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 344c896fe29Sbellard total_args += n; 345c896fe29Sbellard } 346c896fe29Sbellard 3477267c094SAnthony Liguori args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args); 3487267c094SAnthony Liguori sorted_args = g_malloc(sizeof(int) * total_args); 349c896fe29Sbellard 350c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 351c896fe29Sbellard def = &tcg_op_defs[op]; 352c896fe29Sbellard def->args_ct = args_ct; 353c896fe29Sbellard def->sorted_args = sorted_args; 354c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 355c896fe29Sbellard sorted_args += n; 356c896fe29Sbellard args_ct += n; 357c896fe29Sbellard } 358c896fe29Sbellard 3595cd8f621SRichard Henderson /* Register helpers. */ 36084fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 361619205fdSEmilio G. 
Cota helper_table = g_hash_table_new(NULL, NULL); 36284fd9dd3SRichard Henderson 363100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 36484fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 36572866e82SRichard Henderson (gpointer)&all_helpers[i]); 366100b5e01SRichard Henderson } 3675cd8f621SRichard Henderson 368c896fe29Sbellard tcg_target_init(s); 369f69d277eSRichard Henderson process_op_defs(s); 37091478cefSRichard Henderson 37191478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 37291478cefSRichard Henderson the start of tcg_target_reg_alloc_order. */ 37391478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 37491478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 37591478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 37691478cefSRichard Henderson break; 37791478cefSRichard Henderson } 37891478cefSRichard Henderson } 37991478cefSRichard Henderson for (i = 0; i < n; ++i) { 38091478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 38191478cefSRichard Henderson } 38291478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 38391478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 38491478cefSRichard Henderson } 3859002ec79SRichard Henderson } 386b03cce8eSbellard 3876e3b2bfdSEmilio G. Cota /* 3886e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 3896e3b2bfdSEmilio G. Cota * sure that TBs and code are on different cache lines. 3906e3b2bfdSEmilio G. Cota */ 3916e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 3926e3b2bfdSEmilio G. Cota { 3936e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 3946e3b2bfdSEmilio G. Cota TranslationBlock *tb; 3956e3b2bfdSEmilio G. Cota void *next; 3966e3b2bfdSEmilio G. 
Cota 3976e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 3986e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 3996e3b2bfdSEmilio G. Cota 4006e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 4016e3b2bfdSEmilio G. Cota return NULL; 4026e3b2bfdSEmilio G. Cota } 4036e3b2bfdSEmilio G. Cota s->code_gen_ptr = next; 40457a26946SRichard Henderson s->data_gen_ptr = NULL; 4056e3b2bfdSEmilio G. Cota return tb; 4066e3b2bfdSEmilio G. Cota } 4076e3b2bfdSEmilio G. Cota 4089002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 4099002ec79SRichard Henderson { 4108163b749SRichard Henderson size_t prologue_size, total_size; 4118163b749SRichard Henderson void *buf0, *buf1; 4128163b749SRichard Henderson 4138163b749SRichard Henderson /* Put the prologue at the beginning of code_gen_buffer. */ 4148163b749SRichard Henderson buf0 = s->code_gen_buffer; 4158163b749SRichard Henderson s->code_ptr = buf0; 4168163b749SRichard Henderson s->code_buf = buf0; 4178163b749SRichard Henderson s->code_gen_prologue = buf0; 4188163b749SRichard Henderson 4198163b749SRichard Henderson /* Generate the prologue. */ 420b03cce8eSbellard tcg_target_qemu_prologue(s); 4218163b749SRichard Henderson buf1 = s->code_ptr; 4228163b749SRichard Henderson flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1); 4238163b749SRichard Henderson 4248163b749SRichard Henderson /* Deduct the prologue from the buffer. 
*/ 4258163b749SRichard Henderson prologue_size = tcg_current_code_size(s); 4268163b749SRichard Henderson s->code_gen_ptr = buf1; 4278163b749SRichard Henderson s->code_gen_buffer = buf1; 4288163b749SRichard Henderson s->code_buf = buf1; 4298163b749SRichard Henderson total_size = s->code_gen_buffer_size - prologue_size; 4308163b749SRichard Henderson s->code_gen_buffer_size = total_size; 4318163b749SRichard Henderson 432b125f9dcSRichard Henderson /* Compute a high-water mark, at which we voluntarily flush the buffer 433b125f9dcSRichard Henderson and start over. The size here is arbitrary, significantly larger 434b125f9dcSRichard Henderson than we expect the code generation for any one opcode to require. */ 435*a505785cSEmilio G. Cota s->code_gen_highwater = s->code_gen_buffer + (total_size - TCG_HIGHWATER); 4368163b749SRichard Henderson 4378163b749SRichard Henderson tcg_register_jit(s->code_gen_buffer, total_size); 438d6b64b2bSRichard Henderson 439d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 440d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 4411ee73216SRichard Henderson qemu_log_lock(); 4428163b749SRichard Henderson qemu_log("PROLOGUE: [size=%zu]\n", prologue_size); 4438163b749SRichard Henderson log_disas(buf0, prologue_size); 444d6b64b2bSRichard Henderson qemu_log("\n"); 445d6b64b2bSRichard Henderson qemu_log_flush(); 4461ee73216SRichard Henderson qemu_log_unlock(); 447d6b64b2bSRichard Henderson } 448d6b64b2bSRichard Henderson #endif 449cedbcb01SEmilio G. Cota 450cedbcb01SEmilio G. Cota /* Assert that goto_ptr is implemented completely. */ 451cedbcb01SEmilio G. Cota if (TCG_TARGET_HAS_goto_ptr) { 452cedbcb01SEmilio G. Cota tcg_debug_assert(s->code_gen_epilogue != NULL); 453cedbcb01SEmilio G. 
Cota } 454c896fe29Sbellard } 455c896fe29Sbellard 456c896fe29Sbellard void tcg_func_start(TCGContext *s) 457c896fe29Sbellard { 458c896fe29Sbellard tcg_pool_reset(s); 459c896fe29Sbellard s->nb_temps = s->nb_globals; 4600ec9eabcSRichard Henderson 4610ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. */ 4620ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 4630ec9eabcSRichard Henderson 464c896fe29Sbellard s->nb_labels = 0; 465c896fe29Sbellard s->current_frame_offset = s->frame_start; 466c896fe29Sbellard 4670a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 4680a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 4690a209d4bSRichard Henderson #endif 4700a209d4bSRichard Henderson 471dcb8e758SRichard Henderson s->gen_op_buf[0].next = 1; 472dcb8e758SRichard Henderson s->gen_op_buf[0].prev = 0; 473dcb8e758SRichard Henderson s->gen_next_op_idx = 1; 474c45cb8bbSRichard Henderson s->gen_next_parm_idx = 0; 475c896fe29Sbellard } 476c896fe29Sbellard 4777ca4b752SRichard Henderson static inline int temp_idx(TCGContext *s, TCGTemp *ts) 478c896fe29Sbellard { 4797ca4b752SRichard Henderson ptrdiff_t n = ts - s->temps; 4807ca4b752SRichard Henderson tcg_debug_assert(n >= 0 && n < s->nb_temps); 4817ca4b752SRichard Henderson return n; 4827ca4b752SRichard Henderson } 4837ca4b752SRichard Henderson 4847ca4b752SRichard Henderson static inline TCGTemp *tcg_temp_alloc(TCGContext *s) 4857ca4b752SRichard Henderson { 4867ca4b752SRichard Henderson int n = s->nb_temps++; 4877ca4b752SRichard Henderson tcg_debug_assert(n < TCG_MAX_TEMPS); 4887ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 4897ca4b752SRichard Henderson } 4907ca4b752SRichard Henderson 4917ca4b752SRichard Henderson static inline TCGTemp *tcg_global_alloc(TCGContext *s) 4927ca4b752SRichard Henderson { 4937ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 4947ca4b752SRichard Henderson s->nb_globals++; 4957ca4b752SRichard 
Henderson return tcg_temp_alloc(s); 496c896fe29Sbellard } 497c896fe29Sbellard 498b3a62939SRichard Henderson static int tcg_global_reg_new_internal(TCGContext *s, TCGType type, 499b6638662SRichard Henderson TCGReg reg, const char *name) 500c896fe29Sbellard { 501c896fe29Sbellard TCGTemp *ts; 502c896fe29Sbellard 503b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 504c896fe29Sbellard tcg_abort(); 505b3a62939SRichard Henderson } 5067ca4b752SRichard Henderson 5077ca4b752SRichard Henderson ts = tcg_global_alloc(s); 508c896fe29Sbellard ts->base_type = type; 509c896fe29Sbellard ts->type = type; 510c896fe29Sbellard ts->fixed_reg = 1; 511c896fe29Sbellard ts->reg = reg; 512c896fe29Sbellard ts->name = name; 513c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 5147ca4b752SRichard Henderson 5157ca4b752SRichard Henderson return temp_idx(s, ts); 516a7812ae4Spbrook } 517a7812ae4Spbrook 518b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 519a7812ae4Spbrook { 520a7812ae4Spbrook int idx; 521b3a62939SRichard Henderson s->frame_start = start; 522b3a62939SRichard Henderson s->frame_end = start + size; 523b3a62939SRichard Henderson idx = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 524b3a62939SRichard Henderson s->frame_temp = &s->temps[idx]; 525b3a62939SRichard Henderson } 526a7812ae4Spbrook 527b6638662SRichard Henderson TCGv_i32 tcg_global_reg_new_i32(TCGReg reg, const char *name) 528b3a62939SRichard Henderson { 529b3a62939SRichard Henderson TCGContext *s = &tcg_ctx; 530b3a62939SRichard Henderson int idx; 531b3a62939SRichard Henderson 532b3a62939SRichard Henderson if (tcg_regset_test_reg(s->reserved_regs, reg)) { 533b3a62939SRichard Henderson tcg_abort(); 534b3a62939SRichard Henderson } 535b3a62939SRichard Henderson idx = tcg_global_reg_new_internal(s, TCG_TYPE_I32, reg, name); 536a7812ae4Spbrook return MAKE_TCGV_I32(idx); 537a7812ae4Spbrook } 538a7812ae4Spbrook 
539b6638662SRichard Henderson TCGv_i64 tcg_global_reg_new_i64(TCGReg reg, const char *name) 540a7812ae4Spbrook { 541b3a62939SRichard Henderson TCGContext *s = &tcg_ctx; 542a7812ae4Spbrook int idx; 543a7812ae4Spbrook 544b3a62939SRichard Henderson if (tcg_regset_test_reg(s->reserved_regs, reg)) { 545b3a62939SRichard Henderson tcg_abort(); 546b3a62939SRichard Henderson } 547b3a62939SRichard Henderson idx = tcg_global_reg_new_internal(s, TCG_TYPE_I64, reg, name); 548a7812ae4Spbrook return MAKE_TCGV_I64(idx); 549c896fe29Sbellard } 550c896fe29Sbellard 551e1ccc054SRichard Henderson int tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 552e1ccc054SRichard Henderson intptr_t offset, const char *name) 553c896fe29Sbellard { 554c896fe29Sbellard TCGContext *s = &tcg_ctx; 5557ca4b752SRichard Henderson TCGTemp *base_ts = &s->temps[GET_TCGV_PTR(base)]; 5567ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 557b3915dbbSRichard Henderson int indirect_reg = 0, bigendian = 0; 5587ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 5597ca4b752SRichard Henderson bigendian = 1; 5607ca4b752SRichard Henderson #endif 561c896fe29Sbellard 562b3915dbbSRichard Henderson if (!base_ts->fixed_reg) { 5635a18407fSRichard Henderson /* We do not support double-indirect registers. */ 5645a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 565b3915dbbSRichard Henderson base_ts->indirect_base = 1; 5665a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 5675a18407fSRichard Henderson ? 
2 : 1); 5685a18407fSRichard Henderson indirect_reg = 1; 569b3915dbbSRichard Henderson } 570b3915dbbSRichard Henderson 5717ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 5727ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 573c896fe29Sbellard char buf[64]; 5747ca4b752SRichard Henderson 5757ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 576c896fe29Sbellard ts->type = TCG_TYPE_I32; 577b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 578c896fe29Sbellard ts->mem_allocated = 1; 579b3a62939SRichard Henderson ts->mem_base = base_ts; 5807ca4b752SRichard Henderson ts->mem_offset = offset + bigendian * 4; 581c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 582c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 583c896fe29Sbellard ts->name = strdup(buf); 584c896fe29Sbellard 5857ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 5867ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 5877ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 588b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 5897ca4b752SRichard Henderson ts2->mem_allocated = 1; 5907ca4b752SRichard Henderson ts2->mem_base = base_ts; 5917ca4b752SRichard Henderson ts2->mem_offset = offset + (1 - bigendian) * 4; 592c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 593c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 594120c1084SRichard Henderson ts2->name = strdup(buf); 5957ca4b752SRichard Henderson } else { 596c896fe29Sbellard ts->base_type = type; 597c896fe29Sbellard ts->type = type; 598b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 599c896fe29Sbellard ts->mem_allocated = 1; 600b3a62939SRichard Henderson ts->mem_base = base_ts; 601c896fe29Sbellard ts->mem_offset = offset; 602c896fe29Sbellard ts->name = name; 603c896fe29Sbellard } 6047ca4b752SRichard Henderson return temp_idx(s, ts); 605c896fe29Sbellard } 606c896fe29Sbellard 6077ca4b752SRichard Henderson static int tcg_temp_new_internal(TCGType type, int 
temp_local) 608c896fe29Sbellard { 609c896fe29Sbellard TCGContext *s = &tcg_ctx; 610c896fe29Sbellard TCGTemp *ts; 611641d5fbeSbellard int idx, k; 612c896fe29Sbellard 6130ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 6140ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 6150ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 6160ec9eabcSRichard Henderson /* There is already an available temp with the right type. */ 6170ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 6180ec9eabcSRichard Henderson 619e8996ee0Sbellard ts = &s->temps[idx]; 620e8996ee0Sbellard ts->temp_allocated = 1; 6217ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 6227ca4b752SRichard Henderson tcg_debug_assert(ts->temp_local == temp_local); 623e8996ee0Sbellard } else { 6247ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 6257ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 6267ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 6277ca4b752SRichard Henderson 628c896fe29Sbellard ts->base_type = type; 629c896fe29Sbellard ts->type = TCG_TYPE_I32; 630e8996ee0Sbellard ts->temp_allocated = 1; 631641d5fbeSbellard ts->temp_local = temp_local; 6327ca4b752SRichard Henderson 6337ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 6347ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 6357ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 6367ca4b752SRichard Henderson ts2->temp_allocated = 1; 6377ca4b752SRichard Henderson ts2->temp_local = temp_local; 6387ca4b752SRichard Henderson } else { 639c896fe29Sbellard ts->base_type = type; 640c896fe29Sbellard ts->type = type; 641e8996ee0Sbellard ts->temp_allocated = 1; 642641d5fbeSbellard ts->temp_local = temp_local; 643c896fe29Sbellard } 6447ca4b752SRichard Henderson idx = temp_idx(s, ts); 645e8996ee0Sbellard } 64627bfd83cSPeter Maydell 64727bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 64827bfd83cSPeter Maydell 
s->temps_in_use++; 64927bfd83cSPeter Maydell #endif 650a7812ae4Spbrook return idx; 651c896fe29Sbellard } 652c896fe29Sbellard 653a7812ae4Spbrook TCGv_i32 tcg_temp_new_internal_i32(int temp_local) 654a7812ae4Spbrook { 655a7812ae4Spbrook int idx; 656a7812ae4Spbrook 657a7812ae4Spbrook idx = tcg_temp_new_internal(TCG_TYPE_I32, temp_local); 658a7812ae4Spbrook return MAKE_TCGV_I32(idx); 659a7812ae4Spbrook } 660a7812ae4Spbrook 661a7812ae4Spbrook TCGv_i64 tcg_temp_new_internal_i64(int temp_local) 662a7812ae4Spbrook { 663a7812ae4Spbrook int idx; 664a7812ae4Spbrook 665a7812ae4Spbrook idx = tcg_temp_new_internal(TCG_TYPE_I64, temp_local); 666a7812ae4Spbrook return MAKE_TCGV_I64(idx); 667a7812ae4Spbrook } 668a7812ae4Spbrook 6690ec9eabcSRichard Henderson static void tcg_temp_free_internal(int idx) 670c896fe29Sbellard { 671c896fe29Sbellard TCGContext *s = &tcg_ctx; 672c896fe29Sbellard TCGTemp *ts; 673641d5fbeSbellard int k; 674c896fe29Sbellard 67527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 67627bfd83cSPeter Maydell s->temps_in_use--; 67727bfd83cSPeter Maydell if (s->temps_in_use < 0) { 67827bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 67927bfd83cSPeter Maydell } 68027bfd83cSPeter Maydell #endif 68127bfd83cSPeter Maydell 682eabb7b91SAurelien Jarno tcg_debug_assert(idx >= s->nb_globals && idx < s->nb_temps); 683c896fe29Sbellard ts = &s->temps[idx]; 684eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 685e8996ee0Sbellard ts->temp_allocated = 0; 6860ec9eabcSRichard Henderson 68718d13fa2SAlexander Graf k = ts->base_type + (ts->temp_local ? 
TCG_TYPE_COUNT : 0); 6880ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 689e8996ee0Sbellard } 690e8996ee0Sbellard 691a7812ae4Spbrook void tcg_temp_free_i32(TCGv_i32 arg) 692e8996ee0Sbellard { 693a7812ae4Spbrook tcg_temp_free_internal(GET_TCGV_I32(arg)); 694a7812ae4Spbrook } 695a7812ae4Spbrook 696a7812ae4Spbrook void tcg_temp_free_i64(TCGv_i64 arg) 697a7812ae4Spbrook { 698a7812ae4Spbrook tcg_temp_free_internal(GET_TCGV_I64(arg)); 699a7812ae4Spbrook } 700a7812ae4Spbrook 701a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 702a7812ae4Spbrook { 703a7812ae4Spbrook TCGv_i32 t0; 704a7812ae4Spbrook t0 = tcg_temp_new_i32(); 705e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 706e8996ee0Sbellard return t0; 707c896fe29Sbellard } 708c896fe29Sbellard 709a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 710c896fe29Sbellard { 711a7812ae4Spbrook TCGv_i64 t0; 712a7812ae4Spbrook t0 = tcg_temp_new_i64(); 713e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 714e8996ee0Sbellard return t0; 715c896fe29Sbellard } 716c896fe29Sbellard 717a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 718bdffd4a9Saurel32 { 719a7812ae4Spbrook TCGv_i32 t0; 720a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 721bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 722bdffd4a9Saurel32 return t0; 723bdffd4a9Saurel32 } 724bdffd4a9Saurel32 725a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 726bdffd4a9Saurel32 { 727a7812ae4Spbrook TCGv_i64 t0; 728a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 729bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 730bdffd4a9Saurel32 return t0; 731bdffd4a9Saurel32 } 732bdffd4a9Saurel32 73327bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 73427bfd83cSPeter Maydell void tcg_clear_temp_count(void) 73527bfd83cSPeter Maydell { 73627bfd83cSPeter Maydell TCGContext *s = &tcg_ctx; 73727bfd83cSPeter Maydell s->temps_in_use = 0; 73827bfd83cSPeter Maydell } 73927bfd83cSPeter Maydell 74027bfd83cSPeter Maydell int tcg_check_temp_count(void) 74127bfd83cSPeter Maydell { 74227bfd83cSPeter 
Maydell TCGContext *s = &tcg_ctx; 74327bfd83cSPeter Maydell if (s->temps_in_use) { 74427bfd83cSPeter Maydell /* Clear the count so that we don't give another 74527bfd83cSPeter Maydell * warning immediately next time around. 74627bfd83cSPeter Maydell */ 74727bfd83cSPeter Maydell s->temps_in_use = 0; 74827bfd83cSPeter Maydell return 1; 74927bfd83cSPeter Maydell } 75027bfd83cSPeter Maydell return 0; 75127bfd83cSPeter Maydell } 75227bfd83cSPeter Maydell #endif 75327bfd83cSPeter Maydell 754be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream. 755be0f34b5SRichard Henderson Test the runtime variable that controls each opcode. */ 756be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 757be0f34b5SRichard Henderson { 758be0f34b5SRichard Henderson switch (op) { 759be0f34b5SRichard Henderson case INDEX_op_discard: 760be0f34b5SRichard Henderson case INDEX_op_set_label: 761be0f34b5SRichard Henderson case INDEX_op_call: 762be0f34b5SRichard Henderson case INDEX_op_br: 763be0f34b5SRichard Henderson case INDEX_op_mb: 764be0f34b5SRichard Henderson case INDEX_op_insn_start: 765be0f34b5SRichard Henderson case INDEX_op_exit_tb: 766be0f34b5SRichard Henderson case INDEX_op_goto_tb: 767be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 768be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 769be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 770be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 771be0f34b5SRichard Henderson return true; 772be0f34b5SRichard Henderson 773be0f34b5SRichard Henderson case INDEX_op_goto_ptr: 774be0f34b5SRichard Henderson return TCG_TARGET_HAS_goto_ptr; 775be0f34b5SRichard Henderson 776be0f34b5SRichard Henderson case INDEX_op_mov_i32: 777be0f34b5SRichard Henderson case INDEX_op_movi_i32: 778be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 779be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 780be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 781be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 
782be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 783be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 784be0f34b5SRichard Henderson case INDEX_op_ld_i32: 785be0f34b5SRichard Henderson case INDEX_op_st8_i32: 786be0f34b5SRichard Henderson case INDEX_op_st16_i32: 787be0f34b5SRichard Henderson case INDEX_op_st_i32: 788be0f34b5SRichard Henderson case INDEX_op_add_i32: 789be0f34b5SRichard Henderson case INDEX_op_sub_i32: 790be0f34b5SRichard Henderson case INDEX_op_mul_i32: 791be0f34b5SRichard Henderson case INDEX_op_and_i32: 792be0f34b5SRichard Henderson case INDEX_op_or_i32: 793be0f34b5SRichard Henderson case INDEX_op_xor_i32: 794be0f34b5SRichard Henderson case INDEX_op_shl_i32: 795be0f34b5SRichard Henderson case INDEX_op_shr_i32: 796be0f34b5SRichard Henderson case INDEX_op_sar_i32: 797be0f34b5SRichard Henderson return true; 798be0f34b5SRichard Henderson 799be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 800be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 801be0f34b5SRichard Henderson case INDEX_op_div_i32: 802be0f34b5SRichard Henderson case INDEX_op_divu_i32: 803be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 804be0f34b5SRichard Henderson case INDEX_op_rem_i32: 805be0f34b5SRichard Henderson case INDEX_op_remu_i32: 806be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 807be0f34b5SRichard Henderson case INDEX_op_div2_i32: 808be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 809be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 810be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 811be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 812be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 813be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 814be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 815be0f34b5SRichard Henderson case INDEX_op_extract_i32: 816be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 817be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 818be0f34b5SRichard Henderson 
return TCG_TARGET_HAS_sextract_i32; 819be0f34b5SRichard Henderson case INDEX_op_add2_i32: 820be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 821be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 822be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 823be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 824be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 825be0f34b5SRichard Henderson case INDEX_op_muls2_i32: 826be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 827be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 828be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 829be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 830be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 831be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 832be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 833be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 834be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 835be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 836be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 837be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 838be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 839be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 840be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 841be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 842be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 843be0f34b5SRichard Henderson case INDEX_op_not_i32: 844be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 845be0f34b5SRichard Henderson case INDEX_op_neg_i32: 846be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 847be0f34b5SRichard Henderson case INDEX_op_andc_i32: 848be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 849be0f34b5SRichard Henderson case INDEX_op_orc_i32: 850be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 851be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 852be0f34b5SRichard 
Henderson return TCG_TARGET_HAS_eqv_i32; 853be0f34b5SRichard Henderson case INDEX_op_nand_i32: 854be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 855be0f34b5SRichard Henderson case INDEX_op_nor_i32: 856be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 857be0f34b5SRichard Henderson case INDEX_op_clz_i32: 858be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i32; 859be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 860be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 861be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 862be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 863be0f34b5SRichard Henderson 864be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 865be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 866be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 867be0f34b5SRichard Henderson 868be0f34b5SRichard Henderson case INDEX_op_mov_i64: 869be0f34b5SRichard Henderson case INDEX_op_movi_i64: 870be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 871be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 872be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 873be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 874be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 875be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 876be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 877be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 878be0f34b5SRichard Henderson case INDEX_op_ld_i64: 879be0f34b5SRichard Henderson case INDEX_op_st8_i64: 880be0f34b5SRichard Henderson case INDEX_op_st16_i64: 881be0f34b5SRichard Henderson case INDEX_op_st32_i64: 882be0f34b5SRichard Henderson case INDEX_op_st_i64: 883be0f34b5SRichard Henderson case INDEX_op_add_i64: 884be0f34b5SRichard Henderson case INDEX_op_sub_i64: 885be0f34b5SRichard Henderson case INDEX_op_mul_i64: 886be0f34b5SRichard Henderson case INDEX_op_and_i64: 887be0f34b5SRichard Henderson case INDEX_op_or_i64: 888be0f34b5SRichard Henderson case INDEX_op_xor_i64: 
889be0f34b5SRichard Henderson case INDEX_op_shl_i64: 890be0f34b5SRichard Henderson case INDEX_op_shr_i64: 891be0f34b5SRichard Henderson case INDEX_op_sar_i64: 892be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 893be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 894be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 895be0f34b5SRichard Henderson 896be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 897be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 898be0f34b5SRichard Henderson case INDEX_op_div_i64: 899be0f34b5SRichard Henderson case INDEX_op_divu_i64: 900be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 901be0f34b5SRichard Henderson case INDEX_op_rem_i64: 902be0f34b5SRichard Henderson case INDEX_op_remu_i64: 903be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 904be0f34b5SRichard Henderson case INDEX_op_div2_i64: 905be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 906be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 907be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 908be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 909be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 910be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 911be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 912be0f34b5SRichard Henderson case INDEX_op_extract_i64: 913be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 914be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 915be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 916be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 917be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 918be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 919be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 920be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 921be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 922be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 923be0f34b5SRichard Henderson return 
TCG_TARGET_HAS_ext16s_i64; 924be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 925be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 926be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 927be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 928be0f34b5SRichard Henderson case INDEX_op_ext16u_i64: 929be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 930be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 931be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 932be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 933be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 934be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 935be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 936be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 937be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 938be0f34b5SRichard Henderson case INDEX_op_not_i64: 939be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 940be0f34b5SRichard Henderson case INDEX_op_neg_i64: 941be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 942be0f34b5SRichard Henderson case INDEX_op_andc_i64: 943be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 944be0f34b5SRichard Henderson case INDEX_op_orc_i64: 945be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 946be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 947be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 948be0f34b5SRichard Henderson case INDEX_op_nand_i64: 949be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 950be0f34b5SRichard Henderson case INDEX_op_nor_i64: 951be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 952be0f34b5SRichard Henderson case INDEX_op_clz_i64: 953be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 954be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 955be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 956be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 957be0f34b5SRichard Henderson return 
TCG_TARGET_HAS_ctpop_i64; 958be0f34b5SRichard Henderson case INDEX_op_add2_i64: 959be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 960be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 961be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 962be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 963be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 964be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 965be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 966be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 967be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 968be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 969be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 970be0f34b5SRichard Henderson 971be0f34b5SRichard Henderson case NB_OPS: 972be0f34b5SRichard Henderson break; 973be0f34b5SRichard Henderson } 974be0f34b5SRichard Henderson g_assert_not_reached(); 975be0f34b5SRichard Henderson } 976be0f34b5SRichard Henderson 97739cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 97839cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 97939cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 980bbb8a1b4SRichard Henderson void tcg_gen_callN(TCGContext *s, void *func, TCGArg ret, 981bbb8a1b4SRichard Henderson int nargs, TCGArg *args) 982c896fe29Sbellard { 983c45cb8bbSRichard Henderson int i, real_args, nb_rets, pi, pi_first; 984bbb8a1b4SRichard Henderson unsigned sizemask, flags; 985afb49896SRichard Henderson TCGHelperInfo *info; 986afb49896SRichard Henderson 987619205fdSEmilio G. 
Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 988bbb8a1b4SRichard Henderson flags = info->flags; 989bbb8a1b4SRichard Henderson sizemask = info->sizemask; 9902bece2c8SRichard Henderson 99134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 99234b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 99334b1a49cSRichard Henderson /* We have 64-bit values in one register, but need to pass as two 99434b1a49cSRichard Henderson separate parameters. Split them. */ 99534b1a49cSRichard Henderson int orig_sizemask = sizemask; 99634b1a49cSRichard Henderson int orig_nargs = nargs; 99734b1a49cSRichard Henderson TCGv_i64 retl, reth; 99834b1a49cSRichard Henderson 99934b1a49cSRichard Henderson TCGV_UNUSED_I64(retl); 100034b1a49cSRichard Henderson TCGV_UNUSED_I64(reth); 100134b1a49cSRichard Henderson if (sizemask != 0) { 100234b1a49cSRichard Henderson TCGArg *split_args = __builtin_alloca(sizeof(TCGArg) * nargs * 2); 100334b1a49cSRichard Henderson for (i = real_args = 0; i < nargs; ++i) { 100434b1a49cSRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 100534b1a49cSRichard Henderson if (is_64bit) { 100634b1a49cSRichard Henderson TCGv_i64 orig = MAKE_TCGV_I64(args[i]); 100734b1a49cSRichard Henderson TCGv_i32 h = tcg_temp_new_i32(); 100834b1a49cSRichard Henderson TCGv_i32 l = tcg_temp_new_i32(); 100934b1a49cSRichard Henderson tcg_gen_extr_i64_i32(l, h, orig); 101034b1a49cSRichard Henderson split_args[real_args++] = GET_TCGV_I32(h); 101134b1a49cSRichard Henderson split_args[real_args++] = GET_TCGV_I32(l); 101234b1a49cSRichard Henderson } else { 101334b1a49cSRichard Henderson split_args[real_args++] = args[i]; 101434b1a49cSRichard Henderson } 101534b1a49cSRichard Henderson } 101634b1a49cSRichard Henderson nargs = real_args; 101734b1a49cSRichard Henderson args = split_args; 101834b1a49cSRichard Henderson sizemask = 0; 101934b1a49cSRichard Henderson } 102034b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && 
TCG_TARGET_REG_BITS == 64 10212bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 10222bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 10232bece2c8SRichard Henderson int is_signed = sizemask & (2 << (i+1)*2); 10242bece2c8SRichard Henderson if (!is_64bit) { 10252bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 10262bece2c8SRichard Henderson TCGv_i64 orig = MAKE_TCGV_I64(args[i]); 10272bece2c8SRichard Henderson if (is_signed) { 10282bece2c8SRichard Henderson tcg_gen_ext32s_i64(temp, orig); 10292bece2c8SRichard Henderson } else { 10302bece2c8SRichard Henderson tcg_gen_ext32u_i64(temp, orig); 10312bece2c8SRichard Henderson } 10322bece2c8SRichard Henderson args[i] = GET_TCGV_I64(temp); 10332bece2c8SRichard Henderson } 10342bece2c8SRichard Henderson } 10352bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 10362bece2c8SRichard Henderson 1037c45cb8bbSRichard Henderson pi_first = pi = s->gen_next_parm_idx; 1038a7812ae4Spbrook if (ret != TCG_CALL_DUMMY_ARG) { 103934b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 104034b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 104134b1a49cSRichard Henderson if (orig_sizemask & 1) { 104234b1a49cSRichard Henderson /* The 32-bit ABI is going to return the 64-bit value in 104334b1a49cSRichard Henderson the %o0/%o1 register pair. Prepare for this by using 104434b1a49cSRichard Henderson two return temporaries, and reassemble below. 
*/ 104534b1a49cSRichard Henderson retl = tcg_temp_new_i64(); 104634b1a49cSRichard Henderson reth = tcg_temp_new_i64(); 1047c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = GET_TCGV_I64(reth); 1048c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = GET_TCGV_I64(retl); 104934b1a49cSRichard Henderson nb_rets = 2; 105034b1a49cSRichard Henderson } else { 1051c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 105234b1a49cSRichard Henderson nb_rets = 1; 105334b1a49cSRichard Henderson } 105434b1a49cSRichard Henderson #else 105534b1a49cSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) { 105602eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 1057c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret + 1; 1058c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 1059a7812ae4Spbrook #else 1060c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 1061c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret + 1; 1062a7812ae4Spbrook #endif 1063a7812ae4Spbrook nb_rets = 2; 106434b1a49cSRichard Henderson } else { 1065c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = ret; 1066a7812ae4Spbrook nb_rets = 1; 1067a7812ae4Spbrook } 106834b1a49cSRichard Henderson #endif 1069a7812ae4Spbrook } else { 1070a7812ae4Spbrook nb_rets = 0; 1071a7812ae4Spbrook } 1072a7812ae4Spbrook real_args = 0; 1073a7812ae4Spbrook for (i = 0; i < nargs; i++) { 10742bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 1075bbb8a1b4SRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 107639cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS 107739cf05d3Sbellard /* some targets want aligned 64 bit args */ 1078ebd486d5Smalc if (real_args & 1) { 1079c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = TCG_CALL_DUMMY_ARG; 1080ebd486d5Smalc real_args++; 108139cf05d3Sbellard } 108239cf05d3Sbellard #endif 10833f90f252SRichard Henderson /* If stack grows up, then we will be placing successive 10843f90f252SRichard Henderson arguments at lower 
addresses, which means we need to 10853f90f252SRichard Henderson reverse the order compared to how we would normally 10863f90f252SRichard Henderson treat either big or little-endian. For those arguments 10873f90f252SRichard Henderson that will wind up in registers, this still works for 10883f90f252SRichard Henderson HPPA (the only current STACK_GROWSUP target) since the 10893f90f252SRichard Henderson argument registers are *also* allocated in decreasing 10903f90f252SRichard Henderson order. If another such target is added, this logic may 10913f90f252SRichard Henderson have to get more complicated to differentiate between 10923f90f252SRichard Henderson stack arguments and register arguments. */ 109302eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP) 1094c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i] + 1; 1095c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i]; 1096c896fe29Sbellard #else 1097c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i]; 1098c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i] + 1; 1099c896fe29Sbellard #endif 1100a7812ae4Spbrook real_args += 2; 11012bece2c8SRichard Henderson continue; 11022bece2c8SRichard Henderson } 11032bece2c8SRichard Henderson 1104c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = args[i]; 1105a7812ae4Spbrook real_args++; 1106c896fe29Sbellard } 1107c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = (uintptr_t)func; 1108c45cb8bbSRichard Henderson s->gen_opparam_buf[pi++] = flags; 1109a7812ae4Spbrook 1110c45cb8bbSRichard Henderson i = s->gen_next_op_idx; 1111c45cb8bbSRichard Henderson tcg_debug_assert(i < OPC_BUF_SIZE); 1112c45cb8bbSRichard Henderson tcg_debug_assert(pi <= OPPARAM_BUF_SIZE); 1113a7812ae4Spbrook 1114c45cb8bbSRichard Henderson /* Set links for sequential allocation during translation. 
*/ 1115c45cb8bbSRichard Henderson s->gen_op_buf[i] = (TCGOp){ 1116c45cb8bbSRichard Henderson .opc = INDEX_op_call, 1117c45cb8bbSRichard Henderson .callo = nb_rets, 1118c45cb8bbSRichard Henderson .calli = real_args, 1119c45cb8bbSRichard Henderson .args = pi_first, 1120c45cb8bbSRichard Henderson .prev = i - 1, 1121c45cb8bbSRichard Henderson .next = i + 1 1122c45cb8bbSRichard Henderson }; 1123c45cb8bbSRichard Henderson 1124c45cb8bbSRichard Henderson /* Make sure the calli field didn't overflow. */ 1125c45cb8bbSRichard Henderson tcg_debug_assert(s->gen_op_buf[i].calli == real_args); 1126c45cb8bbSRichard Henderson 1127dcb8e758SRichard Henderson s->gen_op_buf[0].prev = i; 1128c45cb8bbSRichard Henderson s->gen_next_op_idx = i + 1; 1129c45cb8bbSRichard Henderson s->gen_next_parm_idx = pi; 11302bece2c8SRichard Henderson 113134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 113234b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 113334b1a49cSRichard Henderson /* Free all of the parts we allocated above. */ 113434b1a49cSRichard Henderson for (i = real_args = 0; i < orig_nargs; ++i) { 113534b1a49cSRichard Henderson int is_64bit = orig_sizemask & (1 << (i+1)*2); 113634b1a49cSRichard Henderson if (is_64bit) { 113734b1a49cSRichard Henderson TCGv_i32 h = MAKE_TCGV_I32(args[real_args++]); 113834b1a49cSRichard Henderson TCGv_i32 l = MAKE_TCGV_I32(args[real_args++]); 113934b1a49cSRichard Henderson tcg_temp_free_i32(h); 114034b1a49cSRichard Henderson tcg_temp_free_i32(l); 114134b1a49cSRichard Henderson } else { 114234b1a49cSRichard Henderson real_args++; 114334b1a49cSRichard Henderson } 114434b1a49cSRichard Henderson } 114534b1a49cSRichard Henderson if (orig_sizemask & 1) { 114634b1a49cSRichard Henderson /* The 32-bit ABI returned two 32-bit pieces. Re-assemble them. 114734b1a49cSRichard Henderson Note that describing these as TCGv_i64 eliminates an unnecessary 114834b1a49cSRichard Henderson zero-extension that tcg_gen_concat_i32_i64 would create. 
*/ 114934b1a49cSRichard Henderson tcg_gen_concat32_i64(MAKE_TCGV_I64(ret), retl, reth); 115034b1a49cSRichard Henderson tcg_temp_free_i64(retl); 115134b1a49cSRichard Henderson tcg_temp_free_i64(reth); 115234b1a49cSRichard Henderson } 115334b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 11542bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 11552bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 11562bece2c8SRichard Henderson if (!is_64bit) { 11572bece2c8SRichard Henderson TCGv_i64 temp = MAKE_TCGV_I64(args[i]); 11582bece2c8SRichard Henderson tcg_temp_free_i64(temp); 11592bece2c8SRichard Henderson } 11602bece2c8SRichard Henderson } 11612bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1162a7812ae4Spbrook } 1163c896fe29Sbellard 11648fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1165c896fe29Sbellard { 1166c896fe29Sbellard int i; 1167c896fe29Sbellard TCGTemp *ts; 1168c896fe29Sbellard for(i = 0; i < s->nb_globals; i++) { 1169c896fe29Sbellard ts = &s->temps[i]; 1170c896fe29Sbellard if (ts->fixed_reg) { 1171c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 1172c896fe29Sbellard } else { 1173c896fe29Sbellard ts->val_type = TEMP_VAL_MEM; 1174c896fe29Sbellard } 1175c896fe29Sbellard } 1176e8996ee0Sbellard for(i = s->nb_globals; i < s->nb_temps; i++) { 1177e8996ee0Sbellard ts = &s->temps[i]; 11787dfd8c6aSAurelien Jarno if (ts->temp_local) { 11797dfd8c6aSAurelien Jarno ts->val_type = TEMP_VAL_MEM; 11807dfd8c6aSAurelien Jarno } else { 1181e8996ee0Sbellard ts->val_type = TEMP_VAL_DEAD; 11827dfd8c6aSAurelien Jarno } 1183e8996ee0Sbellard ts->mem_allocated = 0; 1184e8996ee0Sbellard ts->fixed_reg = 0; 1185e8996ee0Sbellard } 1186f8b2f202SRichard Henderson 1187f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1188c896fe29Sbellard } 1189c896fe29Sbellard 1190f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 
1191f8b2f202SRichard Henderson TCGTemp *ts) 1192c896fe29Sbellard { 1193f8b2f202SRichard Henderson int idx = temp_idx(s, ts); 1194ac56dd48Spbrook 1195ac56dd48Spbrook if (idx < s->nb_globals) { 1196ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1197f8b2f202SRichard Henderson } else if (ts->temp_local) { 1198641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1199f8b2f202SRichard Henderson } else { 1200ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1201c896fe29Sbellard } 1202c896fe29Sbellard return buf; 1203c896fe29Sbellard } 1204c896fe29Sbellard 1205f8b2f202SRichard Henderson static char *tcg_get_arg_str_idx(TCGContext *s, char *buf, 1206f8b2f202SRichard Henderson int buf_size, int idx) 1207f8b2f202SRichard Henderson { 1208eabb7b91SAurelien Jarno tcg_debug_assert(idx >= 0 && idx < s->nb_temps); 1209f8b2f202SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, &s->temps[idx]); 1210f8b2f202SRichard Henderson } 1211f8b2f202SRichard Henderson 12126e085f72SRichard Henderson /* Find helper name. */ 12136e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val) 1214e8996ee0Sbellard { 12156e085f72SRichard Henderson const char *ret = NULL; 1216619205fdSEmilio G. Cota if (helper_table) { 1217619205fdSEmilio G. 
Cota TCGHelperInfo *info = g_hash_table_lookup(helper_table, (gpointer)val); 121872866e82SRichard Henderson if (info) { 121972866e82SRichard Henderson ret = info->name; 122072866e82SRichard Henderson } 1221e8996ee0Sbellard } 12226e085f72SRichard Henderson return ret; 12234dc81f28Sbellard } 12244dc81f28Sbellard 1225f48f3edeSblueswir1 static const char * const cond_name[] = 1226f48f3edeSblueswir1 { 12270aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 12280aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1229f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1230f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1231f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1232f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1233f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1234f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1235f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1236f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1237f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1238f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1239f48f3edeSblueswir1 }; 1240f48f3edeSblueswir1 1241f713d6adSRichard Henderson static const char * const ldst_name[] = 1242f713d6adSRichard Henderson { 1243f713d6adSRichard Henderson [MO_UB] = "ub", 1244f713d6adSRichard Henderson [MO_SB] = "sb", 1245f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1246f713d6adSRichard Henderson [MO_LESW] = "lesw", 1247f713d6adSRichard Henderson [MO_LEUL] = "leul", 1248f713d6adSRichard Henderson [MO_LESL] = "lesl", 1249f713d6adSRichard Henderson [MO_LEQ] = "leq", 1250f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1251f713d6adSRichard Henderson [MO_BESW] = "besw", 1252f713d6adSRichard Henderson [MO_BEUL] = "beul", 1253f713d6adSRichard Henderson [MO_BESL] = "besl", 1254f713d6adSRichard Henderson [MO_BEQ] = "beq", 1255f713d6adSRichard Henderson }; 1256f713d6adSRichard Henderson 12571f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 12581f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY 12591f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = 
"un+", 12601f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 12611f00b27fSSergey Sorokin #else 12621f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 12631f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 12641f00b27fSSergey Sorokin #endif 12651f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 12661f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 12671f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 12681f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 12691f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 12701f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 12711f00b27fSSergey Sorokin }; 12721f00b27fSSergey Sorokin 1273eeacee4dSBlue Swirl void tcg_dump_ops(TCGContext *s) 1274c896fe29Sbellard { 1275c896fe29Sbellard char buf[128]; 1276c45cb8bbSRichard Henderson TCGOp *op; 1277c45cb8bbSRichard Henderson int oi; 1278c896fe29Sbellard 1279dcb8e758SRichard Henderson for (oi = s->gen_op_buf[0].next; oi != 0; oi = op->next) { 1280c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1281c45cb8bbSRichard Henderson const TCGOpDef *def; 1282c45cb8bbSRichard Henderson const TCGArg *args; 1283c45cb8bbSRichard Henderson TCGOpcode c; 1284bdfb460eSRichard Henderson int col = 0; 1285c45cb8bbSRichard Henderson 1286c45cb8bbSRichard Henderson op = &s->gen_op_buf[oi]; 1287c45cb8bbSRichard Henderson c = op->opc; 1288c896fe29Sbellard def = &tcg_op_defs[c]; 1289c45cb8bbSRichard Henderson args = &s->gen_opparam_buf[op->args]; 1290c45cb8bbSRichard Henderson 1291765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 1292bdfb460eSRichard Henderson col += qemu_log("%s ----", oi != s->gen_op_buf[0].next ? 
"\n" : ""); 12939aef40edSRichard Henderson 12949aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 12959aef40edSRichard Henderson target_ulong a; 12967e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 12979aef40edSRichard Henderson a = ((target_ulong)args[i * 2 + 1] << 32) | args[i * 2]; 12987e4597d7Sbellard #else 12999aef40edSRichard Henderson a = args[i]; 13007e4597d7Sbellard #endif 1301bdfb460eSRichard Henderson col += qemu_log(" " TARGET_FMT_lx, a); 1302eeacee4dSBlue Swirl } 13037e4597d7Sbellard } else if (c == INDEX_op_call) { 1304c896fe29Sbellard /* variable number of arguments */ 1305c45cb8bbSRichard Henderson nb_oargs = op->callo; 1306c45cb8bbSRichard Henderson nb_iargs = op->calli; 1307c896fe29Sbellard nb_cargs = def->nb_cargs; 1308b03cce8eSbellard 1309cf066674SRichard Henderson /* function name, flags, out args */ 1310bdfb460eSRichard Henderson col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name, 1311cf066674SRichard Henderson tcg_find_helper(s, args[nb_oargs + nb_iargs]), 1312cf066674SRichard Henderson args[nb_oargs + nb_iargs + 1], nb_oargs); 1313b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 1314bdfb460eSRichard Henderson col += qemu_log(",%s", tcg_get_arg_str_idx(s, buf, sizeof(buf), 1315eeacee4dSBlue Swirl args[i])); 1316b03cce8eSbellard } 1317cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1318cf066674SRichard Henderson TCGArg arg = args[nb_oargs + i]; 1319cf066674SRichard Henderson const char *t = "<dummy>"; 1320cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 1321cf066674SRichard Henderson t = tcg_get_arg_str_idx(s, buf, sizeof(buf), arg); 1322b03cce8eSbellard } 1323bdfb460eSRichard Henderson col += qemu_log(",%s", t); 1324e8996ee0Sbellard } 1325b03cce8eSbellard } else { 1326bdfb460eSRichard Henderson col += qemu_log(" %s ", def->name); 1327c45cb8bbSRichard Henderson 1328c896fe29Sbellard nb_oargs = def->nb_oargs; 1329c896fe29Sbellard nb_iargs = def->nb_iargs; 1330c896fe29Sbellard 
nb_cargs = def->nb_cargs; 1331c896fe29Sbellard 1332c896fe29Sbellard k = 0; 1333c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1334eeacee4dSBlue Swirl if (k != 0) { 1335bdfb460eSRichard Henderson col += qemu_log(","); 1336eeacee4dSBlue Swirl } 1337bdfb460eSRichard Henderson col += qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf), 1338eeacee4dSBlue Swirl args[k++])); 1339c896fe29Sbellard } 1340c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1341eeacee4dSBlue Swirl if (k != 0) { 1342bdfb460eSRichard Henderson col += qemu_log(","); 1343eeacee4dSBlue Swirl } 1344bdfb460eSRichard Henderson col += qemu_log("%s", tcg_get_arg_str_idx(s, buf, sizeof(buf), 1345eeacee4dSBlue Swirl args[k++])); 1346c896fe29Sbellard } 1347be210acbSRichard Henderson switch (c) { 1348be210acbSRichard Henderson case INDEX_op_brcond_i32: 1349ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1350ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1351be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1352be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1353ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1354be210acbSRichard Henderson case INDEX_op_setcond_i64: 1355ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1356eeacee4dSBlue Swirl if (args[k] < ARRAY_SIZE(cond_name) && cond_name[args[k]]) { 1357bdfb460eSRichard Henderson col += qemu_log(",%s", cond_name[args[k++]]); 1358eeacee4dSBlue Swirl } else { 1359bdfb460eSRichard Henderson col += qemu_log(",$0x%" TCG_PRIlx, args[k++]); 1360eeacee4dSBlue Swirl } 1361f48f3edeSblueswir1 i = 1; 1362be210acbSRichard Henderson break; 1363f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1364f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 1365f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 1366f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 136759227d5dSRichard Henderson { 136859227d5dSRichard Henderson TCGMemOpIdx oi = args[k++]; 136959227d5dSRichard Henderson TCGMemOp op = get_memop(oi); 
137059227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 137159227d5dSRichard Henderson 137259c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 1373bdfb460eSRichard Henderson col += qemu_log(",$0x%x,%u", op, ix); 137459c4b7e8SRichard Henderson } else { 13751f00b27fSSergey Sorokin const char *s_al, *s_op; 13761f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 137759c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 1378bdfb460eSRichard Henderson col += qemu_log(",%s%s,%u", s_al, s_op, ix); 1379f713d6adSRichard Henderson } 1380f713d6adSRichard Henderson i = 1; 138159227d5dSRichard Henderson } 1382f713d6adSRichard Henderson break; 1383be210acbSRichard Henderson default: 1384f48f3edeSblueswir1 i = 0; 1385be210acbSRichard Henderson break; 1386be210acbSRichard Henderson } 138751e3972cSRichard Henderson switch (c) { 138851e3972cSRichard Henderson case INDEX_op_set_label: 138951e3972cSRichard Henderson case INDEX_op_br: 139051e3972cSRichard Henderson case INDEX_op_brcond_i32: 139151e3972cSRichard Henderson case INDEX_op_brcond_i64: 139251e3972cSRichard Henderson case INDEX_op_brcond2_i32: 1393bdfb460eSRichard Henderson col += qemu_log("%s$L%d", k ? "," : "", arg_label(args[k])->id); 139451e3972cSRichard Henderson i++, k++; 139551e3972cSRichard Henderson break; 139651e3972cSRichard Henderson default: 139751e3972cSRichard Henderson break; 1398eeacee4dSBlue Swirl } 139951e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 1400bdfb460eSRichard Henderson col += qemu_log("%s$0x%" TCG_PRIlx, k ? 
"," : "", args[k]); 1401bdfb460eSRichard Henderson } 1402bdfb460eSRichard Henderson } 1403bdfb460eSRichard Henderson if (op->life) { 1404bdfb460eSRichard Henderson unsigned life = op->life; 1405bdfb460eSRichard Henderson 1406bdfb460eSRichard Henderson for (; col < 48; ++col) { 1407bdfb460eSRichard Henderson putc(' ', qemu_logfile); 1408bdfb460eSRichard Henderson } 1409bdfb460eSRichard Henderson 1410bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 1411bdfb460eSRichard Henderson qemu_log(" sync:"); 1412bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 1413bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 1414bdfb460eSRichard Henderson qemu_log(" %d", i); 1415bdfb460eSRichard Henderson } 1416bdfb460eSRichard Henderson } 1417bdfb460eSRichard Henderson } 1418bdfb460eSRichard Henderson life /= DEAD_ARG; 1419bdfb460eSRichard Henderson if (life) { 1420bdfb460eSRichard Henderson qemu_log(" dead:"); 1421bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 1422bdfb460eSRichard Henderson if (life & 1) { 1423bdfb460eSRichard Henderson qemu_log(" %d", i); 1424bdfb460eSRichard Henderson } 1425bdfb460eSRichard Henderson } 1426c896fe29Sbellard } 1427b03cce8eSbellard } 1428eeacee4dSBlue Swirl qemu_log("\n"); 1429c896fe29Sbellard } 1430c896fe29Sbellard } 1431c896fe29Sbellard 1432c896fe29Sbellard /* we give more priority to constraints with less registers */ 1433c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 1434c896fe29Sbellard { 1435c896fe29Sbellard const TCGArgConstraint *arg_ct; 1436c896fe29Sbellard 1437c896fe29Sbellard int i, n; 1438c896fe29Sbellard arg_ct = &def->args_ct[k]; 1439c896fe29Sbellard if (arg_ct->ct & TCG_CT_ALIAS) { 1440c896fe29Sbellard /* an alias is equivalent to a single register */ 1441c896fe29Sbellard n = 1; 1442c896fe29Sbellard } else { 1443c896fe29Sbellard if (!(arg_ct->ct & TCG_CT_REG)) 1444c896fe29Sbellard return 0; 1445c896fe29Sbellard n = 0; 1446c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; 
i++) { 1447c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, i)) 1448c896fe29Sbellard n++; 1449c896fe29Sbellard } 1450c896fe29Sbellard } 1451c896fe29Sbellard return TCG_TARGET_NB_REGS - n + 1; 1452c896fe29Sbellard } 1453c896fe29Sbellard 1454c896fe29Sbellard /* sort from highest priority to lowest */ 1455c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 1456c896fe29Sbellard { 1457c896fe29Sbellard int i, j, p1, p2, tmp; 1458c896fe29Sbellard 1459c896fe29Sbellard for(i = 0; i < n; i++) 1460c896fe29Sbellard def->sorted_args[start + i] = start + i; 1461c896fe29Sbellard if (n <= 1) 1462c896fe29Sbellard return; 1463c896fe29Sbellard for(i = 0; i < n - 1; i++) { 1464c896fe29Sbellard for(j = i + 1; j < n; j++) { 1465c896fe29Sbellard p1 = get_constraint_priority(def, def->sorted_args[start + i]); 1466c896fe29Sbellard p2 = get_constraint_priority(def, def->sorted_args[start + j]); 1467c896fe29Sbellard if (p1 < p2) { 1468c896fe29Sbellard tmp = def->sorted_args[start + i]; 1469c896fe29Sbellard def->sorted_args[start + i] = def->sorted_args[start + j]; 1470c896fe29Sbellard def->sorted_args[start + j] = tmp; 1471c896fe29Sbellard } 1472c896fe29Sbellard } 1473c896fe29Sbellard } 1474c896fe29Sbellard } 1475c896fe29Sbellard 1476f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 1477c896fe29Sbellard { 1478a9751609SRichard Henderson TCGOpcode op; 1479c896fe29Sbellard 1480f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 1481f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 1482f69d277eSRichard Henderson const TCGTargetOpDef *tdefs; 1483069ea736SRichard Henderson TCGType type; 1484069ea736SRichard Henderson int i, nb_args; 1485f69d277eSRichard Henderson 1486f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 1487f69d277eSRichard Henderson continue; 1488f69d277eSRichard Henderson } 1489f69d277eSRichard Henderson 1490c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 1491f69d277eSRichard 
Henderson if (nb_args == 0) { 1492f69d277eSRichard Henderson continue; 1493f69d277eSRichard Henderson } 1494f69d277eSRichard Henderson 1495f69d277eSRichard Henderson tdefs = tcg_target_op_def(op); 1496f69d277eSRichard Henderson /* Missing TCGTargetOpDef entry. */ 1497f69d277eSRichard Henderson tcg_debug_assert(tdefs != NULL); 1498f69d277eSRichard Henderson 1499069ea736SRichard Henderson type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32); 1500c896fe29Sbellard for (i = 0; i < nb_args; i++) { 1501f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 1502f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 1503eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 1504f69d277eSRichard Henderson 1505ccb1bb66SRichard Henderson def->args_ct[i].u.regs = 0; 1506c896fe29Sbellard def->args_ct[i].ct = 0; 150717280ff4SRichard Henderson while (*ct_str != '\0') { 150817280ff4SRichard Henderson switch(*ct_str) { 150917280ff4SRichard Henderson case '0' ... '9': 151017280ff4SRichard Henderson { 151117280ff4SRichard Henderson int oarg = *ct_str - '0'; 151217280ff4SRichard Henderson tcg_debug_assert(ct_str == tdefs->args_ct_str[i]); 1513eabb7b91SAurelien Jarno tcg_debug_assert(oarg < def->nb_oargs); 1514eabb7b91SAurelien Jarno tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG); 151517280ff4SRichard Henderson /* TCG_CT_ALIAS is for the output arguments. 151617280ff4SRichard Henderson The input is tagged with TCG_CT_IALIAS. 
*/ 1517c896fe29Sbellard def->args_ct[i] = def->args_ct[oarg]; 151817280ff4SRichard Henderson def->args_ct[oarg].ct |= TCG_CT_ALIAS; 15195ff9d6a4Sbellard def->args_ct[oarg].alias_index = i; 1520c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_IALIAS; 15215ff9d6a4Sbellard def->args_ct[i].alias_index = oarg; 152217280ff4SRichard Henderson } 152317280ff4SRichard Henderson ct_str++; 1524c896fe29Sbellard break; 152582790a87SRichard Henderson case '&': 152682790a87SRichard Henderson def->args_ct[i].ct |= TCG_CT_NEWREG; 152782790a87SRichard Henderson ct_str++; 152882790a87SRichard Henderson break; 1529c896fe29Sbellard case 'i': 1530c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 1531c896fe29Sbellard ct_str++; 1532c896fe29Sbellard break; 1533c896fe29Sbellard default: 1534069ea736SRichard Henderson ct_str = target_parse_constraint(&def->args_ct[i], 1535069ea736SRichard Henderson ct_str, type); 1536f69d277eSRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 1537069ea736SRichard Henderson tcg_debug_assert(ct_str != NULL); 1538c896fe29Sbellard } 1539c896fe29Sbellard } 1540c896fe29Sbellard } 1541c896fe29Sbellard 1542c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? */ 1543eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 1544c68aaa18SStefan Weil 1545c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 1546c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 1547c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 1548c896fe29Sbellard } 1549c896fe29Sbellard } 1550c896fe29Sbellard 15510c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 15520c627cdcSRichard Henderson { 15530c627cdcSRichard Henderson int next = op->next; 15540c627cdcSRichard Henderson int prev = op->prev; 15550c627cdcSRichard Henderson 1556dcb8e758SRichard Henderson /* We should never attempt to remove the list terminator. 
*/ 1557dcb8e758SRichard Henderson tcg_debug_assert(op != &s->gen_op_buf[0]); 15580c627cdcSRichard Henderson 1559dcb8e758SRichard Henderson s->gen_op_buf[next].prev = prev; 1560dcb8e758SRichard Henderson s->gen_op_buf[prev].next = next; 1561dcb8e758SRichard Henderson 1562dcb8e758SRichard Henderson memset(op, 0, sizeof(*op)); 15630c627cdcSRichard Henderson 15640c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 15650c627cdcSRichard Henderson s->del_op_count++; 15660c627cdcSRichard Henderson #endif 15670c627cdcSRichard Henderson } 15680c627cdcSRichard Henderson 15695a18407fSRichard Henderson TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, 15705a18407fSRichard Henderson TCGOpcode opc, int nargs) 15715a18407fSRichard Henderson { 15725a18407fSRichard Henderson int oi = s->gen_next_op_idx; 15735a18407fSRichard Henderson int pi = s->gen_next_parm_idx; 15745a18407fSRichard Henderson int prev = old_op->prev; 15755a18407fSRichard Henderson int next = old_op - s->gen_op_buf; 15765a18407fSRichard Henderson TCGOp *new_op; 15775a18407fSRichard Henderson 15785a18407fSRichard Henderson tcg_debug_assert(oi < OPC_BUF_SIZE); 15795a18407fSRichard Henderson tcg_debug_assert(pi + nargs <= OPPARAM_BUF_SIZE); 15805a18407fSRichard Henderson s->gen_next_op_idx = oi + 1; 15815a18407fSRichard Henderson s->gen_next_parm_idx = pi + nargs; 15825a18407fSRichard Henderson 15835a18407fSRichard Henderson new_op = &s->gen_op_buf[oi]; 15845a18407fSRichard Henderson *new_op = (TCGOp){ 15855a18407fSRichard Henderson .opc = opc, 15865a18407fSRichard Henderson .args = pi, 15875a18407fSRichard Henderson .prev = prev, 15885a18407fSRichard Henderson .next = next 15895a18407fSRichard Henderson }; 15905a18407fSRichard Henderson s->gen_op_buf[prev].next = oi; 15915a18407fSRichard Henderson old_op->prev = oi; 15925a18407fSRichard Henderson 15935a18407fSRichard Henderson return new_op; 15945a18407fSRichard Henderson } 15955a18407fSRichard Henderson 15965a18407fSRichard Henderson TCGOp 
*tcg_op_insert_after(TCGContext *s, TCGOp *old_op, 15975a18407fSRichard Henderson TCGOpcode opc, int nargs) 15985a18407fSRichard Henderson { 15995a18407fSRichard Henderson int oi = s->gen_next_op_idx; 16005a18407fSRichard Henderson int pi = s->gen_next_parm_idx; 16015a18407fSRichard Henderson int prev = old_op - s->gen_op_buf; 16025a18407fSRichard Henderson int next = old_op->next; 16035a18407fSRichard Henderson TCGOp *new_op; 16045a18407fSRichard Henderson 16055a18407fSRichard Henderson tcg_debug_assert(oi < OPC_BUF_SIZE); 16065a18407fSRichard Henderson tcg_debug_assert(pi + nargs <= OPPARAM_BUF_SIZE); 16075a18407fSRichard Henderson s->gen_next_op_idx = oi + 1; 16085a18407fSRichard Henderson s->gen_next_parm_idx = pi + nargs; 16095a18407fSRichard Henderson 16105a18407fSRichard Henderson new_op = &s->gen_op_buf[oi]; 16115a18407fSRichard Henderson *new_op = (TCGOp){ 16125a18407fSRichard Henderson .opc = opc, 16135a18407fSRichard Henderson .args = pi, 16145a18407fSRichard Henderson .prev = prev, 16155a18407fSRichard Henderson .next = next 16165a18407fSRichard Henderson }; 16175a18407fSRichard Henderson s->gen_op_buf[next].prev = oi; 16185a18407fSRichard Henderson old_op->next = oi; 16195a18407fSRichard Henderson 16205a18407fSRichard Henderson return new_op; 16215a18407fSRichard Henderson } 16225a18407fSRichard Henderson 1623c70fbf0aSRichard Henderson #define TS_DEAD 1 1624c70fbf0aSRichard Henderson #define TS_MEM 2 1625c70fbf0aSRichard Henderson 16265a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 16275a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 16285a18407fSRichard Henderson 16299c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 16309c43b68dSAurelien Jarno should be in memory. 
*/ 1631c70fbf0aSRichard Henderson static inline void tcg_la_func_end(TCGContext *s, uint8_t *temp_state) 1632c896fe29Sbellard { 1633c70fbf0aSRichard Henderson memset(temp_state, TS_DEAD | TS_MEM, s->nb_globals); 1634c70fbf0aSRichard Henderson memset(temp_state + s->nb_globals, TS_DEAD, s->nb_temps - s->nb_globals); 1635c896fe29Sbellard } 1636c896fe29Sbellard 16379c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 16389c43b68dSAurelien Jarno and local temps should be in memory. */ 1639c70fbf0aSRichard Henderson static inline void tcg_la_bb_end(TCGContext *s, uint8_t *temp_state) 1640641d5fbeSbellard { 1641c70fbf0aSRichard Henderson int i, n; 1642641d5fbeSbellard 1643c70fbf0aSRichard Henderson tcg_la_func_end(s, temp_state); 1644c70fbf0aSRichard Henderson for (i = s->nb_globals, n = s->nb_temps; i < n; i++) { 1645c70fbf0aSRichard Henderson if (s->temps[i].temp_local) { 1646c70fbf0aSRichard Henderson temp_state[i] |= TS_MEM; 1647c70fbf0aSRichard Henderson } 1648641d5fbeSbellard } 1649641d5fbeSbellard } 1650641d5fbeSbellard 1651a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 1652c896fe29Sbellard given input arguments is dead. Instructions updating dead 1653c896fe29Sbellard temporaries are removed. 
*/ 16545a18407fSRichard Henderson static void liveness_pass_1(TCGContext *s, uint8_t *temp_state) 1655c896fe29Sbellard { 1656c70fbf0aSRichard Henderson int nb_globals = s->nb_globals; 16575a18407fSRichard Henderson int oi, oi_prev; 1658c896fe29Sbellard 1659c70fbf0aSRichard Henderson tcg_la_func_end(s, temp_state); 1660c896fe29Sbellard 1661dcb8e758SRichard Henderson for (oi = s->gen_op_buf[0].prev; oi != 0; oi = oi_prev) { 1662c45cb8bbSRichard Henderson int i, nb_iargs, nb_oargs; 1663c45cb8bbSRichard Henderson TCGOpcode opc_new, opc_new2; 1664c45cb8bbSRichard Henderson bool have_opc_new2; 1665a1b3c48dSRichard Henderson TCGLifeData arg_life = 0; 1666c45cb8bbSRichard Henderson TCGArg arg; 1667c45cb8bbSRichard Henderson 1668c45cb8bbSRichard Henderson TCGOp * const op = &s->gen_op_buf[oi]; 1669c45cb8bbSRichard Henderson TCGArg * const args = &s->gen_opparam_buf[op->args]; 1670c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 1671c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 1672c45cb8bbSRichard Henderson 1673c45cb8bbSRichard Henderson oi_prev = op->prev; 1674c45cb8bbSRichard Henderson 1675c45cb8bbSRichard Henderson switch (opc) { 1676c896fe29Sbellard case INDEX_op_call: 1677c6e113f5Sbellard { 1678c6e113f5Sbellard int call_flags; 1679c6e113f5Sbellard 1680c45cb8bbSRichard Henderson nb_oargs = op->callo; 1681c45cb8bbSRichard Henderson nb_iargs = op->calli; 1682cf066674SRichard Henderson call_flags = args[nb_oargs + nb_iargs + 1]; 1683c6e113f5Sbellard 1684c45cb8bbSRichard Henderson /* pure functions can be removed if their result is unused */ 168578505279SAurelien Jarno if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) { 1686c6e113f5Sbellard for (i = 0; i < nb_oargs; i++) { 1687c6e113f5Sbellard arg = args[i]; 1688c70fbf0aSRichard Henderson if (temp_state[arg] != TS_DEAD) { 1689c6e113f5Sbellard goto do_not_remove_call; 1690c6e113f5Sbellard } 16919c43b68dSAurelien Jarno } 1692c45cb8bbSRichard Henderson goto do_remove; 1693c6e113f5Sbellard } else { 
1694c6e113f5Sbellard do_not_remove_call: 1695c896fe29Sbellard 1696c896fe29Sbellard /* output args are dead */ 1697c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1698c896fe29Sbellard arg = args[i]; 1699c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1700a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 17016b64b624SAurelien Jarno } 1702c70fbf0aSRichard Henderson if (temp_state[arg] & TS_MEM) { 1703a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 17049c43b68dSAurelien Jarno } 1705c70fbf0aSRichard Henderson temp_state[arg] = TS_DEAD; 1706c896fe29Sbellard } 1707c896fe29Sbellard 170878505279SAurelien Jarno if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS | 170978505279SAurelien Jarno TCG_CALL_NO_READ_GLOBALS))) { 17109c43b68dSAurelien Jarno /* globals should go back to memory */ 1711c70fbf0aSRichard Henderson memset(temp_state, TS_DEAD | TS_MEM, nb_globals); 1712c70fbf0aSRichard Henderson } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) { 1713c70fbf0aSRichard Henderson /* globals should be synced to memory */ 1714c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 1715c70fbf0aSRichard Henderson temp_state[i] |= TS_MEM; 1716c70fbf0aSRichard Henderson } 1717b9c18f56Saurel32 } 1718c896fe29Sbellard 1719c19f47bfSAurelien Jarno /* record arguments that die in this helper */ 1720866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 1721866cb6cbSAurelien Jarno arg = args[i]; 172239cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 1723c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1724a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 1725c896fe29Sbellard } 1726c896fe29Sbellard } 172739cf05d3Sbellard } 172867cc32ebSVeres Lajos /* input arguments are live for preceding opcodes */ 1729c70fbf0aSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 1730c19f47bfSAurelien Jarno arg = args[i]; 1731c70fbf0aSRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 1732c70fbf0aSRichard Henderson temp_state[arg] 
&= ~TS_DEAD; 1733c70fbf0aSRichard Henderson } 1734c19f47bfSAurelien Jarno } 1735c6e113f5Sbellard } 1736c6e113f5Sbellard } 1737c896fe29Sbellard break; 1738765b842aSRichard Henderson case INDEX_op_insn_start: 1739c896fe29Sbellard break; 17405ff9d6a4Sbellard case INDEX_op_discard: 17415ff9d6a4Sbellard /* mark the temporary as dead */ 1742c70fbf0aSRichard Henderson temp_state[args[0]] = TS_DEAD; 17435ff9d6a4Sbellard break; 17441305c451SRichard Henderson 17451305c451SRichard Henderson case INDEX_op_add2_i32: 1746c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i32; 1747f1fae40cSRichard Henderson goto do_addsub2; 17481305c451SRichard Henderson case INDEX_op_sub2_i32: 1749c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i32; 1750f1fae40cSRichard Henderson goto do_addsub2; 1751f1fae40cSRichard Henderson case INDEX_op_add2_i64: 1752c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i64; 1753f1fae40cSRichard Henderson goto do_addsub2; 1754f1fae40cSRichard Henderson case INDEX_op_sub2_i64: 1755c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i64; 1756f1fae40cSRichard Henderson do_addsub2: 17571305c451SRichard Henderson nb_iargs = 4; 17581305c451SRichard Henderson nb_oargs = 2; 17591305c451SRichard Henderson /* Test if the high part of the operation is dead, but not 17601305c451SRichard Henderson the low part. The result can be optimized to a simple 17611305c451SRichard Henderson add or sub. This happens often for x86_64 guest when the 17621305c451SRichard Henderson cpu mode is set to 32 bit. */ 1763c70fbf0aSRichard Henderson if (temp_state[args[1]] == TS_DEAD) { 1764c70fbf0aSRichard Henderson if (temp_state[args[0]] == TS_DEAD) { 17651305c451SRichard Henderson goto do_remove; 17661305c451SRichard Henderson } 1767c45cb8bbSRichard Henderson /* Replace the opcode and adjust the args in place, 1768c45cb8bbSRichard Henderson leaving 3 unused args at the end. 
*/ 1769c45cb8bbSRichard Henderson op->opc = opc = opc_new; 17701305c451SRichard Henderson args[1] = args[2]; 17711305c451SRichard Henderson args[2] = args[4]; 17721305c451SRichard Henderson /* Fall through and mark the single-word operation live. */ 17731305c451SRichard Henderson nb_iargs = 2; 17741305c451SRichard Henderson nb_oargs = 1; 17751305c451SRichard Henderson } 17761305c451SRichard Henderson goto do_not_remove; 17771305c451SRichard Henderson 17781414968aSRichard Henderson case INDEX_op_mulu2_i32: 1779c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 1780c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i32; 1781c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i32; 178203271524SRichard Henderson goto do_mul2; 1783f1fae40cSRichard Henderson case INDEX_op_muls2_i32: 1784c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 1785c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i32; 1786c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i32; 1787f1fae40cSRichard Henderson goto do_mul2; 1788f1fae40cSRichard Henderson case INDEX_op_mulu2_i64: 1789c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 1790c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i64; 1791c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i64; 179203271524SRichard Henderson goto do_mul2; 1793f1fae40cSRichard Henderson case INDEX_op_muls2_i64: 1794c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 1795c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i64; 1796c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i64; 179703271524SRichard Henderson goto do_mul2; 1798f1fae40cSRichard Henderson do_mul2: 17991414968aSRichard Henderson nb_iargs = 2; 18001414968aSRichard Henderson nb_oargs = 2; 1801c70fbf0aSRichard Henderson if (temp_state[args[1]] == TS_DEAD) { 1802c70fbf0aSRichard Henderson if (temp_state[args[0]] == TS_DEAD) { 180303271524SRichard Henderson /* Both parts of the operation are dead. 
*/ 18041414968aSRichard Henderson goto do_remove; 18051414968aSRichard Henderson } 180603271524SRichard Henderson /* The high part of the operation is dead; generate the low. */ 1807c45cb8bbSRichard Henderson op->opc = opc = opc_new; 18081414968aSRichard Henderson args[1] = args[2]; 18091414968aSRichard Henderson args[2] = args[3]; 1810c70fbf0aSRichard Henderson } else if (temp_state[args[0]] == TS_DEAD && have_opc_new2) { 181103271524SRichard Henderson /* The low part of the operation is dead; generate the high. */ 1812c45cb8bbSRichard Henderson op->opc = opc = opc_new2; 181303271524SRichard Henderson args[0] = args[1]; 181403271524SRichard Henderson args[1] = args[2]; 181503271524SRichard Henderson args[2] = args[3]; 181603271524SRichard Henderson } else { 181703271524SRichard Henderson goto do_not_remove; 181803271524SRichard Henderson } 181903271524SRichard Henderson /* Mark the single-word operation live. */ 18201414968aSRichard Henderson nb_oargs = 1; 18211414968aSRichard Henderson goto do_not_remove; 18221414968aSRichard Henderson 1823c896fe29Sbellard default: 18241305c451SRichard Henderson /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */ 1825c896fe29Sbellard nb_iargs = def->nb_iargs; 1826c896fe29Sbellard nb_oargs = def->nb_oargs; 1827c896fe29Sbellard 1828c896fe29Sbellard /* Test if the operation can be removed because all 18295ff9d6a4Sbellard its outputs are dead. 
We assume that nb_oargs == 0 18305ff9d6a4Sbellard implies side effects */ 18315ff9d6a4Sbellard if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) { 1832c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1833c70fbf0aSRichard Henderson if (temp_state[args[i]] != TS_DEAD) { 1834c896fe29Sbellard goto do_not_remove; 1835c896fe29Sbellard } 18369c43b68dSAurelien Jarno } 18371305c451SRichard Henderson do_remove: 18380c627cdcSRichard Henderson tcg_op_remove(s, op); 1839c896fe29Sbellard } else { 1840c896fe29Sbellard do_not_remove: 1841c896fe29Sbellard /* output args are dead */ 1842c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1843c896fe29Sbellard arg = args[i]; 1844c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1845a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 18466b64b624SAurelien Jarno } 1847c70fbf0aSRichard Henderson if (temp_state[arg] & TS_MEM) { 1848a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 18499c43b68dSAurelien Jarno } 1850c70fbf0aSRichard Henderson temp_state[arg] = TS_DEAD; 1851c896fe29Sbellard } 1852c896fe29Sbellard 1853c896fe29Sbellard /* if end of basic block, update */ 1854c896fe29Sbellard if (def->flags & TCG_OPF_BB_END) { 1855c70fbf0aSRichard Henderson tcg_la_bb_end(s, temp_state); 18563d5c5f87SAurelien Jarno } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 18573d5c5f87SAurelien Jarno /* globals should be synced to memory */ 1858c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 1859c70fbf0aSRichard Henderson temp_state[i] |= TS_MEM; 1860c70fbf0aSRichard Henderson } 1861c896fe29Sbellard } 1862c896fe29Sbellard 1863c19f47bfSAurelien Jarno /* record arguments that die in this opcode */ 1864866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 1865866cb6cbSAurelien Jarno arg = args[i]; 1866c70fbf0aSRichard Henderson if (temp_state[arg] & TS_DEAD) { 1867a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 1868c896fe29Sbellard } 1869c19f47bfSAurelien Jarno } 187067cc32ebSVeres Lajos /* 
input arguments are live for preceding opcodes */ 1871c19f47bfSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 1872c70fbf0aSRichard Henderson temp_state[args[i]] &= ~TS_DEAD; 1873c896fe29Sbellard } 1874c896fe29Sbellard } 1875c896fe29Sbellard break; 1876c896fe29Sbellard } 1877bee158cbSRichard Henderson op->life = arg_life; 1878c896fe29Sbellard } 18791ff0a2c5SEvgeny Voevodin } 1880c896fe29Sbellard 18815a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries. */ 18825a18407fSRichard Henderson static bool liveness_pass_2(TCGContext *s, uint8_t *temp_state) 18835a18407fSRichard Henderson { 18845a18407fSRichard Henderson int nb_globals = s->nb_globals; 18855a18407fSRichard Henderson int16_t *dir_temps; 18865a18407fSRichard Henderson int i, oi, oi_next; 18875a18407fSRichard Henderson bool changes = false; 18885a18407fSRichard Henderson 18895a18407fSRichard Henderson dir_temps = tcg_malloc(nb_globals * sizeof(int16_t)); 18905a18407fSRichard Henderson memset(dir_temps, 0, nb_globals * sizeof(int16_t)); 18915a18407fSRichard Henderson 18925a18407fSRichard Henderson /* Create a temporary for each indirect global. 
*/ 18935a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 18945a18407fSRichard Henderson TCGTemp *its = &s->temps[i]; 18955a18407fSRichard Henderson if (its->indirect_reg) { 18965a18407fSRichard Henderson TCGTemp *dts = tcg_temp_alloc(s); 18975a18407fSRichard Henderson dts->type = its->type; 18985a18407fSRichard Henderson dts->base_type = its->base_type; 18995a18407fSRichard Henderson dir_temps[i] = temp_idx(s, dts); 19005a18407fSRichard Henderson } 19015a18407fSRichard Henderson } 19025a18407fSRichard Henderson 19035a18407fSRichard Henderson memset(temp_state, TS_DEAD, nb_globals); 19045a18407fSRichard Henderson 19055a18407fSRichard Henderson for (oi = s->gen_op_buf[0].next; oi != 0; oi = oi_next) { 19065a18407fSRichard Henderson TCGOp *op = &s->gen_op_buf[oi]; 19075a18407fSRichard Henderson TCGArg *args = &s->gen_opparam_buf[op->args]; 19085a18407fSRichard Henderson TCGOpcode opc = op->opc; 19095a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 19105a18407fSRichard Henderson TCGLifeData arg_life = op->life; 19115a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 19125a18407fSRichard Henderson TCGArg arg, dir; 19135a18407fSRichard Henderson 19145a18407fSRichard Henderson oi_next = op->next; 19155a18407fSRichard Henderson 19165a18407fSRichard Henderson if (opc == INDEX_op_call) { 19175a18407fSRichard Henderson nb_oargs = op->callo; 19185a18407fSRichard Henderson nb_iargs = op->calli; 19195a18407fSRichard Henderson call_flags = args[nb_oargs + nb_iargs + 1]; 19205a18407fSRichard Henderson } else { 19215a18407fSRichard Henderson nb_iargs = def->nb_iargs; 19225a18407fSRichard Henderson nb_oargs = def->nb_oargs; 19235a18407fSRichard Henderson 19245a18407fSRichard Henderson /* Set flags similar to how calls require. 
*/ 19255a18407fSRichard Henderson if (def->flags & TCG_OPF_BB_END) { 19265a18407fSRichard Henderson /* Like writing globals: save_globals */ 19275a18407fSRichard Henderson call_flags = 0; 19285a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 19295a18407fSRichard Henderson /* Like reading globals: sync_globals */ 19305a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 19315a18407fSRichard Henderson } else { 19325a18407fSRichard Henderson /* No effect on globals. */ 19335a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 19345a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 19355a18407fSRichard Henderson } 19365a18407fSRichard Henderson } 19375a18407fSRichard Henderson 19385a18407fSRichard Henderson /* Make sure that input arguments are available. */ 19395a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 19405a18407fSRichard Henderson arg = args[i]; 19415a18407fSRichard Henderson /* Note this unsigned test catches TCG_CALL_ARG_DUMMY too. */ 19425a18407fSRichard Henderson if (arg < nb_globals) { 19435a18407fSRichard Henderson dir = dir_temps[arg]; 19445a18407fSRichard Henderson if (dir != 0 && temp_state[arg] == TS_DEAD) { 19455a18407fSRichard Henderson TCGTemp *its = &s->temps[arg]; 19465a18407fSRichard Henderson TCGOpcode lopc = (its->type == TCG_TYPE_I32 19475a18407fSRichard Henderson ? INDEX_op_ld_i32 19485a18407fSRichard Henderson : INDEX_op_ld_i64); 19495a18407fSRichard Henderson TCGOp *lop = tcg_op_insert_before(s, op, lopc, 3); 19505a18407fSRichard Henderson TCGArg *largs = &s->gen_opparam_buf[lop->args]; 19515a18407fSRichard Henderson 19525a18407fSRichard Henderson largs[0] = dir; 19535a18407fSRichard Henderson largs[1] = temp_idx(s, its->mem_base); 19545a18407fSRichard Henderson largs[2] = its->mem_offset; 19555a18407fSRichard Henderson 19565a18407fSRichard Henderson /* Loaded, but synced with memory. 
*/ 19575a18407fSRichard Henderson temp_state[arg] = TS_MEM; 19585a18407fSRichard Henderson } 19595a18407fSRichard Henderson } 19605a18407fSRichard Henderson } 19615a18407fSRichard Henderson 19625a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 19635a18407fSRichard Henderson No action is required except keeping temp_state up to date 19645a18407fSRichard Henderson so that we reload when needed. */ 19655a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 19665a18407fSRichard Henderson arg = args[i]; 19675a18407fSRichard Henderson if (arg < nb_globals) { 19685a18407fSRichard Henderson dir = dir_temps[arg]; 19695a18407fSRichard Henderson if (dir != 0) { 19705a18407fSRichard Henderson args[i] = dir; 19715a18407fSRichard Henderson changes = true; 19725a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 19735a18407fSRichard Henderson temp_state[arg] = TS_DEAD; 19745a18407fSRichard Henderson } 19755a18407fSRichard Henderson } 19765a18407fSRichard Henderson } 19775a18407fSRichard Henderson } 19785a18407fSRichard Henderson 19795a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 19805a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 19815a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 19825a18407fSRichard Henderson /* Nothing to do */ 19835a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 19845a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 19855a18407fSRichard Henderson /* Liveness should see that globals are synced back, 19865a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. 
*/ 19875a18407fSRichard Henderson tcg_debug_assert(dir_temps[i] == 0 19885a18407fSRichard Henderson || temp_state[i] != 0); 19895a18407fSRichard Henderson } 19905a18407fSRichard Henderson } else { 19915a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 19925a18407fSRichard Henderson /* Liveness should see that globals are saved back, 19935a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. */ 19945a18407fSRichard Henderson tcg_debug_assert(dir_temps[i] == 0 19955a18407fSRichard Henderson || temp_state[i] == TS_DEAD); 19965a18407fSRichard Henderson } 19975a18407fSRichard Henderson } 19985a18407fSRichard Henderson 19995a18407fSRichard Henderson /* Outputs become available. */ 20005a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 20015a18407fSRichard Henderson arg = args[i]; 20025a18407fSRichard Henderson if (arg >= nb_globals) { 20035a18407fSRichard Henderson continue; 20045a18407fSRichard Henderson } 20055a18407fSRichard Henderson dir = dir_temps[arg]; 20065a18407fSRichard Henderson if (dir == 0) { 20075a18407fSRichard Henderson continue; 20085a18407fSRichard Henderson } 20095a18407fSRichard Henderson args[i] = dir; 20105a18407fSRichard Henderson changes = true; 20115a18407fSRichard Henderson 20125a18407fSRichard Henderson /* The output is now live and modified. */ 20135a18407fSRichard Henderson temp_state[arg] = 0; 20145a18407fSRichard Henderson 20155a18407fSRichard Henderson /* Sync outputs upon their last write. */ 20165a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 20175a18407fSRichard Henderson TCGTemp *its = &s->temps[arg]; 20185a18407fSRichard Henderson TCGOpcode sopc = (its->type == TCG_TYPE_I32 20195a18407fSRichard Henderson ? 
INDEX_op_st_i32 20205a18407fSRichard Henderson : INDEX_op_st_i64); 20215a18407fSRichard Henderson TCGOp *sop = tcg_op_insert_after(s, op, sopc, 3); 20225a18407fSRichard Henderson TCGArg *sargs = &s->gen_opparam_buf[sop->args]; 20235a18407fSRichard Henderson 20245a18407fSRichard Henderson sargs[0] = dir; 20255a18407fSRichard Henderson sargs[1] = temp_idx(s, its->mem_base); 20265a18407fSRichard Henderson sargs[2] = its->mem_offset; 20275a18407fSRichard Henderson 20285a18407fSRichard Henderson temp_state[arg] = TS_MEM; 20295a18407fSRichard Henderson } 20305a18407fSRichard Henderson /* Drop outputs that are dead. */ 20315a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 20325a18407fSRichard Henderson temp_state[arg] = TS_DEAD; 20335a18407fSRichard Henderson } 20345a18407fSRichard Henderson } 20355a18407fSRichard Henderson } 20365a18407fSRichard Henderson 20375a18407fSRichard Henderson return changes; 20385a18407fSRichard Henderson } 20395a18407fSRichard Henderson 20408d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2041c896fe29Sbellard static void dump_regs(TCGContext *s) 2042c896fe29Sbellard { 2043c896fe29Sbellard TCGTemp *ts; 2044c896fe29Sbellard int i; 2045c896fe29Sbellard char buf[64]; 2046c896fe29Sbellard 2047c896fe29Sbellard for(i = 0; i < s->nb_temps; i++) { 2048c896fe29Sbellard ts = &s->temps[i]; 2049ac56dd48Spbrook printf(" %10s: ", tcg_get_arg_str_idx(s, buf, sizeof(buf), i)); 2050c896fe29Sbellard switch(ts->val_type) { 2051c896fe29Sbellard case TEMP_VAL_REG: 2052c896fe29Sbellard printf("%s", tcg_target_reg_names[ts->reg]); 2053c896fe29Sbellard break; 2054c896fe29Sbellard case TEMP_VAL_MEM: 2055b3a62939SRichard Henderson printf("%d(%s)", (int)ts->mem_offset, 2056b3a62939SRichard Henderson tcg_target_reg_names[ts->mem_base->reg]); 2057c896fe29Sbellard break; 2058c896fe29Sbellard case TEMP_VAL_CONST: 2059c896fe29Sbellard printf("$0x%" TCG_PRIlx, ts->val); 2060c896fe29Sbellard break; 2061c896fe29Sbellard case TEMP_VAL_DEAD: 2062c896fe29Sbellard printf("D"); 
2063c896fe29Sbellard break; 2064c896fe29Sbellard default: 2065c896fe29Sbellard printf("???"); 2066c896fe29Sbellard break; 2067c896fe29Sbellard } 2068c896fe29Sbellard printf("\n"); 2069c896fe29Sbellard } 2070c896fe29Sbellard 2071c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2072f8b2f202SRichard Henderson if (s->reg_to_temp[i] != NULL) { 2073c896fe29Sbellard printf("%s: %s\n", 2074c896fe29Sbellard tcg_target_reg_names[i], 2075f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i])); 2076c896fe29Sbellard } 2077c896fe29Sbellard } 2078c896fe29Sbellard } 2079c896fe29Sbellard 2080c896fe29Sbellard static void check_regs(TCGContext *s) 2081c896fe29Sbellard { 2082869938aeSRichard Henderson int reg; 2083b6638662SRichard Henderson int k; 2084c896fe29Sbellard TCGTemp *ts; 2085c896fe29Sbellard char buf[64]; 2086c896fe29Sbellard 2087c896fe29Sbellard for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) { 2088f8b2f202SRichard Henderson ts = s->reg_to_temp[reg]; 2089f8b2f202SRichard Henderson if (ts != NULL) { 2090f8b2f202SRichard Henderson if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) { 2091c896fe29Sbellard printf("Inconsistency for register %s:\n", 2092c896fe29Sbellard tcg_target_reg_names[reg]); 2093b03cce8eSbellard goto fail; 2094c896fe29Sbellard } 2095c896fe29Sbellard } 2096c896fe29Sbellard } 2097c896fe29Sbellard for (k = 0; k < s->nb_temps; k++) { 2098c896fe29Sbellard ts = &s->temps[k]; 2099f8b2f202SRichard Henderson if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg 2100f8b2f202SRichard Henderson && s->reg_to_temp[ts->reg] != ts) { 2101c896fe29Sbellard printf("Inconsistency for temp %s:\n", 2102f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2103b03cce8eSbellard fail: 2104c896fe29Sbellard printf("reg state:\n"); 2105c896fe29Sbellard dump_regs(s); 2106c896fe29Sbellard tcg_abort(); 2107c896fe29Sbellard } 2108c896fe29Sbellard } 2109c896fe29Sbellard } 2110c896fe29Sbellard #endif 2111c896fe29Sbellard 
2112c896fe29Sbellard static void temp_allocate_frame(TCGContext *s, int temp) 2113c896fe29Sbellard { 2114c896fe29Sbellard TCGTemp *ts; 2115c896fe29Sbellard ts = &s->temps[temp]; 21169b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64) 21179b9c37c3SRichard Henderson /* Sparc64 stack is accessed with offset of 2047 */ 2118b591dc59SBlue Swirl s->current_frame_offset = (s->current_frame_offset + 2119b591dc59SBlue Swirl (tcg_target_long)sizeof(tcg_target_long) - 1) & 2120b591dc59SBlue Swirl ~(sizeof(tcg_target_long) - 1); 2121f44c9960SBlue Swirl #endif 2122b591dc59SBlue Swirl if (s->current_frame_offset + (tcg_target_long)sizeof(tcg_target_long) > 2123b591dc59SBlue Swirl s->frame_end) { 21245ff9d6a4Sbellard tcg_abort(); 2125b591dc59SBlue Swirl } 2126c896fe29Sbellard ts->mem_offset = s->current_frame_offset; 2127b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 2128c896fe29Sbellard ts->mem_allocated = 1; 2129e2c6d1b4SRichard Henderson s->current_frame_offset += sizeof(tcg_target_long); 2130c896fe29Sbellard } 2131c896fe29Sbellard 2132b3915dbbSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet); 2133b3915dbbSRichard Henderson 213459d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 213559d7c14eSRichard Henderson mark it free; otherwise mark it dead. 
*/ 213659d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 2137c896fe29Sbellard { 213859d7c14eSRichard Henderson if (ts->fixed_reg) { 213959d7c14eSRichard Henderson return; 214059d7c14eSRichard Henderson } 214159d7c14eSRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 214259d7c14eSRichard Henderson s->reg_to_temp[ts->reg] = NULL; 214359d7c14eSRichard Henderson } 214459d7c14eSRichard Henderson ts->val_type = (free_or_dead < 0 214559d7c14eSRichard Henderson || ts->temp_local 214659d7c14eSRichard Henderson || temp_idx(s, ts) < s->nb_globals 214759d7c14eSRichard Henderson ? TEMP_VAL_MEM : TEMP_VAL_DEAD); 214859d7c14eSRichard Henderson } 2149c896fe29Sbellard 215059d7c14eSRichard Henderson /* Mark a temporary as dead. */ 215159d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 215259d7c14eSRichard Henderson { 215359d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 215459d7c14eSRichard Henderson } 215559d7c14eSRichard Henderson 215659d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 215759d7c14eSRichard Henderson registers needs to be allocated to store a constant. If 'free_or_dead' 215859d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 215959d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. 
*/ 216059d7c14eSRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, 216159d7c14eSRichard Henderson TCGRegSet allocated_regs, int free_or_dead) 216259d7c14eSRichard Henderson { 216359d7c14eSRichard Henderson if (ts->fixed_reg) { 216459d7c14eSRichard Henderson return; 216559d7c14eSRichard Henderson } 216659d7c14eSRichard Henderson if (!ts->mem_coherent) { 21677f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 2168f8b2f202SRichard Henderson temp_allocate_frame(s, temp_idx(s, ts)); 216959d7c14eSRichard Henderson } 217059d7c14eSRichard Henderson switch (ts->val_type) { 217159d7c14eSRichard Henderson case TEMP_VAL_CONST: 217259d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 217359d7c14eSRichard Henderson require it later in a register, so attempt to store the 217459d7c14eSRichard Henderson constant to memory directly. */ 217559d7c14eSRichard Henderson if (free_or_dead 217659d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 217759d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 217859d7c14eSRichard Henderson break; 217959d7c14eSRichard Henderson } 218059d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 218159d7c14eSRichard Henderson allocated_regs); 218259d7c14eSRichard Henderson /* fallthrough */ 218359d7c14eSRichard Henderson 218459d7c14eSRichard Henderson case TEMP_VAL_REG: 218559d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 218659d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 218759d7c14eSRichard Henderson break; 218859d7c14eSRichard Henderson 218959d7c14eSRichard Henderson case TEMP_VAL_MEM: 219059d7c14eSRichard Henderson break; 219159d7c14eSRichard Henderson 219259d7c14eSRichard Henderson case TEMP_VAL_DEAD: 219359d7c14eSRichard Henderson default: 219459d7c14eSRichard Henderson tcg_abort(); 2195c896fe29Sbellard } 21967f6ceedfSAurelien Jarno ts->mem_coherent = 1; 21977f6ceedfSAurelien Jarno } 219859d7c14eSRichard Henderson if 
(free_or_dead) { 219959d7c14eSRichard Henderson temp_free_or_dead(s, ts, free_or_dead); 220059d7c14eSRichard Henderson } 220159d7c14eSRichard Henderson } 22027f6ceedfSAurelien Jarno 22037f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 2204b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 22057f6ceedfSAurelien Jarno { 2206f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 2207f8b2f202SRichard Henderson if (ts != NULL) { 220859d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, -1); 2209c896fe29Sbellard } 2210c896fe29Sbellard } 2211c896fe29Sbellard 2212c896fe29Sbellard /* Allocate a register belonging to reg1 & ~reg2 */ 2213b3915dbbSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet desired_regs, 221491478cefSRichard Henderson TCGRegSet allocated_regs, bool rev) 2215c896fe29Sbellard { 221691478cefSRichard Henderson int i, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 221791478cefSRichard Henderson const int *order; 2218b6638662SRichard Henderson TCGReg reg; 2219c896fe29Sbellard TCGRegSet reg_ct; 2220c896fe29Sbellard 222107ddf036SRichard Henderson reg_ct = desired_regs & ~allocated_regs; 222291478cefSRichard Henderson order = rev ? 
indirect_reg_alloc_order : tcg_target_reg_alloc_order; 2223c896fe29Sbellard 2224c896fe29Sbellard /* first try free registers */ 222591478cefSRichard Henderson for(i = 0; i < n; i++) { 222691478cefSRichard Henderson reg = order[i]; 2227f8b2f202SRichard Henderson if (tcg_regset_test_reg(reg_ct, reg) && s->reg_to_temp[reg] == NULL) 2228c896fe29Sbellard return reg; 2229c896fe29Sbellard } 2230c896fe29Sbellard 2231c896fe29Sbellard /* XXX: do better spill choice */ 223291478cefSRichard Henderson for(i = 0; i < n; i++) { 223391478cefSRichard Henderson reg = order[i]; 2234c896fe29Sbellard if (tcg_regset_test_reg(reg_ct, reg)) { 2235b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 2236c896fe29Sbellard return reg; 2237c896fe29Sbellard } 2238c896fe29Sbellard } 2239c896fe29Sbellard 2240c896fe29Sbellard tcg_abort(); 2241c896fe29Sbellard } 2242c896fe29Sbellard 224340ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 224440ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. 
*/ 224540ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 224640ae5c62SRichard Henderson TCGRegSet allocated_regs) 224740ae5c62SRichard Henderson { 224840ae5c62SRichard Henderson TCGReg reg; 224940ae5c62SRichard Henderson 225040ae5c62SRichard Henderson switch (ts->val_type) { 225140ae5c62SRichard Henderson case TEMP_VAL_REG: 225240ae5c62SRichard Henderson return; 225340ae5c62SRichard Henderson case TEMP_VAL_CONST: 225491478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 225540ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 225640ae5c62SRichard Henderson ts->mem_coherent = 0; 225740ae5c62SRichard Henderson break; 225840ae5c62SRichard Henderson case TEMP_VAL_MEM: 225991478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 226040ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 226140ae5c62SRichard Henderson ts->mem_coherent = 1; 226240ae5c62SRichard Henderson break; 226340ae5c62SRichard Henderson case TEMP_VAL_DEAD: 226440ae5c62SRichard Henderson default: 226540ae5c62SRichard Henderson tcg_abort(); 226640ae5c62SRichard Henderson } 226740ae5c62SRichard Henderson ts->reg = reg; 226840ae5c62SRichard Henderson ts->val_type = TEMP_VAL_REG; 226940ae5c62SRichard Henderson s->reg_to_temp[reg] = ts; 227040ae5c62SRichard Henderson } 227140ae5c62SRichard Henderson 227259d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 2273e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 227459d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 22751ad80729SAurelien Jarno { 22762c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 2277eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. 
*/ 2278f8bf00f1SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg); 22791ad80729SAurelien Jarno } 22801ad80729SAurelien Jarno 22819814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 2282641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 2283641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 2284641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 2285641d5fbeSbellard { 2286641d5fbeSbellard int i; 2287641d5fbeSbellard 2288641d5fbeSbellard for (i = 0; i < s->nb_globals; i++) { 2289b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 2290641d5fbeSbellard } 2291e5097dc8Sbellard } 2292e5097dc8Sbellard 22933d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 22943d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 22953d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 22963d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 22973d5c5f87SAurelien Jarno { 22983d5c5f87SAurelien Jarno int i; 22993d5c5f87SAurelien Jarno 23003d5c5f87SAurelien Jarno for (i = 0; i < s->nb_globals; i++) { 230112b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 230212b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 230312b9b11aSRichard Henderson || ts->fixed_reg 230412b9b11aSRichard Henderson || ts->mem_coherent); 23053d5c5f87SAurelien Jarno } 23063d5c5f87SAurelien Jarno } 23073d5c5f87SAurelien Jarno 2308e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 2309e8996ee0Sbellard all globals are stored at their canonical location. 
*/ 2310e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 2311e5097dc8Sbellard { 2312e5097dc8Sbellard int i; 2313e5097dc8Sbellard 2314c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 2315b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 2316641d5fbeSbellard if (ts->temp_local) { 2317b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 2318641d5fbeSbellard } else { 23192c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 2320eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 2321eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 2322c896fe29Sbellard } 2323641d5fbeSbellard } 2324e8996ee0Sbellard 2325e8996ee0Sbellard save_globals(s, allocated_regs); 2326c896fe29Sbellard } 2327c896fe29Sbellard 23280fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 23290fe4fca4SPaolo Bonzini tcg_target_ulong val, TCGLifeData arg_life) 2330e8996ee0Sbellard { 2331e8996ee0Sbellard if (ots->fixed_reg) { 233259d7c14eSRichard Henderson /* For fixed registers, we do not do any constant propagation. */ 2333e8996ee0Sbellard tcg_out_movi(s, ots->type, ots->reg, val); 233459d7c14eSRichard Henderson return; 233559d7c14eSRichard Henderson } 233659d7c14eSRichard Henderson 233759d7c14eSRichard Henderson /* The movi is not explicitly generated here. 
*/ 2338f8b2f202SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 2339f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 2340f8b2f202SRichard Henderson } 2341e8996ee0Sbellard ots->val_type = TEMP_VAL_CONST; 2342e8996ee0Sbellard ots->val = val; 234359d7c14eSRichard Henderson ots->mem_coherent = 0; 2344ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 234559d7c14eSRichard Henderson temp_sync(s, ots, s->reserved_regs, IS_DEAD_ARG(0)); 234659d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 2347f8bf00f1SRichard Henderson temp_dead(s, ots); 23484c4e1ab2SAurelien Jarno } 2349e8996ee0Sbellard } 2350e8996ee0Sbellard 23510fe4fca4SPaolo Bonzini static void tcg_reg_alloc_movi(TCGContext *s, const TCGArg *args, 23520fe4fca4SPaolo Bonzini TCGLifeData arg_life) 23530fe4fca4SPaolo Bonzini { 23540fe4fca4SPaolo Bonzini TCGTemp *ots = &s->temps[args[0]]; 23550fe4fca4SPaolo Bonzini tcg_target_ulong val = args[1]; 23560fe4fca4SPaolo Bonzini 23570fe4fca4SPaolo Bonzini tcg_reg_alloc_do_movi(s, ots, val, arg_life); 23580fe4fca4SPaolo Bonzini } 23590fe4fca4SPaolo Bonzini 2360c896fe29Sbellard static void tcg_reg_alloc_mov(TCGContext *s, const TCGOpDef *def, 2361a1b3c48dSRichard Henderson const TCGArg *args, TCGLifeData arg_life) 2362c896fe29Sbellard { 2363c29c1d7eSAurelien Jarno TCGRegSet allocated_regs; 2364c896fe29Sbellard TCGTemp *ts, *ots; 2365450445d5SRichard Henderson TCGType otype, itype; 2366c896fe29Sbellard 2367d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 2368c896fe29Sbellard ots = &s->temps[args[0]]; 2369c896fe29Sbellard ts = &s->temps[args[1]]; 2370450445d5SRichard Henderson 2371450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. 
*/ 2372450445d5SRichard Henderson otype = ots->type; 2373450445d5SRichard Henderson itype = ts->type; 2374c896fe29Sbellard 23750fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 23760fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 23770fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 23780fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 23790fe4fca4SPaolo Bonzini temp_dead(s, ts); 23800fe4fca4SPaolo Bonzini } 23810fe4fca4SPaolo Bonzini tcg_reg_alloc_do_movi(s, ots, val, arg_life); 23820fe4fca4SPaolo Bonzini return; 23830fe4fca4SPaolo Bonzini } 23840fe4fca4SPaolo Bonzini 23850fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 23860fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 23870fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 23880fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 23890fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 239040ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], allocated_regs); 2391c29c1d7eSAurelien Jarno } 2392c29c1d7eSAurelien Jarno 23930fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 2394c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(0) && !ots->fixed_reg) { 2395c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 2396c29c1d7eSAurelien Jarno liveness analysis disabled). 
*/ 2397eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 2398c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 2399c29c1d7eSAurelien Jarno temp_allocate_frame(s, args[0]); 2400c29c1d7eSAurelien Jarno } 2401b3a62939SRichard Henderson tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset); 2402c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 2403f8bf00f1SRichard Henderson temp_dead(s, ts); 2404c29c1d7eSAurelien Jarno } 2405f8bf00f1SRichard Henderson temp_dead(s, ots); 2406e8996ee0Sbellard } else { 2407c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) { 2408c29c1d7eSAurelien Jarno /* the mov can be suppressed */ 2409c29c1d7eSAurelien Jarno if (ots->val_type == TEMP_VAL_REG) { 2410f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 2411c896fe29Sbellard } 2412c29c1d7eSAurelien Jarno ots->reg = ts->reg; 2413f8bf00f1SRichard Henderson temp_dead(s, ts); 2414c29c1d7eSAurelien Jarno } else { 2415c29c1d7eSAurelien Jarno if (ots->val_type != TEMP_VAL_REG) { 2416c29c1d7eSAurelien Jarno /* When allocating a new register, make sure to not spill the 2417c29c1d7eSAurelien Jarno input one. 
*/ 2418c29c1d7eSAurelien Jarno tcg_regset_set_reg(allocated_regs, ts->reg); 2419450445d5SRichard Henderson ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 242091478cefSRichard Henderson allocated_regs, ots->indirect_base); 2421c29c1d7eSAurelien Jarno } 2422450445d5SRichard Henderson tcg_out_mov(s, otype, ots->reg, ts->reg); 2423c29c1d7eSAurelien Jarno } 2424c896fe29Sbellard ots->val_type = TEMP_VAL_REG; 2425c896fe29Sbellard ots->mem_coherent = 0; 2426f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = ots; 2427ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 242859d7c14eSRichard Henderson temp_sync(s, ots, allocated_regs, 0); 2429c29c1d7eSAurelien Jarno } 2430ec7a869dSAurelien Jarno } 2431c896fe29Sbellard } 2432c896fe29Sbellard 2433c896fe29Sbellard static void tcg_reg_alloc_op(TCGContext *s, 2434a9751609SRichard Henderson const TCGOpDef *def, TCGOpcode opc, 2435a1b3c48dSRichard Henderson const TCGArg *args, TCGLifeData arg_life) 2436c896fe29Sbellard { 243782790a87SRichard Henderson TCGRegSet i_allocated_regs; 243882790a87SRichard Henderson TCGRegSet o_allocated_regs; 2439b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 2440b6638662SRichard Henderson TCGReg reg; 2441c896fe29Sbellard TCGArg arg; 2442c896fe29Sbellard const TCGArgConstraint *arg_ct; 2443c896fe29Sbellard TCGTemp *ts; 2444c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 2445c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 2446c896fe29Sbellard 2447c896fe29Sbellard nb_oargs = def->nb_oargs; 2448c896fe29Sbellard nb_iargs = def->nb_iargs; 2449c896fe29Sbellard 2450c896fe29Sbellard /* copy constants */ 2451c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 2452c896fe29Sbellard args + nb_oargs + nb_iargs, 2453c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 2454c896fe29Sbellard 2455d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 2456d21369f5SRichard Henderson o_allocated_regs = s->reserved_regs; 245782790a87SRichard Henderson 2458c896fe29Sbellard /* satisfy input 
constraints */ 2459c896fe29Sbellard for(k = 0; k < nb_iargs; k++) { 2460c896fe29Sbellard i = def->sorted_args[nb_oargs + k]; 2461c896fe29Sbellard arg = args[i]; 2462c896fe29Sbellard arg_ct = &def->args_ct[i]; 2463c896fe29Sbellard ts = &s->temps[arg]; 246440ae5c62SRichard Henderson 246540ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 246640ae5c62SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct)) { 2467c896fe29Sbellard /* constant is OK for instruction */ 2468c896fe29Sbellard const_args[i] = 1; 2469c896fe29Sbellard new_args[i] = ts->val; 2470c896fe29Sbellard goto iarg_end; 2471c896fe29Sbellard } 247240ae5c62SRichard Henderson 247382790a87SRichard Henderson temp_load(s, ts, arg_ct->u.regs, i_allocated_regs); 247440ae5c62SRichard Henderson 24755ff9d6a4Sbellard if (arg_ct->ct & TCG_CT_IALIAS) { 24765ff9d6a4Sbellard if (ts->fixed_reg) { 24775ff9d6a4Sbellard /* if fixed register, we must allocate a new register 24785ff9d6a4Sbellard if the alias is not the same register */ 24795ff9d6a4Sbellard if (arg != args[arg_ct->alias_index]) 24805ff9d6a4Sbellard goto allocate_in_reg; 24815ff9d6a4Sbellard } else { 2482c896fe29Sbellard /* if the input is aliased to an output and if it is 2483c896fe29Sbellard not dead after the instruction, we must allocate 2484c896fe29Sbellard a new register and move it */ 2485866cb6cbSAurelien Jarno if (!IS_DEAD_ARG(i)) { 2486c896fe29Sbellard goto allocate_in_reg; 2487c896fe29Sbellard } 24887e1df267SAurelien Jarno /* check if the current register has already been allocated 24897e1df267SAurelien Jarno for another input aliased to an output */ 24907e1df267SAurelien Jarno int k2, i2; 24917e1df267SAurelien Jarno for (k2 = 0 ; k2 < k ; k2++) { 24927e1df267SAurelien Jarno i2 = def->sorted_args[nb_oargs + k2]; 24937e1df267SAurelien Jarno if ((def->args_ct[i2].ct & TCG_CT_IALIAS) && 24947e1df267SAurelien Jarno (new_args[i2] == ts->reg)) { 24957e1df267SAurelien Jarno goto allocate_in_reg; 24967e1df267SAurelien Jarno } 
24977e1df267SAurelien Jarno } 24985ff9d6a4Sbellard } 2499866cb6cbSAurelien Jarno } 2500c896fe29Sbellard reg = ts->reg; 2501c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, reg)) { 2502c896fe29Sbellard /* nothing to do : the constraint is satisfied */ 2503c896fe29Sbellard } else { 2504c896fe29Sbellard allocate_in_reg: 2505c896fe29Sbellard /* allocate a new register matching the constraint 2506c896fe29Sbellard and move the temporary register into it */ 250782790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs, 250891478cefSRichard Henderson ts->indirect_base); 25093b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 2510c896fe29Sbellard } 2511c896fe29Sbellard new_args[i] = reg; 2512c896fe29Sbellard const_args[i] = 0; 251382790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 2514c896fe29Sbellard iarg_end: ; 2515c896fe29Sbellard } 2516c896fe29Sbellard 2517c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 2518866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 2519866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 2520f8bf00f1SRichard Henderson temp_dead(s, &s->temps[args[i]]); 2521c896fe29Sbellard } 2522c896fe29Sbellard } 2523c896fe29Sbellard 2524a52ad07eSAurelien Jarno if (def->flags & TCG_OPF_BB_END) { 252582790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 2526a52ad07eSAurelien Jarno } else { 2527c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 2528b03cce8eSbellard /* XXX: permit generic clobber register list ? 
*/ 2529c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 2530c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 253182790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 2532c896fe29Sbellard } 2533c896fe29Sbellard } 25343d5c5f87SAurelien Jarno } 25353d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 25363d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 25373d5c5f87SAurelien Jarno an exception. */ 253882790a87SRichard Henderson sync_globals(s, i_allocated_regs); 2539c896fe29Sbellard } 2540c896fe29Sbellard 2541c896fe29Sbellard /* satisfy the output constraints */ 2542c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 2543c896fe29Sbellard i = def->sorted_args[k]; 2544c896fe29Sbellard arg = args[i]; 2545c896fe29Sbellard arg_ct = &def->args_ct[i]; 2546c896fe29Sbellard ts = &s->temps[arg]; 254717280ff4SRichard Henderson if ((arg_ct->ct & TCG_CT_ALIAS) 254817280ff4SRichard Henderson && !const_args[arg_ct->alias_index]) { 25495ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 255082790a87SRichard Henderson } else if (arg_ct->ct & TCG_CT_NEWREG) { 255182790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, 255282790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 255382790a87SRichard Henderson ts->indirect_base); 2554c896fe29Sbellard } else { 2555c896fe29Sbellard /* if fixed register, we try to use it */ 2556c896fe29Sbellard reg = ts->reg; 2557c896fe29Sbellard if (ts->fixed_reg && 2558c896fe29Sbellard tcg_regset_test_reg(arg_ct->u.regs, reg)) { 2559c896fe29Sbellard goto oarg_end; 2560c896fe29Sbellard } 256182790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs, 256291478cefSRichard Henderson ts->indirect_base); 2563c896fe29Sbellard } 256482790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 2565c896fe29Sbellard /* if a fixed register is used, then a move will be done afterwards */ 
/* Sign helper for stack offsets: negates its argument when the target
   defines TCG_TARGET_STACK_GROWSUP, otherwise yields it unchanged.
   It is not referenced by tcg_reg_alloc_call below, which tests
   TCG_TARGET_STACK_GROWSUP directly. */
#ifdef TCG_TARGET_STACK_GROWSUP
#define STACK_DIR(x) (-(x))
#else
#define STACK_DIR(x) (x)
#endif

/*
 * Allocate registers for, and emit, one helper call.
 *
 * Layout of @args as consumed here:
 *   args[0 .. nb_oargs - 1]                  output temps
 *   args[nb_oargs .. nb_oargs + nb_iargs - 1] input temps
 *   args[nb_oargs + nb_iargs]                address of the function to call
 *   args[nb_oargs + nb_iargs + 1]            call flags (TCG_CALL_*)
 *
 * @arg_life is not named in the body; presumably it is what the
 * IS_DEAD_ARG / NEED_SYNC_ARG macros read -- confirm at their definition.
 *
 * Sequence: store the inputs that do not fit in argument registers to the
 * call stack, place the remaining inputs in tcg_target_call_iarg_regs[],
 * release dead inputs, free every call-clobbered register, sync or save
 * globals as the flags require, emit the call, then bind the outputs to
 * tcg_target_call_oarg_regs[].
 */
static void tcg_reg_alloc_call(TCGContext *s, int nb_oargs, int nb_iargs,
                               const TCGArg * const args, TCGLifeData arg_life)
{
    int flags, nb_regs, i;
    TCGReg reg;
    TCGArg arg;
    TCGTemp *ts;
    intptr_t stack_offset;
    size_t call_stack_size;
    tcg_insn_unit *func_addr;
    int allocate_args;
    TCGRegSet allocated_regs;

    /* The callee address and the call flags trail the input arguments. */
    func_addr = (tcg_insn_unit *)(intptr_t)args[nb_oargs + nb_iargs];
    flags = args[nb_oargs + nb_iargs + 1];

    /* nb_regs = number of inputs passed in registers: at most one per
       entry of tcg_target_call_iarg_regs, and never more than nb_iargs. */
    nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs);
    if (nb_regs > nb_iargs) {
        nb_regs = nb_iargs;
    }

    /* assign stack slots first */
    /* One tcg_target_long slot per stack-passed input, rounded up to a
       multiple of TCG_TARGET_STACK_ALIGN. */
    call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long);
    call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) &
        ~(TCG_TARGET_STACK_ALIGN - 1);
    allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE);
    if (allocate_args) {
        /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed,
           preallocate call stack */
        tcg_abort();
    }

    stack_offset = TCG_TARGET_CALL_STACK_OFFSET;
    for(i = nb_regs; i < nb_iargs; i++) {
        arg = args[nb_oargs + i];
#ifdef TCG_TARGET_STACK_GROWSUP
        stack_offset -= sizeof(tcg_target_long);
#endif
        /* A TCG_CALL_DUMMY_ARG slot still consumes stack space (the offset
           moves on either side of this test) but nothing is stored. */
        if (arg != TCG_CALL_DUMMY_ARG) {
            ts = &s->temps[arg];
            /* presumably brings the temp into some register valid for its
               type so that it can be stored -- confirm in temp_load */
            temp_load(s, ts, tcg_target_available_regs[ts->type],
                      s->reserved_regs);
            tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset);
        }
#ifndef TCG_TARGET_STACK_GROWSUP
        stack_offset += sizeof(tcg_target_long);
#endif
    }

    /* assign input registers */
    /* allocated_regs starts as the reserved set and grows by each argument
       register as it is filled. */
    allocated_regs = s->reserved_regs;
    for(i = 0; i < nb_regs; i++) {
        arg = args[nb_oargs + i];
        if (arg != TCG_CALL_DUMMY_ARG) {
            ts = &s->temps[arg];
            reg = tcg_target_call_iarg_regs[i];
            /* Release the i-th argument register before filling it. */
            tcg_reg_free(s, reg, allocated_regs);

            if (ts->val_type == TEMP_VAL_REG) {
                /* Already in a register: copy only if it is the wrong one. */
                if (ts->reg != reg) {
                    tcg_out_mov(s, ts->type, reg, ts->reg);
                }
            } else {
                /* Not in a register: load it with the argument register as
                   the only permitted destination. */
                TCGRegSet arg_set = 0;

                tcg_regset_set_reg(arg_set, reg);
                temp_load(s, ts, arg_set, allocated_regs);
            }

            tcg_regset_set_reg(allocated_regs, reg);
        }
    }

    /* mark dead temporaries and free the associated registers */
    for(i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
        if (IS_DEAD_ARG(i)) {
            temp_dead(s, &s->temps[args[i]]);
        }
    }

    /* clobber call registers */
    for (i = 0; i < TCG_TARGET_NB_REGS; i++) {
        if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) {
            tcg_reg_free(s, i, allocated_regs);
        }
    }

    /* Save globals if they might be written by the helper, sync them if
       they might be read.  */
    if (flags & TCG_CALL_NO_READ_GLOBALS) {
        /* Nothing to do */
    } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) {
        sync_globals(s, allocated_regs);
    } else {
        save_globals(s, allocated_regs);
    }

    tcg_out_call(s, func_addr);

    /* assign output registers and emit moves if needed */
    for(i = 0; i < nb_oargs; i++) {
        arg = args[i];
        ts = &s->temps[arg];
        reg = tcg_target_call_oarg_regs[i];
        /* The return register must not be bound to any temp at this point. */
        tcg_debug_assert(s->reg_to_temp[reg] == NULL);

        if (ts->fixed_reg) {
            /* Fixed-register temp: copy the result into its home register.
               No sync/dead handling is performed on this path. */
            if (ts->reg != reg) {
                tcg_out_mov(s, ts->type, ts->reg, reg);
            }
        } else {
            /* Rebind the temp to the return register, dropping any
               previous register binding first. */
            if (ts->val_type == TEMP_VAL_REG) {
                s->reg_to_temp[ts->reg] = NULL;
            }
            ts->val_type = TEMP_VAL_REG;
            ts->reg = reg;
            /* The value was just produced in a register, so the copy in
               memory is marked as no longer coherent. */
            ts->mem_coherent = 0;
            s->reg_to_temp[reg] = ts;
            if (NEED_SYNC_ARG(i)) {
                temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i));
            } else if (IS_DEAD_ARG(i)) {
                temp_dead(s, ts);
            }
        }
    }
}
2732c896fe29Sbellard 2733c896fe29Sbellard #ifdef CONFIG_PROFILER 2734c896fe29Sbellard 273554604f74Saurel32 static int64_t tcg_table_op_count[NB_OPS]; 2736c896fe29Sbellard 2737246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 2738c896fe29Sbellard { 2739c896fe29Sbellard int i; 2740d70724ceSzhanghailiang 274115fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 2742246ae24dSMax Filippov cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, 2743246ae24dSMax Filippov tcg_table_op_count[i]); 2744c896fe29Sbellard } 2745c896fe29Sbellard } 2746246ae24dSMax Filippov #else 2747246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 2748246ae24dSMax Filippov { 2749246ae24dSMax Filippov cpu_fprintf(f, "[TCG profiler not compiled]\n"); 2750246ae24dSMax Filippov } 2751c896fe29Sbellard #endif 2752c896fe29Sbellard 2753c896fe29Sbellard 27545bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb) 2755c896fe29Sbellard { 2756fca8a500SRichard Henderson int i, oi, oi_next, num_insns; 2757c896fe29Sbellard 275804fe6400SRichard Henderson #ifdef CONFIG_PROFILER 275904fe6400SRichard Henderson { 276004fe6400SRichard Henderson int n; 276104fe6400SRichard Henderson 2762dcb8e758SRichard Henderson n = s->gen_op_buf[0].prev + 1; 276304fe6400SRichard Henderson s->op_count += n; 276404fe6400SRichard Henderson if (n > s->op_count_max) { 276504fe6400SRichard Henderson s->op_count_max = n; 276604fe6400SRichard Henderson } 276704fe6400SRichard Henderson 276804fe6400SRichard Henderson n = s->nb_temps; 276904fe6400SRichard Henderson s->temp_count += n; 277004fe6400SRichard Henderson if (n > s->temp_count_max) { 277104fe6400SRichard Henderson s->temp_count_max = n; 277204fe6400SRichard Henderson } 277304fe6400SRichard Henderson } 277404fe6400SRichard Henderson #endif 277504fe6400SRichard Henderson 2776c896fe29Sbellard #ifdef DEBUG_DISAS 2777d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 
/*
 * Generate host code for the ops currently held in @s, writing it at
 * tb->tc.ptr.
 *
 * Phases, in order: optional op dump, tcg_optimize() (when
 * USE_TCG_OPTIMIZATIONS is defined), liveness analysis, then a walk over
 * the op list that dispatches each op to the matching register-allocation
 * routine, followed by target finalization and an instruction-cache flush.
 *
 * Returns the size of the generated code as reported by
 * tcg_current_code_size(), or -1 when the code pointer has passed
 * s->code_gen_highwater or one of the target finalize hooks fails.
 */
int tcg_gen_code(TCGContext *s, TranslationBlock *tb)
{
    int i, oi, oi_next, num_insns;

#ifdef CONFIG_PROFILER
    /* Accumulate op/temp totals and track the per-call maxima. */
    {
        int n;

        n = s->gen_op_buf[0].prev + 1;
        s->op_count += n;
        if (n > s->op_count_max) {
            s->op_count_max = n;
        }

        n = s->nb_temps;
        s->temp_count += n;
        if (n > s->temp_count_max) {
            s->temp_count_max = n;
        }
    }
#endif

#ifdef DEBUG_DISAS
    if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP)
                 && qemu_log_in_addr_range(tb->pc))) {
        qemu_log_lock();
        qemu_log("OP:\n");
        tcg_dump_ops(s);
        qemu_log("\n");
        qemu_log_unlock();
    }
#endif

    /* Profiler timing idiom used below: subtract the clock when a phase
       starts and add it when the phase ends, so the field accumulates the
       elapsed time. */
#ifdef CONFIG_PROFILER
    s->opt_time -= profile_getclock();
#endif

#ifdef USE_TCG_OPTIMIZATIONS
    tcg_optimize(s);
#endif

#ifdef CONFIG_PROFILER
    s->opt_time += profile_getclock();
    s->la_time -= profile_getclock();
#endif

    {
        /* Scratch state for the liveness passes: one byte per temp plus
           one per indirect temp. */
        uint8_t *temp_state = tcg_malloc(s->nb_temps + s->nb_indirects);

        liveness_pass_1(s, temp_state);

        if (s->nb_indirects > 0) {
#ifdef DEBUG_DISAS
            if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND)
                         && qemu_log_in_addr_range(tb->pc))) {
                qemu_log_lock();
                qemu_log("OP before indirect lowering:\n");
                tcg_dump_ops(s);
                qemu_log("\n");
                qemu_log_unlock();
            }
#endif
            /* Replace indirect temps with direct temps.  */
            if (liveness_pass_2(s, temp_state)) {
                /* If changes were made, re-run liveness.  */
                liveness_pass_1(s, temp_state);
            }
        }
    }

#ifdef CONFIG_PROFILER
    s->la_time += profile_getclock();
#endif

#ifdef DEBUG_DISAS
    if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT)
                 && qemu_log_in_addr_range(tb->pc))) {
        qemu_log_lock();
        qemu_log("OP after optimization and liveness analysis:\n");
        tcg_dump_ops(s);
        qemu_log("\n");
        qemu_log_unlock();
    }
#endif

    tcg_reg_alloc_start(s);

    /* Code is emitted starting at the TB's own code pointer. */
    s->code_buf = tb->tc.ptr;
    s->code_ptr = tb->tc.ptr;

#ifdef TCG_TARGET_NEED_LDST_LABELS
    s->ldst_labels = NULL;
#endif
#ifdef TCG_TARGET_NEED_POOL_LABELS
    s->pool_labels = NULL;
#endif

    /* Index of the guest instruction being translated; stays -1 until the
       first insn_start op is seen. */
    num_insns = -1;
    /* Walk the op list through its 'next' links; index 0 serves as both
       the list head and the end marker. */
    for (oi = s->gen_op_buf[0].next; oi != 0; oi = oi_next) {
        TCGOp * const op = &s->gen_op_buf[oi];
        TCGArg * const args = &s->gen_opparam_buf[op->args];
        TCGOpcode opc = op->opc;
        const TCGOpDef *def = &tcg_op_defs[opc];
        TCGLifeData arg_life = op->life;

        /* The successor is read before the op is processed. */
        oi_next = op->next;
#ifdef CONFIG_PROFILER
        tcg_table_op_count[opc]++;
#endif

        switch (opc) {
        case INDEX_op_mov_i32:
        case INDEX_op_mov_i64:
            tcg_reg_alloc_mov(s, def, args, arg_life);
            break;
        case INDEX_op_movi_i32:
        case INDEX_op_movi_i64:
            tcg_reg_alloc_movi(s, args, arg_life);
            break;
        case INDEX_op_insn_start:
            /* Close the previous guest instruction (if any) by recording
               the code size reached so far, then open the next one. */
            if (num_insns >= 0) {
                s->gen_insn_end_off[num_insns] = tcg_current_code_size(s);
            }
            num_insns++;
            for (i = 0; i < TARGET_INSN_START_WORDS; ++i) {
                target_ulong a;
                /* When a target word is wider than a host register, each
                   word arrives as two args: low half at 2*i, high half at
                   2*i + 1. */
#if TARGET_LONG_BITS > TCG_TARGET_REG_BITS
                a = ((target_ulong)args[i * 2 + 1] << 32) | args[i * 2];
#else
                a = args[i];
#endif
                s->gen_insn_data[num_insns][i] = a;
            }
            break;
        case INDEX_op_discard:
            temp_dead(s, &s->temps[args[0]]);
            break;
        case INDEX_op_set_label:
            /* A label ends the basic block: run the end-of-block register
               handling before binding the label to the current code
               pointer. */
            tcg_reg_alloc_bb_end(s, s->reserved_regs);
            tcg_out_label(s, arg_label(args[0]), s->code_ptr);
            break;
        case INDEX_op_call:
            tcg_reg_alloc_call(s, op->callo, op->calli, args, arg_life);
            break;
        default:
            /* Sanity check that we've not introduced any unhandled opcodes. */
            tcg_debug_assert(tcg_op_supported(opc));
            /* Note: in order to speed up the code, it would be much
               faster to have specialized register allocator functions for
               some common argument patterns */
            tcg_reg_alloc_op(s, def, opc, args, arg_life);
            break;
        }
#ifdef CONFIG_DEBUG_TCG
        check_regs(s);
#endif
        /* Test for (pending) buffer overflow.  The assumption is that any
           one operation beginning below the high water mark cannot overrun
           the buffer completely.  Thus we can test for overflow after
           generating code without having to check during generation.  */
        if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) {
            return -1;
        }
    }
    /* At least one insn_start op must have been seen; close the last
       guest instruction. */
    tcg_debug_assert(num_insns >= 0);
    s->gen_insn_end_off[num_insns] = tcg_current_code_size(s);

    /* Generate TB finalization at the end of block */
#ifdef TCG_TARGET_NEED_LDST_LABELS
    if (!tcg_out_ldst_finalize(s)) {
        return -1;
    }
#endif
#ifdef TCG_TARGET_NEED_POOL_LABELS
    if (!tcg_out_pool_finalize(s)) {
        return -1;
    }
#endif

    /* flush instruction cache */
    flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr);

    return tcg_current_code_size(s);
}
(uintptr_t)s->code_ptr); 29352aeabc08SStefan Weil 29361813e175SRichard Henderson return tcg_current_code_size(s); 2937c896fe29Sbellard } 2938c896fe29Sbellard 2939a23a9ec6Sbellard #ifdef CONFIG_PROFILER 2940405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 2941a23a9ec6Sbellard { 2942a23a9ec6Sbellard TCGContext *s = &tcg_ctx; 2943fca8a500SRichard Henderson int64_t tb_count = s->tb_count; 2944fca8a500SRichard Henderson int64_t tb_div_count = tb_count ? tb_count : 1; 2945fca8a500SRichard Henderson int64_t tot = s->interm_time + s->code_time; 2946a23a9ec6Sbellard 2947a23a9ec6Sbellard cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n", 2948a23a9ec6Sbellard tot, tot / 2.4e9); 2949a23a9ec6Sbellard cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n", 2950fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 2951fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 2952fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 2953a23a9ec6Sbellard cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n", 2954fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 2955a23a9ec6Sbellard cpu_fprintf(f, "deleted ops/TB %0.2f\n", 2956fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 2957a23a9ec6Sbellard cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n", 2958fca8a500SRichard Henderson (double)s->temp_count / tb_div_count, s->temp_count_max); 2959fca8a500SRichard Henderson cpu_fprintf(f, "avg host code/TB %0.1f\n", 2960fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 2961fca8a500SRichard Henderson cpu_fprintf(f, "avg search data/TB %0.1f\n", 2962fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 2963a23a9ec6Sbellard 2964a23a9ec6Sbellard cpu_fprintf(f, "cycles/op %0.1f\n", 2965a23a9ec6Sbellard s->op_count ? 
(double)tot / s->op_count : 0); 2966a23a9ec6Sbellard cpu_fprintf(f, "cycles/in byte %0.1f\n", 2967a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 2968a23a9ec6Sbellard cpu_fprintf(f, "cycles/out byte %0.1f\n", 2969a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 2970fca8a500SRichard Henderson cpu_fprintf(f, "cycles/search byte %0.1f\n", 2971fca8a500SRichard Henderson s->search_out_len ? (double)tot / s->search_out_len : 0); 2972fca8a500SRichard Henderson if (tot == 0) { 2973a23a9ec6Sbellard tot = 1; 2974fca8a500SRichard Henderson } 2975a23a9ec6Sbellard cpu_fprintf(f, " gen_interm time %0.1f%%\n", 2976a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 2977a23a9ec6Sbellard cpu_fprintf(f, " gen_code time %0.1f%%\n", 2978a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 2979c5cc28ffSAurelien Jarno cpu_fprintf(f, "optim./code time %0.1f%%\n", 2980c5cc28ffSAurelien Jarno (double)s->opt_time / (s->code_time ? s->code_time : 1) 2981c5cc28ffSAurelien Jarno * 100.0); 2982a23a9ec6Sbellard cpu_fprintf(f, "liveness/code time %0.1f%%\n", 2983a23a9ec6Sbellard (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0); 2984a23a9ec6Sbellard cpu_fprintf(f, "cpu_restore count %" PRId64 "\n", 2985a23a9ec6Sbellard s->restore_count); 2986a23a9ec6Sbellard cpu_fprintf(f, " avg cycles %0.1f\n", 2987a23a9ec6Sbellard s->restore_count ? 
#ifdef ELF_HOST_MACHINE
/* In order to use this feature, the backend needs to do three things:

   (1) Define ELF_HOST_MACHINE to indicate both what value to
       put into the ELF image and to indicate support for the feature.

   (2) Define tcg_register_jit.  This should create a buffer containing
       the contents of a .debug_frame section that describes the post-
       prologue unwind info for the tcg machine.

   (3) Call tcg_register_jit_int, with the constructed .debug_frame.
*/

/* Begin GDB interface.  THE FOLLOWING MUST MATCH GDB DOCS.
   The type layouts and the two symbol names below are dictated by the
   debugger, so nothing here should be renamed, reordered or resized. */

/* Values stored in jit_descriptor.action_flag. */
typedef enum {
    JIT_NOACTION = 0,
    JIT_REGISTER_FN,
    JIT_UNREGISTER_FN
} jit_actions_t;

/* One registered in-memory symbol file, as a node of a doubly linked
   list.  symfile_addr/symfile_size describe the image itself. */
struct jit_code_entry {
    struct jit_code_entry *next_entry;
    struct jit_code_entry *prev_entry;
    const void *symfile_addr;
    uint64_t symfile_size;
};

/* Root object describing the pending action and the list of entries. */
struct jit_descriptor {
    uint32_t version;
    uint32_t action_flag;       /* a jit_actions_t value */
    struct jit_code_entry *relevant_entry;
    struct jit_code_entry *first_entry;
};

/* Deliberately empty, never-inlined function that is called after the
   descriptor has been updated.  Presumably the debugger places a
   breakpoint on it to notice the update -- see the GDB JIT interface
   documentation. */
void __jit_debug_register_code(void) __attribute__((noinline));
void __jit_debug_register_code(void)
{
    asm("");
}

/* Must statically initialize the version, because GDB may check
   the version before we can set it.  */
struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 };

/* End GDB interface.  */
/*
 * Look up @str in the ELF-style string table @strtab.
 *
 * The table is a sequence of NUL-terminated names.  Byte 0 is the leading
 * empty name, so the scan starts at offset 1.  The table must be followed
 * by an empty entry (at least one extra NUL after the last name), which
 * is what marks its end.
 *
 * Returns the byte offset of the first entry equal to @str.  If the end
 * of the table is reached without a match, returns 0, the offset of the
 * empty name, instead of reading past the table.
 */
static int find_string(const char *strtab, const char *str)
{
    const char *p = strtab + 1;

    while (1) {
        if (strcmp(p, str) == 0) {
            return (int)(p - strtab);
        }
        if (*p == '\0') {
            /* Empty entry: end of table, @str is not present. */
            return 0;
        }
        p += strlen(p) + 1;
    }
}
30825872bbf2SRichard Henderson }; 30835872bbf2SRichard Henderson 30845872bbf2SRichard Henderson struct ElfImage *img; 30855872bbf2SRichard Henderson 30865872bbf2SRichard Henderson static const struct ElfImage img_template = { 30875872bbf2SRichard Henderson .ehdr = { 30885872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 30895872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 30905872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 30915872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 30925872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 30935872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 30945872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 30955872bbf2SRichard Henderson .e_type = ET_EXEC, 30965872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 30975872bbf2SRichard Henderson .e_version = EV_CURRENT, 30985872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 30995872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 31005872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 31015872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 31025872bbf2SRichard Henderson .e_phnum = 1, 31035872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 31045872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 31055872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 3106abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 3107abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 3108abbb3eaeSRichard Henderson #endif 3109abbb3eaeSRichard Henderson #ifdef ELF_OSABI 3110abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 3111abbb3eaeSRichard Henderson #endif 31125872bbf2SRichard Henderson }, 31135872bbf2SRichard Henderson .phdr = { 31145872bbf2SRichard Henderson .p_type = PT_LOAD, 31155872bbf2SRichard Henderson .p_flags = PF_X, 31165872bbf2SRichard Henderson }, 31175872bbf2SRichard Henderson .shdr = { 31185872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 
31195872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 31205872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 31215872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 31225872bbf2SRichard Henderson will not look for contents. We can record any address. */ 31235872bbf2SRichard Henderson [1] = { /* .text */ 31245872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 31255872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 31265872bbf2SRichard Henderson }, 31275872bbf2SRichard Henderson [2] = { /* .debug_info */ 31285872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 31295872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 31305872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 31315872bbf2SRichard Henderson }, 31325872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 31335872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 31345872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 31355872bbf2SRichard Henderson .sh_size = sizeof(img->da), 31365872bbf2SRichard Henderson }, 31375872bbf2SRichard Henderson [4] = { /* .debug_frame */ 31385872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 31395872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 31405872bbf2SRichard Henderson }, 31415872bbf2SRichard Henderson [5] = { /* .symtab */ 31425872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 31435872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 31445872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 31455872bbf2SRichard Henderson .sh_info = 1, 31465872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 31475872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 31485872bbf2SRichard Henderson }, 31495872bbf2SRichard Henderson [6] = { /* .strtab */ 31505872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 31515872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, 
str), 31525872bbf2SRichard Henderson .sh_size = sizeof(img->str), 31535872bbf2SRichard Henderson } 31545872bbf2SRichard Henderson }, 31555872bbf2SRichard Henderson .sym = { 31565872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 31575872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 31585872bbf2SRichard Henderson .st_shndx = 1, 31595872bbf2SRichard Henderson } 31605872bbf2SRichard Henderson }, 31615872bbf2SRichard Henderson .di = { 31625872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 31635872bbf2SRichard Henderson .version = 2, 31645872bbf2SRichard Henderson .ptr_size = sizeof(void *), 31655872bbf2SRichard Henderson .cu_die = 1, 31665872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 31675872bbf2SRichard Henderson .fn_die = 2, 31685872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 31695872bbf2SRichard Henderson }, 31705872bbf2SRichard Henderson .da = { 31715872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 31725872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 31735872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 31745872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 31755872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 31765872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 31775872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 31785872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 31795872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 31805872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 31815872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 31825872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 31835872bbf2SRichard Henderson 0 /* no more abbrev */ 31845872bbf2SRichard Henderson }, 31855872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 31865872bbf2SRichard Henderson 
".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 3187813da627SRichard Henderson }; 3188813da627SRichard Henderson 3189813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 3190813da627SRichard Henderson static struct jit_code_entry one_entry; 3191813da627SRichard Henderson 31925872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 3193813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 31942c90784aSRichard Henderson DebugFrameHeader *dfh; 3195813da627SRichard Henderson 31965872bbf2SRichard Henderson img = g_malloc(img_size); 31975872bbf2SRichard Henderson *img = img_template; 3198813da627SRichard Henderson 31995872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 32005872bbf2SRichard Henderson img->phdr.p_paddr = buf; 32015872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 3202813da627SRichard Henderson 32035872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 32045872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 32055872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 3206813da627SRichard Henderson 32075872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 32085872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 32095872bbf2SRichard Henderson 32105872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 32115872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 32125872bbf2SRichard Henderson 32135872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 32145872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 32155872bbf2SRichard Henderson 32165872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 32175872bbf2SRichard Henderson img->sym[1].st_value = buf; 32185872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 
32195872bbf2SRichard Henderson 32205872bbf2SRichard Henderson img->di.cu_low_pc = buf; 322145aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 32225872bbf2SRichard Henderson img->di.fn_low_pc = buf; 322345aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 3224813da627SRichard Henderson 32252c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 32262c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 32272c90784aSRichard Henderson dfh->fde.func_start = buf; 32282c90784aSRichard Henderson dfh->fde.func_len = buf_size; 32292c90784aSRichard Henderson 3230813da627SRichard Henderson #ifdef DEBUG_JIT 3231813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 3232813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 3233813da627SRichard Henderson { 3234813da627SRichard Henderson FILE *f = fopen("/tmp/qemu.jit", "w+b"); 3235813da627SRichard Henderson if (f) { 32365872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 3237813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. */ 3238813da627SRichard Henderson } 3239813da627SRichard Henderson fclose(f); 3240813da627SRichard Henderson } 3241813da627SRichard Henderson } 3242813da627SRichard Henderson #endif 3243813da627SRichard Henderson 3244813da627SRichard Henderson one_entry.symfile_addr = img; 3245813da627SRichard Henderson one_entry.symfile_size = img_size; 3246813da627SRichard Henderson 3247813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 3248813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 3249813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 3250813da627SRichard Henderson __jit_debug_register_code(); 3251813da627SRichard Henderson } 3252813da627SRichard Henderson #else 32535872bbf2SRichard Henderson /* No support for the feature. 
Provide the entry point expected by exec.c, 32545872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 3255813da627SRichard Henderson 3256813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 32572c90784aSRichard Henderson const void *debug_frame, 32582c90784aSRichard Henderson size_t debug_frame_size) 3259813da627SRichard Henderson { 3260813da627SRichard Henderson } 3261813da627SRichard Henderson 3262813da627SRichard Henderson void tcg_register_jit(void *buf, size_t buf_size) 3263813da627SRichard Henderson { 3264813da627SRichard Henderson } 3265813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 3266