1c896fe29Sbellard /* 2c896fe29Sbellard * Tiny Code Generator for QEMU 3c896fe29Sbellard * 4c896fe29Sbellard * Copyright (c) 2008 Fabrice Bellard 5c896fe29Sbellard * 6c896fe29Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7c896fe29Sbellard * of this software and associated documentation files (the "Software"), to deal 8c896fe29Sbellard * in the Software without restriction, including without limitation the rights 9c896fe29Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10c896fe29Sbellard * copies of the Software, and to permit persons to whom the Software is 11c896fe29Sbellard * furnished to do so, subject to the following conditions: 12c896fe29Sbellard * 13c896fe29Sbellard * The above copyright notice and this permission notice shall be included in 14c896fe29Sbellard * all copies or substantial portions of the Software. 15c896fe29Sbellard * 16c896fe29Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17c896fe29Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18c896fe29Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19c896fe29Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20c896fe29Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21c896fe29Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22c896fe29Sbellard * THE SOFTWARE. 23c896fe29Sbellard */ 24c896fe29Sbellard 25c896fe29Sbellard /* define it to use liveness analysis (better code) */ 268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS 27c896fe29Sbellard 28757e725bSPeter Maydell #include "qemu/osdep.h" 29cca82982Saurel32 30813da627SRichard Henderson /* Define to dump the ELF file used to communicate with GDB. */ 31813da627SRichard Henderson #undef DEBUG_JIT 32813da627SRichard Henderson 3372fd2efbSEmilio G. 
Cota #include "qemu/error-report.h" 34f348b6d1SVeronia Bahaa #include "qemu/cutils.h" 351de7afc9SPaolo Bonzini #include "qemu/host-utils.h" 361de7afc9SPaolo Bonzini #include "qemu/timer.h" 37c896fe29Sbellard 38c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU 39c896fe29Sbellard CPU definitions. Currently they are used for qemu_ld/st 40c896fe29Sbellard instructions */ 41c896fe29Sbellard #define NO_CPU_IO_DEFS 42c896fe29Sbellard #include "cpu.h" 43c896fe29Sbellard 4463c91552SPaolo Bonzini #include "exec/cpu-common.h" 4563c91552SPaolo Bonzini #include "exec/exec-all.h" 4663c91552SPaolo Bonzini 47c896fe29Sbellard #include "tcg-op.h" 48813da627SRichard Henderson 49edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX 50813da627SRichard Henderson # define ELF_CLASS ELFCLASS32 51edee2579SRichard Henderson #else 52edee2579SRichard Henderson # define ELF_CLASS ELFCLASS64 53813da627SRichard Henderson #endif 54813da627SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 55813da627SRichard Henderson # define ELF_DATA ELFDATA2MSB 56813da627SRichard Henderson #else 57813da627SRichard Henderson # define ELF_DATA ELFDATA2LSB 58813da627SRichard Henderson #endif 59813da627SRichard Henderson 60c896fe29Sbellard #include "elf.h" 61508127e2SPaolo Bonzini #include "exec/log.h" 623468b59eSEmilio G. Cota #include "sysemu/sysemu.h" 63c896fe29Sbellard 64ce151109SPeter Maydell /* Forward declarations for functions declared in tcg-target.inc.c and 65ce151109SPeter Maydell used here. 
*/ 66e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s); 67f69d277eSRichard Henderson static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode); 68e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s); 696ac17786SRichard Henderson static bool patch_reloc(tcg_insn_unit *code_ptr, int type, 702ba7fae2SRichard Henderson intptr_t value, intptr_t addend); 71c896fe29Sbellard 72497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts. */ 73497a22ebSRichard Henderson typedef struct { 74497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 75497a22ebSRichard Henderson uint32_t id; 76497a22ebSRichard Henderson uint8_t version; 77497a22ebSRichard Henderson char augmentation[1]; 78497a22ebSRichard Henderson uint8_t code_align; 79497a22ebSRichard Henderson uint8_t data_align; 80497a22ebSRichard Henderson uint8_t return_column; 81497a22ebSRichard Henderson } DebugFrameCIE; 82497a22ebSRichard Henderson 83497a22ebSRichard Henderson typedef struct QEMU_PACKED { 84497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 85497a22ebSRichard Henderson uint32_t cie_offset; 86edee2579SRichard Henderson uintptr_t func_start; 87edee2579SRichard Henderson uintptr_t func_len; 88497a22ebSRichard Henderson } DebugFrameFDEHeader; 89497a22ebSRichard Henderson 902c90784aSRichard Henderson typedef struct QEMU_PACKED { 912c90784aSRichard Henderson DebugFrameCIE cie; 922c90784aSRichard Henderson DebugFrameFDEHeader fde; 932c90784aSRichard Henderson } DebugFrameHeader; 942c90784aSRichard Henderson 95813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 962c90784aSRichard Henderson const void *debug_frame, 972c90784aSRichard Henderson size_t debug_frame_size) 98813da627SRichard Henderson __attribute__((unused)); 99813da627SRichard Henderson 100ce151109SPeter Maydell /* Forward declarations for functions declared and used in 
tcg-target.inc.c. */ 101069ea736SRichard Henderson static const char *target_parse_constraint(TCGArgConstraint *ct, 102069ea736SRichard Henderson const char *ct_str, TCGType type); 1032a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1, 104a05b5b9bSRichard Henderson intptr_t arg2); 1052a534affSRichard Henderson static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg); 106c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type, 1072a534affSRichard Henderson TCGReg ret, tcg_target_long arg); 108c0ad3001SStefan Weil static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args, 109c0ad3001SStefan Weil const int *const_args); 110d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec 111d2fd745fSRichard Henderson static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl, 112d2fd745fSRichard Henderson unsigned vece, const TCGArg *args, 113d2fd745fSRichard Henderson const int *const_args); 114d2fd745fSRichard Henderson #else 115d2fd745fSRichard Henderson static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl, 116d2fd745fSRichard Henderson unsigned vece, const TCGArg *args, 117d2fd745fSRichard Henderson const int *const_args) 118d2fd745fSRichard Henderson { 119d2fd745fSRichard Henderson g_assert_not_reached(); 120d2fd745fSRichard Henderson } 121d2fd745fSRichard Henderson #endif 1222a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, 123a05b5b9bSRichard Henderson intptr_t arg2); 12459d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val, 12559d7c14eSRichard Henderson TCGReg base, intptr_t ofs); 126cf066674SRichard Henderson static void tcg_out_call(TCGContext *s, tcg_insn_unit *target); 127f6c6afc1SRichard Henderson static int tcg_target_const_match(tcg_target_long val, TCGType type, 128c0ad3001SStefan Weil const TCGArgConstraint *arg_ct); 129659ef5cbSRichard 
Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 130659ef5cbSRichard Henderson static bool tcg_out_ldst_finalize(TCGContext *s); 131659ef5cbSRichard Henderson #endif 132c896fe29Sbellard 133a505785cSEmilio G. Cota #define TCG_HIGHWATER 1024 134a505785cSEmilio G. Cota 135df2cce29SEmilio G. Cota static TCGContext **tcg_ctxs; 136df2cce29SEmilio G. Cota static unsigned int n_tcg_ctxs; 1371c2adb95SRichard Henderson TCGv_env cpu_env = 0; 138df2cce29SEmilio G. Cota 139be2cdc5eSEmilio G. Cota struct tcg_region_tree { 140be2cdc5eSEmilio G. Cota QemuMutex lock; 141be2cdc5eSEmilio G. Cota GTree *tree; 142be2cdc5eSEmilio G. Cota /* padding to avoid false sharing is computed at run-time */ 143be2cdc5eSEmilio G. Cota }; 144be2cdc5eSEmilio G. Cota 145e8feb96fSEmilio G. Cota /* 146e8feb96fSEmilio G. Cota * We divide code_gen_buffer into equally-sized "regions" that TCG threads 147e8feb96fSEmilio G. Cota * dynamically allocate from as demand dictates. Given appropriate region 148e8feb96fSEmilio G. Cota * sizing, this minimizes flushes even when some TCG threads generate a lot 149e8feb96fSEmilio G. Cota * more code than others. 150e8feb96fSEmilio G. Cota */ 151e8feb96fSEmilio G. Cota struct tcg_region_state { 152e8feb96fSEmilio G. Cota QemuMutex lock; 153e8feb96fSEmilio G. Cota 154e8feb96fSEmilio G. Cota /* fields set at init time */ 155e8feb96fSEmilio G. Cota void *start; 156e8feb96fSEmilio G. Cota void *start_aligned; 157e8feb96fSEmilio G. Cota void *end; 158e8feb96fSEmilio G. Cota size_t n; 159e8feb96fSEmilio G. Cota size_t size; /* size of one region */ 160e8feb96fSEmilio G. Cota size_t stride; /* .size + guard size */ 161e8feb96fSEmilio G. Cota 162e8feb96fSEmilio G. Cota /* fields protected by the lock */ 163e8feb96fSEmilio G. Cota size_t current; /* current region index */ 164e8feb96fSEmilio G. Cota size_t agg_size_full; /* aggregate size of full regions */ 165e8feb96fSEmilio G. Cota }; 166e8feb96fSEmilio G. Cota 167e8feb96fSEmilio G. 
Cota static struct tcg_region_state region; 168be2cdc5eSEmilio G. Cota /* 169be2cdc5eSEmilio G. Cota * This is an array of struct tcg_region_tree's, with padding. 170be2cdc5eSEmilio G. Cota * We use void * to simplify the computation of region_trees[i]; each 171be2cdc5eSEmilio G. Cota * struct is found every tree_size bytes. 172be2cdc5eSEmilio G. Cota */ 173be2cdc5eSEmilio G. Cota static void *region_trees; 174be2cdc5eSEmilio G. Cota static size_t tree_size; 175d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT]; 176b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 177c896fe29Sbellard 1781813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1794196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 180c896fe29Sbellard { 181c896fe29Sbellard *s->code_ptr++ = v; 182c896fe29Sbellard } 183c896fe29Sbellard 1844196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1854196dca6SPeter Maydell uint8_t v) 1865c53bb81SPeter Maydell { 1871813e175SRichard Henderson *p = v; 1885c53bb81SPeter Maydell } 1891813e175SRichard Henderson #endif 1905c53bb81SPeter Maydell 1911813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1924196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 193c896fe29Sbellard { 1941813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1951813e175SRichard Henderson *s->code_ptr++ = v; 1961813e175SRichard Henderson } else { 1971813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1984387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1991813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 2001813e175SRichard Henderson } 201c896fe29Sbellard } 202c896fe29Sbellard 2034196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 2044196dca6SPeter Maydell uint16_t v) 2055c53bb81SPeter Maydell { 
2061813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 2071813e175SRichard Henderson *p = v; 2081813e175SRichard Henderson } else { 2095c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2105c53bb81SPeter Maydell } 2111813e175SRichard Henderson } 2121813e175SRichard Henderson #endif 2135c53bb81SPeter Maydell 2141813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 2154196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 216c896fe29Sbellard { 2171813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2181813e175SRichard Henderson *s->code_ptr++ = v; 2191813e175SRichard Henderson } else { 2201813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2214387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2221813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 2231813e175SRichard Henderson } 224c896fe29Sbellard } 225c896fe29Sbellard 2264196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 2274196dca6SPeter Maydell uint32_t v) 2285c53bb81SPeter Maydell { 2291813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2301813e175SRichard Henderson *p = v; 2311813e175SRichard Henderson } else { 2325c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2335c53bb81SPeter Maydell } 2341813e175SRichard Henderson } 2351813e175SRichard Henderson #endif 2365c53bb81SPeter Maydell 2371813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 2384196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 239ac26eb69SRichard Henderson { 2401813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2411813e175SRichard Henderson *s->code_ptr++ = v; 2421813e175SRichard Henderson } else { 2431813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2444387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2451813e175SRichard Henderson s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE); 2461813e175SRichard 
Henderson } 247ac26eb69SRichard Henderson } 248ac26eb69SRichard Henderson 2494196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 2504196dca6SPeter Maydell uint64_t v) 2515c53bb81SPeter Maydell { 2521813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2531813e175SRichard Henderson *p = v; 2541813e175SRichard Henderson } else { 2555c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2565c53bb81SPeter Maydell } 2571813e175SRichard Henderson } 2581813e175SRichard Henderson #endif 2595c53bb81SPeter Maydell 260c896fe29Sbellard /* label relocation processing */ 261c896fe29Sbellard 2621813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 263bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 264c896fe29Sbellard { 265c896fe29Sbellard TCGRelocation *r; 266c896fe29Sbellard 267c896fe29Sbellard if (l->has_value) { 268623e265cSpbrook /* FIXME: This may break relocations on RISC targets that 269623e265cSpbrook modify instruction fields in place. The caller may not have 270623e265cSpbrook written the initial value. 
*/ 2716ac17786SRichard Henderson bool ok = patch_reloc(code_ptr, type, l->u.value, addend); 2726ac17786SRichard Henderson tcg_debug_assert(ok); 273c896fe29Sbellard } else { 274c896fe29Sbellard /* add a new relocation entry */ 275c896fe29Sbellard r = tcg_malloc(sizeof(TCGRelocation)); 276c896fe29Sbellard r->type = type; 277c896fe29Sbellard r->ptr = code_ptr; 278c896fe29Sbellard r->addend = addend; 279c896fe29Sbellard r->next = l->u.first_reloc; 280c896fe29Sbellard l->u.first_reloc = r; 281c896fe29Sbellard } 282c896fe29Sbellard } 283c896fe29Sbellard 284bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr) 285c896fe29Sbellard { 2862ba7fae2SRichard Henderson intptr_t value = (intptr_t)ptr; 2871813e175SRichard Henderson TCGRelocation *r; 288c896fe29Sbellard 289eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 2901813e175SRichard Henderson 2911813e175SRichard Henderson for (r = l->u.first_reloc; r != NULL; r = r->next) { 2926ac17786SRichard Henderson bool ok = patch_reloc(r->ptr, r->type, value, r->addend); 2936ac17786SRichard Henderson tcg_debug_assert(ok); 294c896fe29Sbellard } 2951813e175SRichard Henderson 296c896fe29Sbellard l->has_value = 1; 2971813e175SRichard Henderson l->u.value_ptr = ptr; 298c896fe29Sbellard } 299c896fe29Sbellard 30042a268c2SRichard Henderson TCGLabel *gen_new_label(void) 301c896fe29Sbellard { 302b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 30351e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 304c896fe29Sbellard 30551e3972cSRichard Henderson *l = (TCGLabel){ 30651e3972cSRichard Henderson .id = s->nb_labels++ 30751e3972cSRichard Henderson }; 30842a268c2SRichard Henderson 30942a268c2SRichard Henderson return l; 310c896fe29Sbellard } 311c896fe29Sbellard 3129f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which) 3139f754620SRichard Henderson { 3149f754620SRichard Henderson size_t off = tcg_current_code_size(s); 3159f754620SRichard Henderson s->tb_jmp_reset_offset[which] = off; 3169f754620SRichard Henderson /* Make sure that we didn't overflow the stored offset. */ 3179f754620SRichard Henderson assert(s->tb_jmp_reset_offset[which] == off); 3189f754620SRichard Henderson } 3199f754620SRichard Henderson 320ce151109SPeter Maydell #include "tcg-target.inc.c" 321c896fe29Sbellard 322be2cdc5eSEmilio G. Cota /* compare a pointer @ptr and a tb_tc @s */ 323be2cdc5eSEmilio G. Cota static int ptr_cmp_tb_tc(const void *ptr, const struct tb_tc *s) 324be2cdc5eSEmilio G. Cota { 325be2cdc5eSEmilio G. Cota if (ptr >= s->ptr + s->size) { 326be2cdc5eSEmilio G. Cota return 1; 327be2cdc5eSEmilio G. Cota } else if (ptr < s->ptr) { 328be2cdc5eSEmilio G. Cota return -1; 329be2cdc5eSEmilio G. Cota } 330be2cdc5eSEmilio G. Cota return 0; 331be2cdc5eSEmilio G. Cota } 332be2cdc5eSEmilio G. Cota 333be2cdc5eSEmilio G. Cota static gint tb_tc_cmp(gconstpointer ap, gconstpointer bp) 334be2cdc5eSEmilio G. Cota { 335be2cdc5eSEmilio G. Cota const struct tb_tc *a = ap; 336be2cdc5eSEmilio G. Cota const struct tb_tc *b = bp; 337be2cdc5eSEmilio G. Cota 338be2cdc5eSEmilio G. Cota /* 339be2cdc5eSEmilio G. Cota * When both sizes are set, we know this isn't a lookup. 340be2cdc5eSEmilio G. Cota * This is the most likely case: every TB must be inserted; lookups 341be2cdc5eSEmilio G. Cota * are a lot less frequent. 342be2cdc5eSEmilio G. Cota */ 343be2cdc5eSEmilio G. 
Cota if (likely(a->size && b->size)) { 344be2cdc5eSEmilio G. Cota if (a->ptr > b->ptr) { 345be2cdc5eSEmilio G. Cota return 1; 346be2cdc5eSEmilio G. Cota } else if (a->ptr < b->ptr) { 347be2cdc5eSEmilio G. Cota return -1; 348be2cdc5eSEmilio G. Cota } 349be2cdc5eSEmilio G. Cota /* a->ptr == b->ptr should happen only on deletions */ 350be2cdc5eSEmilio G. Cota g_assert(a->size == b->size); 351be2cdc5eSEmilio G. Cota return 0; 352be2cdc5eSEmilio G. Cota } 353be2cdc5eSEmilio G. Cota /* 354be2cdc5eSEmilio G. Cota * All lookups have either .size field set to 0. 355be2cdc5eSEmilio G. Cota * From the glib sources we see that @ap is always the lookup key. However 356be2cdc5eSEmilio G. Cota * the docs provide no guarantee, so we just mark this case as likely. 357be2cdc5eSEmilio G. Cota */ 358be2cdc5eSEmilio G. Cota if (likely(a->size == 0)) { 359be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(a->ptr, b); 360be2cdc5eSEmilio G. Cota } 361be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(b->ptr, a); 362be2cdc5eSEmilio G. Cota } 363be2cdc5eSEmilio G. Cota 364be2cdc5eSEmilio G. Cota static void tcg_region_trees_init(void) 365be2cdc5eSEmilio G. Cota { 366be2cdc5eSEmilio G. Cota size_t i; 367be2cdc5eSEmilio G. Cota 368be2cdc5eSEmilio G. Cota tree_size = ROUND_UP(sizeof(struct tcg_region_tree), qemu_dcache_linesize); 369be2cdc5eSEmilio G. Cota region_trees = qemu_memalign(qemu_dcache_linesize, region.n * tree_size); 370be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 371be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 372be2cdc5eSEmilio G. Cota 373be2cdc5eSEmilio G. Cota qemu_mutex_init(&rt->lock); 374be2cdc5eSEmilio G. Cota rt->tree = g_tree_new(tb_tc_cmp); 375be2cdc5eSEmilio G. Cota } 376be2cdc5eSEmilio G. Cota } 377be2cdc5eSEmilio G. Cota 378be2cdc5eSEmilio G. Cota static struct tcg_region_tree *tc_ptr_to_region_tree(void *p) 379be2cdc5eSEmilio G. Cota { 380be2cdc5eSEmilio G. Cota size_t region_idx; 381be2cdc5eSEmilio G. Cota 382be2cdc5eSEmilio G. 
Cota if (p < region.start_aligned) { 383be2cdc5eSEmilio G. Cota region_idx = 0; 384be2cdc5eSEmilio G. Cota } else { 385be2cdc5eSEmilio G. Cota ptrdiff_t offset = p - region.start_aligned; 386be2cdc5eSEmilio G. Cota 387be2cdc5eSEmilio G. Cota if (offset > region.stride * (region.n - 1)) { 388be2cdc5eSEmilio G. Cota region_idx = region.n - 1; 389be2cdc5eSEmilio G. Cota } else { 390be2cdc5eSEmilio G. Cota region_idx = offset / region.stride; 391be2cdc5eSEmilio G. Cota } 392be2cdc5eSEmilio G. Cota } 393be2cdc5eSEmilio G. Cota return region_trees + region_idx * tree_size; 394be2cdc5eSEmilio G. Cota } 395be2cdc5eSEmilio G. Cota 396be2cdc5eSEmilio G. Cota void tcg_tb_insert(TranslationBlock *tb) 397be2cdc5eSEmilio G. Cota { 398be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 399be2cdc5eSEmilio G. Cota 400be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 401be2cdc5eSEmilio G. Cota g_tree_insert(rt->tree, &tb->tc, tb); 402be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 403be2cdc5eSEmilio G. Cota } 404be2cdc5eSEmilio G. Cota 405be2cdc5eSEmilio G. Cota void tcg_tb_remove(TranslationBlock *tb) 406be2cdc5eSEmilio G. Cota { 407be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 408be2cdc5eSEmilio G. Cota 409be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 410be2cdc5eSEmilio G. Cota g_tree_remove(rt->tree, &tb->tc); 411be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 412be2cdc5eSEmilio G. Cota } 413be2cdc5eSEmilio G. Cota 414be2cdc5eSEmilio G. Cota /* 415be2cdc5eSEmilio G. Cota * Find the TB 'tb' such that 416be2cdc5eSEmilio G. Cota * tb->tc.ptr <= tc_ptr < tb->tc.ptr + tb->tc.size 417be2cdc5eSEmilio G. Cota * Return NULL if not found. 418be2cdc5eSEmilio G. Cota */ 419be2cdc5eSEmilio G. Cota TranslationBlock *tcg_tb_lookup(uintptr_t tc_ptr) 420be2cdc5eSEmilio G. Cota { 421be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree((void *)tc_ptr); 422be2cdc5eSEmilio G. 
Cota TranslationBlock *tb; 423be2cdc5eSEmilio G. Cota struct tb_tc s = { .ptr = (void *)tc_ptr }; 424be2cdc5eSEmilio G. Cota 425be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 426be2cdc5eSEmilio G. Cota tb = g_tree_lookup(rt->tree, &s); 427be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 428be2cdc5eSEmilio G. Cota return tb; 429be2cdc5eSEmilio G. Cota } 430be2cdc5eSEmilio G. Cota 431be2cdc5eSEmilio G. Cota static void tcg_region_tree_lock_all(void) 432be2cdc5eSEmilio G. Cota { 433be2cdc5eSEmilio G. Cota size_t i; 434be2cdc5eSEmilio G. Cota 435be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 436be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 437be2cdc5eSEmilio G. Cota 438be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 439be2cdc5eSEmilio G. Cota } 440be2cdc5eSEmilio G. Cota } 441be2cdc5eSEmilio G. Cota 442be2cdc5eSEmilio G. Cota static void tcg_region_tree_unlock_all(void) 443be2cdc5eSEmilio G. Cota { 444be2cdc5eSEmilio G. Cota size_t i; 445be2cdc5eSEmilio G. Cota 446be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 447be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 448be2cdc5eSEmilio G. Cota 449be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 450be2cdc5eSEmilio G. Cota } 451be2cdc5eSEmilio G. Cota } 452be2cdc5eSEmilio G. Cota 453be2cdc5eSEmilio G. Cota void tcg_tb_foreach(GTraverseFunc func, gpointer user_data) 454be2cdc5eSEmilio G. Cota { 455be2cdc5eSEmilio G. Cota size_t i; 456be2cdc5eSEmilio G. Cota 457be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 458be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 459be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 460be2cdc5eSEmilio G. Cota 461be2cdc5eSEmilio G. Cota g_tree_foreach(rt->tree, func, user_data); 462be2cdc5eSEmilio G. Cota } 463be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 464be2cdc5eSEmilio G. Cota } 465be2cdc5eSEmilio G. Cota 466be2cdc5eSEmilio G. 
Cota size_t tcg_nb_tbs(void) 467be2cdc5eSEmilio G. Cota { 468be2cdc5eSEmilio G. Cota size_t nb_tbs = 0; 469be2cdc5eSEmilio G. Cota size_t i; 470be2cdc5eSEmilio G. Cota 471be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 472be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 473be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 474be2cdc5eSEmilio G. Cota 475be2cdc5eSEmilio G. Cota nb_tbs += g_tree_nnodes(rt->tree); 476be2cdc5eSEmilio G. Cota } 477be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 478be2cdc5eSEmilio G. Cota return nb_tbs; 479be2cdc5eSEmilio G. Cota } 480be2cdc5eSEmilio G. Cota 481be2cdc5eSEmilio G. Cota static void tcg_region_tree_reset_all(void) 482be2cdc5eSEmilio G. Cota { 483be2cdc5eSEmilio G. Cota size_t i; 484be2cdc5eSEmilio G. Cota 485be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 486be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 487be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 488be2cdc5eSEmilio G. Cota 489be2cdc5eSEmilio G. Cota /* Increment the refcount first so that destroy acts as a reset */ 490be2cdc5eSEmilio G. Cota g_tree_ref(rt->tree); 491be2cdc5eSEmilio G. Cota g_tree_destroy(rt->tree); 492be2cdc5eSEmilio G. Cota } 493be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 494be2cdc5eSEmilio G. Cota } 495be2cdc5eSEmilio G. Cota 496e8feb96fSEmilio G. Cota static void tcg_region_bounds(size_t curr_region, void **pstart, void **pend) 497e8feb96fSEmilio G. Cota { 498e8feb96fSEmilio G. Cota void *start, *end; 499e8feb96fSEmilio G. Cota 500e8feb96fSEmilio G. Cota start = region.start_aligned + curr_region * region.stride; 501e8feb96fSEmilio G. Cota end = start + region.size; 502e8feb96fSEmilio G. Cota 503e8feb96fSEmilio G. Cota if (curr_region == 0) { 504e8feb96fSEmilio G. Cota start = region.start; 505e8feb96fSEmilio G. Cota } 506e8feb96fSEmilio G. Cota if (curr_region == region.n - 1) { 507e8feb96fSEmilio G. 
Cota end = region.end; 508e8feb96fSEmilio G. Cota } 509e8feb96fSEmilio G. Cota 510e8feb96fSEmilio G. Cota *pstart = start; 511e8feb96fSEmilio G. Cota *pend = end; 512e8feb96fSEmilio G. Cota } 513e8feb96fSEmilio G. Cota 514e8feb96fSEmilio G. Cota static void tcg_region_assign(TCGContext *s, size_t curr_region) 515e8feb96fSEmilio G. Cota { 516e8feb96fSEmilio G. Cota void *start, *end; 517e8feb96fSEmilio G. Cota 518e8feb96fSEmilio G. Cota tcg_region_bounds(curr_region, &start, &end); 519e8feb96fSEmilio G. Cota 520e8feb96fSEmilio G. Cota s->code_gen_buffer = start; 521e8feb96fSEmilio G. Cota s->code_gen_ptr = start; 522e8feb96fSEmilio G. Cota s->code_gen_buffer_size = end - start; 523e8feb96fSEmilio G. Cota s->code_gen_highwater = end - TCG_HIGHWATER; 524e8feb96fSEmilio G. Cota } 525e8feb96fSEmilio G. Cota 526e8feb96fSEmilio G. Cota static bool tcg_region_alloc__locked(TCGContext *s) 527e8feb96fSEmilio G. Cota { 528e8feb96fSEmilio G. Cota if (region.current == region.n) { 529e8feb96fSEmilio G. Cota return true; 530e8feb96fSEmilio G. Cota } 531e8feb96fSEmilio G. Cota tcg_region_assign(s, region.current); 532e8feb96fSEmilio G. Cota region.current++; 533e8feb96fSEmilio G. Cota return false; 534e8feb96fSEmilio G. Cota } 535e8feb96fSEmilio G. Cota 536e8feb96fSEmilio G. Cota /* 537e8feb96fSEmilio G. Cota * Request a new region once the one in use has filled up. 538e8feb96fSEmilio G. Cota * Returns true on error. 539e8feb96fSEmilio G. Cota */ 540e8feb96fSEmilio G. Cota static bool tcg_region_alloc(TCGContext *s) 541e8feb96fSEmilio G. Cota { 542e8feb96fSEmilio G. Cota bool err; 543e8feb96fSEmilio G. Cota /* read the region size now; alloc__locked will overwrite it on success */ 544e8feb96fSEmilio G. Cota size_t size_full = s->code_gen_buffer_size; 545e8feb96fSEmilio G. Cota 546e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 547e8feb96fSEmilio G. Cota err = tcg_region_alloc__locked(s); 548e8feb96fSEmilio G. Cota if (!err) { 549e8feb96fSEmilio G. 
Cota region.agg_size_full += size_full - TCG_HIGHWATER; 550e8feb96fSEmilio G. Cota } 551e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 552e8feb96fSEmilio G. Cota return err; 553e8feb96fSEmilio G. Cota } 554e8feb96fSEmilio G. Cota 555e8feb96fSEmilio G. Cota /* 556e8feb96fSEmilio G. Cota * Perform a context's first region allocation. 557e8feb96fSEmilio G. Cota * This function does _not_ increment region.agg_size_full. 558e8feb96fSEmilio G. Cota */ 559e8feb96fSEmilio G. Cota static inline bool tcg_region_initial_alloc__locked(TCGContext *s) 560e8feb96fSEmilio G. Cota { 561e8feb96fSEmilio G. Cota return tcg_region_alloc__locked(s); 562e8feb96fSEmilio G. Cota } 563e8feb96fSEmilio G. Cota 564e8feb96fSEmilio G. Cota /* Call from a safe-work context */ 565e8feb96fSEmilio G. Cota void tcg_region_reset_all(void) 566e8feb96fSEmilio G. Cota { 5673468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 568e8feb96fSEmilio G. Cota unsigned int i; 569e8feb96fSEmilio G. Cota 570e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 571e8feb96fSEmilio G. Cota region.current = 0; 572e8feb96fSEmilio G. Cota region.agg_size_full = 0; 573e8feb96fSEmilio G. Cota 5743468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 5753468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 5763468b59eSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(s); 577e8feb96fSEmilio G. Cota 578e8feb96fSEmilio G. Cota g_assert(!err); 579e8feb96fSEmilio G. Cota } 580e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 581be2cdc5eSEmilio G. Cota 582be2cdc5eSEmilio G. Cota tcg_region_tree_reset_all(); 583e8feb96fSEmilio G. Cota } 584e8feb96fSEmilio G. Cota 5853468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 5863468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5873468b59eSEmilio G. Cota { 5883468b59eSEmilio G. Cota return 1; 5893468b59eSEmilio G. Cota } 5903468b59eSEmilio G. Cota #else 5913468b59eSEmilio G. Cota /* 5923468b59eSEmilio G. 
Cota * It is likely that some vCPUs will translate more code than others, so we 5933468b59eSEmilio G. Cota * first try to set more regions than max_cpus, with those regions being of 5943468b59eSEmilio G. Cota * reasonable size. If that's not possible we make do by evenly dividing 5953468b59eSEmilio G. Cota * the code_gen_buffer among the vCPUs. 5963468b59eSEmilio G. Cota */ 5973468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5983468b59eSEmilio G. Cota { 5993468b59eSEmilio G. Cota size_t i; 6003468b59eSEmilio G. Cota 6013468b59eSEmilio G. Cota /* Use a single region if all we have is one vCPU thread */ 6023468b59eSEmilio G. Cota if (max_cpus == 1 || !qemu_tcg_mttcg_enabled()) { 6033468b59eSEmilio G. Cota return 1; 6043468b59eSEmilio G. Cota } 6053468b59eSEmilio G. Cota 6063468b59eSEmilio G. Cota /* Try to have more regions than max_cpus, with each region being >= 2 MB */ 6073468b59eSEmilio G. Cota for (i = 8; i > 0; i--) { 6083468b59eSEmilio G. Cota size_t regions_per_thread = i; 6093468b59eSEmilio G. Cota size_t region_size; 6103468b59eSEmilio G. Cota 6113468b59eSEmilio G. Cota region_size = tcg_init_ctx.code_gen_buffer_size; 6123468b59eSEmilio G. Cota region_size /= max_cpus * regions_per_thread; 6133468b59eSEmilio G. Cota 6143468b59eSEmilio G. Cota if (region_size >= 2 * 1024u * 1024) { 6153468b59eSEmilio G. Cota return max_cpus * regions_per_thread; 6163468b59eSEmilio G. Cota } 6173468b59eSEmilio G. Cota } 6183468b59eSEmilio G. Cota /* If we can't, then just allocate one region per vCPU thread */ 6193468b59eSEmilio G. Cota return max_cpus; 6203468b59eSEmilio G. Cota } 6213468b59eSEmilio G. Cota #endif 6223468b59eSEmilio G. Cota 623e8feb96fSEmilio G. Cota /* 624e8feb96fSEmilio G. Cota * Initializes region partitioning. 625e8feb96fSEmilio G. Cota * 626e8feb96fSEmilio G. Cota * Called at init time from the parent thread (i.e. the one calling 627e8feb96fSEmilio G. Cota * tcg_context_init), after the target's TCG globals have been set. 6283468b59eSEmilio G. 
Cota * 6293468b59eSEmilio G. Cota * Region partitioning works by splitting code_gen_buffer into separate regions, 6303468b59eSEmilio G. Cota * and then assigning regions to TCG threads so that the threads can translate 6313468b59eSEmilio G. Cota * code in parallel without synchronization. 6323468b59eSEmilio G. Cota * 6333468b59eSEmilio G. Cota * In softmmu the number of TCG threads is bounded by max_cpus, so we use at 6343468b59eSEmilio G. Cota * least max_cpus regions in MTTCG. In !MTTCG we use a single region. 6353468b59eSEmilio G. Cota * Note that the TCG options from the command-line (i.e. -accel accel=tcg,[...]) 6363468b59eSEmilio G. Cota * must have been parsed before calling this function, since it calls 6373468b59eSEmilio G. Cota * qemu_tcg_mttcg_enabled(). 6383468b59eSEmilio G. Cota * 6393468b59eSEmilio G. Cota * In user-mode we use a single region. Having multiple regions in user-mode 6403468b59eSEmilio G. Cota * is not supported, because the number of vCPU threads (recall that each thread 6413468b59eSEmilio G. Cota * spawned by the guest corresponds to a vCPU thread) is only bounded by the 6423468b59eSEmilio G. Cota * OS, and usually this number is huge (tens of thousands is not uncommon). 6433468b59eSEmilio G. Cota * Thus, given this large bound on the number of vCPU threads and the fact 6443468b59eSEmilio G. Cota * that code_gen_buffer is allocated at compile-time, we cannot guarantee 6453468b59eSEmilio G. Cota * that the availability of at least one region per vCPU thread. 6463468b59eSEmilio G. Cota * 6473468b59eSEmilio G. Cota * However, this user-mode limitation is unlikely to be a significant problem 6483468b59eSEmilio G. Cota * in practice. Multi-threaded guests share most if not all of their translated 6493468b59eSEmilio G. Cota * code, which makes parallel code generation less appealing than in softmmu. 650e8feb96fSEmilio G. Cota */ 651e8feb96fSEmilio G. Cota void tcg_region_init(void) 652e8feb96fSEmilio G. Cota { 653e8feb96fSEmilio G. 
Cota void *buf = tcg_init_ctx.code_gen_buffer; 654e8feb96fSEmilio G. Cota void *aligned; 655e8feb96fSEmilio G. Cota size_t size = tcg_init_ctx.code_gen_buffer_size; 656e8feb96fSEmilio G. Cota size_t page_size = qemu_real_host_page_size; 657e8feb96fSEmilio G. Cota size_t region_size; 658e8feb96fSEmilio G. Cota size_t n_regions; 659e8feb96fSEmilio G. Cota size_t i; 660e8feb96fSEmilio G. Cota 6613468b59eSEmilio G. Cota n_regions = tcg_n_regions(); 662e8feb96fSEmilio G. Cota 663e8feb96fSEmilio G. Cota /* The first region will be 'aligned - buf' bytes larger than the others */ 664e8feb96fSEmilio G. Cota aligned = QEMU_ALIGN_PTR_UP(buf, page_size); 665e8feb96fSEmilio G. Cota g_assert(aligned < tcg_init_ctx.code_gen_buffer + size); 666e8feb96fSEmilio G. Cota /* 667e8feb96fSEmilio G. Cota * Make region_size a multiple of page_size, using aligned as the start. 668e8feb96fSEmilio G. Cota * As a result of this we might end up with a few extra pages at the end of 669e8feb96fSEmilio G. Cota * the buffer; we will assign those to the last region. 670e8feb96fSEmilio G. Cota */ 671e8feb96fSEmilio G. Cota region_size = (size - (aligned - buf)) / n_regions; 672e8feb96fSEmilio G. Cota region_size = QEMU_ALIGN_DOWN(region_size, page_size); 673e8feb96fSEmilio G. Cota 674e8feb96fSEmilio G. Cota /* A region must have at least 2 pages; one code, one guard */ 675e8feb96fSEmilio G. Cota g_assert(region_size >= 2 * page_size); 676e8feb96fSEmilio G. Cota 677e8feb96fSEmilio G. Cota /* init the region struct */ 678e8feb96fSEmilio G. Cota qemu_mutex_init(®ion.lock); 679e8feb96fSEmilio G. Cota region.n = n_regions; 680e8feb96fSEmilio G. Cota region.size = region_size - page_size; 681e8feb96fSEmilio G. Cota region.stride = region_size; 682e8feb96fSEmilio G. Cota region.start = buf; 683e8feb96fSEmilio G. Cota region.start_aligned = aligned; 684e8feb96fSEmilio G. Cota /* page-align the end, since its last page will be a guard page */ 685e8feb96fSEmilio G. 
Cota region.end = QEMU_ALIGN_PTR_DOWN(buf + size, page_size); 686e8feb96fSEmilio G. Cota /* account for that last guard page */ 687e8feb96fSEmilio G. Cota region.end -= page_size; 688e8feb96fSEmilio G. Cota 689e8feb96fSEmilio G. Cota /* set guard pages */ 690e8feb96fSEmilio G. Cota for (i = 0; i < region.n; i++) { 691e8feb96fSEmilio G. Cota void *start, *end; 692e8feb96fSEmilio G. Cota int rc; 693e8feb96fSEmilio G. Cota 694e8feb96fSEmilio G. Cota tcg_region_bounds(i, &start, &end); 695e8feb96fSEmilio G. Cota rc = qemu_mprotect_none(end, page_size); 696e8feb96fSEmilio G. Cota g_assert(!rc); 697e8feb96fSEmilio G. Cota } 698e8feb96fSEmilio G. Cota 699be2cdc5eSEmilio G. Cota tcg_region_trees_init(); 700be2cdc5eSEmilio G. Cota 7013468b59eSEmilio G. Cota /* In user-mode we support only one ctx, so do the initial allocation now */ 7023468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 703e8feb96fSEmilio G. Cota { 704e8feb96fSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(tcg_ctx); 705e8feb96fSEmilio G. Cota 706e8feb96fSEmilio G. Cota g_assert(!err); 707e8feb96fSEmilio G. Cota } 7083468b59eSEmilio G. Cota #endif 709e8feb96fSEmilio G. Cota } 710e8feb96fSEmilio G. Cota 711e8feb96fSEmilio G. Cota /* 7123468b59eSEmilio G. Cota * All TCG threads except the parent (i.e. the one that called tcg_context_init 7133468b59eSEmilio G. Cota * and registered the target's TCG globals) must register with this function 7143468b59eSEmilio G. Cota * before initiating translation. 7153468b59eSEmilio G. Cota * 7163468b59eSEmilio G. Cota * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation 7173468b59eSEmilio G. Cota * of tcg_region_init() for the reasoning behind this. 7183468b59eSEmilio G. Cota * 7193468b59eSEmilio G. Cota * In softmmu each caller registers its context in tcg_ctxs[]. Note that in 7203468b59eSEmilio G. Cota * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context 7213468b59eSEmilio G. 
Cota * is not used anymore for translation once this function is called. 7223468b59eSEmilio G. Cota * 7233468b59eSEmilio G. Cota * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates 7243468b59eSEmilio G. Cota * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode. 7253468b59eSEmilio G. Cota */ 7263468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 7273468b59eSEmilio G. Cota void tcg_register_thread(void) 7283468b59eSEmilio G. Cota { 7293468b59eSEmilio G. Cota tcg_ctx = &tcg_init_ctx; 7303468b59eSEmilio G. Cota } 7313468b59eSEmilio G. Cota #else 7323468b59eSEmilio G. Cota void tcg_register_thread(void) 7333468b59eSEmilio G. Cota { 7343468b59eSEmilio G. Cota TCGContext *s = g_malloc(sizeof(*s)); 7353468b59eSEmilio G. Cota unsigned int i, n; 7363468b59eSEmilio G. Cota bool err; 7373468b59eSEmilio G. Cota 7383468b59eSEmilio G. Cota *s = tcg_init_ctx; 7393468b59eSEmilio G. Cota 7403468b59eSEmilio G. Cota /* Relink mem_base. */ 7413468b59eSEmilio G. Cota for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) { 7423468b59eSEmilio G. Cota if (tcg_init_ctx.temps[i].mem_base) { 7433468b59eSEmilio G. Cota ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps; 7443468b59eSEmilio G. Cota tcg_debug_assert(b >= 0 && b < n); 7453468b59eSEmilio G. Cota s->temps[i].mem_base = &s->temps[b]; 7463468b59eSEmilio G. Cota } 7473468b59eSEmilio G. Cota } 7483468b59eSEmilio G. Cota 7493468b59eSEmilio G. Cota /* Claim an entry in tcg_ctxs */ 7503468b59eSEmilio G. Cota n = atomic_fetch_inc(&n_tcg_ctxs); 7513468b59eSEmilio G. Cota g_assert(n < max_cpus); 7523468b59eSEmilio G. Cota atomic_set(&tcg_ctxs[n], s); 7533468b59eSEmilio G. Cota 7543468b59eSEmilio G. Cota tcg_ctx = s; 7553468b59eSEmilio G. Cota qemu_mutex_lock(®ion.lock); 7563468b59eSEmilio G. Cota err = tcg_region_initial_alloc__locked(tcg_ctx); 7573468b59eSEmilio G. Cota g_assert(!err); 7583468b59eSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 7593468b59eSEmilio G. 
Cota } 7603468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */ 7613468b59eSEmilio G. Cota 7623468b59eSEmilio G. Cota /* 763e8feb96fSEmilio G. Cota * Returns the size (in bytes) of all translated code (i.e. from all regions) 764e8feb96fSEmilio G. Cota * currently in the cache. 765e8feb96fSEmilio G. Cota * See also: tcg_code_capacity() 766e8feb96fSEmilio G. Cota * Do not confuse with tcg_current_code_size(); that one applies to a single 767e8feb96fSEmilio G. Cota * TCG context. 768e8feb96fSEmilio G. Cota */ 769e8feb96fSEmilio G. Cota size_t tcg_code_size(void) 770e8feb96fSEmilio G. Cota { 7713468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 772e8feb96fSEmilio G. Cota unsigned int i; 773e8feb96fSEmilio G. Cota size_t total; 774e8feb96fSEmilio G. Cota 775e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 776e8feb96fSEmilio G. Cota total = region.agg_size_full; 7773468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 7783468b59eSEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 779e8feb96fSEmilio G. Cota size_t size; 780e8feb96fSEmilio G. Cota 781e8feb96fSEmilio G. Cota size = atomic_read(&s->code_gen_ptr) - s->code_gen_buffer; 782e8feb96fSEmilio G. Cota g_assert(size <= s->code_gen_buffer_size); 783e8feb96fSEmilio G. Cota total += size; 784e8feb96fSEmilio G. Cota } 785e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 786e8feb96fSEmilio G. Cota return total; 787e8feb96fSEmilio G. Cota } 788e8feb96fSEmilio G. Cota 789e8feb96fSEmilio G. Cota /* 790e8feb96fSEmilio G. Cota * Returns the code capacity (in bytes) of the entire cache, i.e. including all 791e8feb96fSEmilio G. Cota * regions. 792e8feb96fSEmilio G. Cota * See also: tcg_code_size() 793e8feb96fSEmilio G. Cota */ 794e8feb96fSEmilio G. Cota size_t tcg_code_capacity(void) 795e8feb96fSEmilio G. Cota { 796e8feb96fSEmilio G. Cota size_t guard_size, capacity; 797e8feb96fSEmilio G. Cota 798e8feb96fSEmilio G. 
Cota /* no need for synchronization; these variables are set at init time */ 799e8feb96fSEmilio G. Cota guard_size = region.stride - region.size; 800e8feb96fSEmilio G. Cota capacity = region.end + guard_size - region.start; 801e8feb96fSEmilio G. Cota capacity -= region.n * (guard_size + TCG_HIGHWATER); 802e8feb96fSEmilio G. Cota return capacity; 803e8feb96fSEmilio G. Cota } 804e8feb96fSEmilio G. Cota 805128ed227SEmilio G. Cota size_t tcg_tb_phys_invalidate_count(void) 806128ed227SEmilio G. Cota { 807128ed227SEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 808128ed227SEmilio G. Cota unsigned int i; 809128ed227SEmilio G. Cota size_t total = 0; 810128ed227SEmilio G. Cota 811128ed227SEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 812128ed227SEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 813128ed227SEmilio G. Cota 814128ed227SEmilio G. Cota total += atomic_read(&s->tb_phys_invalidate_count); 815128ed227SEmilio G. Cota } 816128ed227SEmilio G. Cota return total; 817128ed227SEmilio G. Cota } 818128ed227SEmilio G. 
/* pool based memory allocation */

/*
 * Slow path of the per-context pool allocator: returns a pointer to the
 * start of a chunk that can hold @size bytes.
 *
 * Requests larger than TCG_POOL_CHUNK_SIZE get a dedicated g_malloc'ed pool
 * that is pushed onto s->pool_first_large (released by tcg_pool_reset()).
 * Smaller requests move on to the next chunk of the s->pool_first list,
 * appending a new TCG_POOL_CHUNK_SIZE chunk when the list is exhausted, and
 * leave s->pool_cur / s->pool_end describing what remains of that chunk.
 */
void *tcg_malloc_internal(TCGContext *s, int size)
{
    TCGPool *p;
    int pool_size;

    if (size > TCG_POOL_CHUNK_SIZE) {
        /* big malloc: insert a new pool (XXX: could optimize) */
        p = g_malloc(sizeof(TCGPool) + size);
        p->size = size;
        p->next = s->pool_first_large;
        s->pool_first_large = p;
        return p->data;
    } else {
        p = s->pool_current;
        if (!p) {
            /* first allocation since reset: reuse the head chunk if any */
            p = s->pool_first;
            if (!p)
                goto new_pool;
        } else {
            if (!p->next) {
            new_pool:
                /* no chunk left to reuse: append a fresh one to the list */
                pool_size = TCG_POOL_CHUNK_SIZE;
                p = g_malloc(sizeof(TCGPool) + pool_size);
                p->size = pool_size;
                p->next = NULL;
                if (s->pool_current)
                    s->pool_current->next = p;
                else
                    s->pool_first = p;
            } else {
                p = p->next;
            }
        }
    }
    /* the request is served from the very start of the selected chunk */
    s->pool_current = p;
    s->pool_cur = p->data + size;
    s->pool_end = p->data + p->size;
    return p->data;
}

/*
 * Release every oversized pool and rewind the allocator. The regular chunks
 * stay linked on s->pool_first; tcg_malloc_internal() starts reusing them
 * from the head because s->pool_current is cleared here.
 */
void tcg_pool_reset(TCGContext *s)
{
    TCGPool *p, *t;
    for (p = s->pool_first_large; p; p = t) {
        t = p->next;
        g_free(p);
    }
    s->pool_first_large = NULL;
    s->pool_cur = s->pool_end = NULL;
    s->pool_current = NULL;
}

/*
 * One entry per helper listed in exec/helper-tcg.h. Entries are looked up
 * by their func pointer through helper_table.
 * NOTE(review): the meaning of flags and sizemask is defined by the helper
 * generator headers, not visible here.
 */
typedef struct TCGHelperInfo {
    void *func;
    const char *name;
    unsigned flags;
    unsigned sizemask;
} TCGHelperInfo;

#include "exec/helper-proto.h"

static const TCGHelperInfo all_helpers[] = {
#include "exec/helper-tcg.h"
};
/* Maps a helper's func pointer to its TCGHelperInfo; filled at init time. */
static GHashTable *helper_table;

/* Register allocation order built by tcg_context_init(). */
static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)];
static void process_op_defs(TCGContext *s);
static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type,
                                            TCGReg reg, const char *name);

/*
 * One-time initialization of the initial TCG context @s.
 *
 * Zeroes @s, hands every opcode definition its slice of the shared
 * args_ct / sorted_args arrays, registers all helpers in helper_table,
 * runs the backend's tcg_target_init() and process_op_defs(), computes
 * indirect_reg_alloc_order, publishes @s as tcg_ctx, sets up tcg_ctxs and
 * finally creates the "env" global bound to TCG_AREG0.
 */
void tcg_context_init(TCGContext *s)
{
    int op, total_args, n, i;
    TCGOpDef *def;
    TCGArgConstraint *args_ct;
    int *sorted_args;
    TCGTemp *ts;

    memset(s, 0, sizeof(*s));
    s->nb_globals = 0;

    /* Count total number of arguments and allocate the corresponding
       space */
    total_args = 0;
    for(op = 0; op < NB_OPS; op++) {
        def = &tcg_op_defs[op];
        n = def->nb_iargs + def->nb_oargs;
        total_args += n;
    }

    args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args);
    sorted_args = g_malloc(sizeof(int) * total_args);

    /* Carve the two arrays up: each opcode gets nb_iargs + nb_oargs slots. */
    for(op = 0; op < NB_OPS; op++) {
        def = &tcg_op_defs[op];
        def->args_ct = args_ct;
        def->sorted_args = sorted_args;
        n = def->nb_iargs + def->nb_oargs;
        sorted_args += n;
        args_ct += n;
    }

    /* Register helpers.  */
    /* Use g_direct_hash/equal for direct pointer comparisons on func.  */
    helper_table = g_hash_table_new(NULL, NULL);

    for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) {
        g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func,
                            (gpointer)&all_helpers[i]);
    }

    tcg_target_init(s);
    process_op_defs(s);

    /* Reverse the order of the saved registers, assuming they're all at
       the start of tcg_target_reg_alloc_order.  */
    /* n becomes the index of the first call-clobbered register. */
    for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) {
        int r = tcg_target_reg_alloc_order[n];
        if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) {
            break;
        }
    }
    /* entries [0, n) are copied in reverse order ... */
    for (i = 0; i < n; ++i) {
        indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i];
    }
    /* ... and the remaining entries are copied unchanged. */
    for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) {
        indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i];
    }

    tcg_ctx = s;
    /*
     * In user-mode we simply share the init context among threads, since we
     * use a single region. See the documentation of tcg_region_init() for the
     * reasoning behind this.
     * In softmmu we will have at most max_cpus TCG threads.
     */
#ifdef CONFIG_USER_ONLY
    tcg_ctxs = &tcg_ctx;
    n_tcg_ctxs = 1;
#else
    tcg_ctxs = g_new(TCGContext *, max_cpus);
#endif

    /* TCG_AREG0 must not already be reserved; it is bound to "env" below. */
    tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0));
    ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env");
    cpu_env = temp_tcgv_ptr(ts);
}

/*
 * Allocate TBs right before their corresponding translated code, making
 * sure that TBs and code are on different cache lines.
 *
 * Returns NULL when the TB does not fit below s->code_gen_highwater and
 * tcg_region_alloc() reports failure (non-zero).
 */
TranslationBlock *tcg_tb_alloc(TCGContext *s)
{
    uintptr_t align = qemu_icache_linesize;
    TranslationBlock *tb;
    void *next;

 retry:
    /* tb: code_gen_ptr rounded up to an icache line */
    tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align);
    /* next: first icache-line-aligned address past the TB struct */
    next = (void *)ROUND_UP((uintptr_t)(tb + 1), align);

    if (unlikely(next > s->code_gen_highwater)) {
        /* presumably moves s to a fresh region on success; then try again */
        if (tcg_region_alloc(s)) {
            return NULL;
        }
        goto retry;
    }
    atomic_set(&s->code_gen_ptr, next);
    s->data_gen_ptr = NULL;
    return tb;
}

/*
 * Emit the host prologue at the start of s->code_gen_buffer, flush the
 * icache over it, then shrink the buffer (code_gen_buffer, code_gen_ptr,
 * code_buf, code_gen_buffer_size) so that it begins right after the
 * prologue. The reduced buffer is registered with tcg_register_jit().
 */
void tcg_prologue_init(TCGContext *s)
{
    size_t prologue_size, total_size;
    void *buf0, *buf1;

    /* Put the prologue at the beginning of code_gen_buffer.  */
    buf0 = s->code_gen_buffer;
    total_size = s->code_gen_buffer_size;
    s->code_ptr = buf0;
    s->code_buf = buf0;
    s->data_gen_ptr = NULL;
    s->code_gen_prologue = buf0;

    /* Compute a high-water mark, at which we voluntarily flush the buffer
       and start over.  The size here is arbitrary, significantly larger
       than we expect the code generation for any one opcode to require.  */
    s->code_gen_highwater = s->code_gen_buffer + (total_size - TCG_HIGHWATER);

#ifdef TCG_TARGET_NEED_POOL_LABELS
    s->pool_labels = NULL;
#endif

    /* Generate the prologue.  */
    tcg_target_qemu_prologue(s);

#ifdef TCG_TARGET_NEED_POOL_LABELS
    /* Allow the prologue to put e.g. guest_base into a pool entry.  */
    {
        bool ok = tcg_out_pool_finalize(s);
        tcg_debug_assert(ok);
    }
#endif

    /* buf1: one past the last byte emitted for the prologue */
    buf1 = s->code_ptr;
    flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1);

    /* Deduct the prologue from the buffer.  */
    prologue_size = tcg_current_code_size(s);
    s->code_gen_ptr = buf1;
    s->code_gen_buffer = buf1;
    s->code_buf = buf1;
    total_size -= prologue_size;
    s->code_gen_buffer_size = total_size;

    tcg_register_jit(s->code_gen_buffer, total_size);

#ifdef DEBUG_DISAS
    if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) {
        qemu_log_lock();
        qemu_log("PROLOGUE: [size=%zu]\n", prologue_size);
        if (s->data_gen_ptr) {
            /* data_gen_ptr set: disassemble up to it, dump the rest as words */
            size_t code_size = s->data_gen_ptr - buf0;
            size_t data_size = prologue_size - code_size;
            size_t i;

            log_disas(buf0, code_size);

            for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) {
                if (sizeof(tcg_target_ulong) == 8) {
                    qemu_log("0x%08" PRIxPTR ": .quad 0x%016" PRIx64 "\n",
                             (uintptr_t)s->data_gen_ptr + i,
                             *(uint64_t *)(s->data_gen_ptr + i));
                } else {
                    qemu_log("0x%08" PRIxPTR ": .long 0x%08x\n",
                             (uintptr_t)s->data_gen_ptr + i,
                             *(uint32_t *)(s->data_gen_ptr + i));
                }
            }
        } else {
            log_disas(buf0, prologue_size);
        }
        qemu_log("\n");
        qemu_log_flush();
        qemu_log_unlock();
    }
#endif

    /* Assert that goto_ptr is implemented completely.  */
    if (TCG_TARGET_HAS_goto_ptr) {
        tcg_debug_assert(s->code_gen_epilogue != NULL);
    }
}

/*
 * Reset the per-translation state of @s: pool allocator, temps (only the
 * globals are kept), free-temp bitmaps, op and label counters, frame offset
 * and the two op lists.
 */
void tcg_func_start(TCGContext *s)
{
    tcg_pool_reset(s);
    s->nb_temps = s->nb_globals;

    /* No temps have been previously allocated for size or locality.  */
    memset(s->free_temps, 0, sizeof(s->free_temps));

    s->nb_ops = 0;
    s->nb_labels = 0;
    s->current_frame_offset = s->frame_start;

#ifdef CONFIG_DEBUG_TCG
    s->goto_tb_issue_mask = 0;
#endif

    QTAILQ_INIT(&s->ops);
    QTAILQ_INIT(&s->free_ops);
}

/*
 * Take the next slot of s->temps, zero it and return it. Debug builds
 * assert that the slot index is below TCG_MAX_TEMPS.
 */
static inline TCGTemp *tcg_temp_alloc(TCGContext *s)
{
    int n = s->nb_temps++;
    tcg_debug_assert(n < TCG_MAX_TEMPS);
    return memset(&s->temps[n], 0, sizeof(TCGTemp));
}

/*
 * Allocate a temp slot and mark it global. Asserts that no non-global temp
 * exists yet (nb_globals == nb_temps), so globals occupy the first slots.
 */
static inline TCGTemp *tcg_global_alloc(TCGContext *s)
{
    TCGTemp *ts;

    tcg_debug_assert(s->nb_globals == s->nb_temps);
    s->nb_globals++;
    ts = tcg_temp_alloc(s);
    ts->temp_global = 1;

    return ts;
}

/*
 * Create a global temp fixed to host register @reg and add @reg to
 * s->reserved_regs. @name is stored by pointer, not copied. Aborts on a
 * 32-bit host when @type is not TCG_TYPE_I32.
 */
static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type,
                                            TCGReg reg, const char *name)
{
    TCGTemp *ts;

    if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) {
        tcg_abort();
    }

    ts = tcg_global_alloc(s);
    ts->base_type = type;
    ts->type = type;
    ts->fixed_reg = 1;
    ts->reg = reg;
    ts->name = name;
    tcg_regset_set_reg(s->reserved_regs, reg);

    return ts;
}

/*
 * Record the frame range [start, start + size) in @s and create the
 * "_frame" pointer global fixed to @reg.
 */
void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size)
{
    s->frame_start = start;
    s->frame_end = start + size;
    s->frame_temp
        = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame");
}

/*
 * Create a global temp backed by memory at @base + @offset in the current
 * context (tcg_ctx).
 *
 * If @base is not a fixed register, it is flagged as an indirect base and
 * the new global as an indirect register. On a 32-bit host a TCG_TYPE_I64
 * global is split into two consecutive I32 temps named "<name>_0" and
 * "<name>_1"; the "_0" half sits at @offset + 4 on big-endian hosts and at
 * @offset otherwise. Only the first temp is returned.
 *
 * NOTE(review): the split names come from strdup(), whose result is neither
 * checked nor freed in this function.
 */
TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base,
                                     intptr_t offset, const char *name)
{
    TCGContext *s = tcg_ctx;
    TCGTemp *base_ts = tcgv_ptr_temp(base);
    TCGTemp *ts = tcg_global_alloc(s);
    int indirect_reg = 0, bigendian = 0;
#ifdef HOST_WORDS_BIGENDIAN
    bigendian = 1;
#endif

    if (!base_ts->fixed_reg) {
        /* We do not support double-indirect registers.  */
        tcg_debug_assert(!base_ts->indirect_reg);
        base_ts->indirect_base = 1;
        /* a split 64-bit global counts as two indirect temps */
        s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64
                            ? 2 : 1);
        indirect_reg = 1;
    }

    if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) {
        TCGTemp *ts2 = tcg_global_alloc(s);
        char buf[64];

        ts->base_type = TCG_TYPE_I64;
        ts->type = TCG_TYPE_I32;
        ts->indirect_reg = indirect_reg;
        ts->mem_allocated = 1;
        ts->mem_base = base_ts;
        ts->mem_offset = offset + bigendian * 4;
        pstrcpy(buf, sizeof(buf), name);
        pstrcat(buf, sizeof(buf), "_0");
        ts->name = strdup(buf);

        /* the two halves must occupy adjacent temp slots */
        tcg_debug_assert(ts2 == ts + 1);
        ts2->base_type = TCG_TYPE_I64;
        ts2->type = TCG_TYPE_I32;
        ts2->indirect_reg = indirect_reg;
        ts2->mem_allocated = 1;
        ts2->mem_base = base_ts;
        ts2->mem_offset = offset + (1 - bigendian) * 4;
        pstrcpy(buf, sizeof(buf), name);
        pstrcat(buf, sizeof(buf), "_1");
        ts2->name = strdup(buf);
    } else {
        ts->base_type = type;
        ts->type = type;
        ts->indirect_reg = indirect_reg;
        ts->mem_allocated = 1;
        ts->mem_base = base_ts;
        ts->mem_offset = offset;
        ts->name = name;
    }
    return ts;
}

/*
 * Return a temp of @type in the current context, local if @temp_local.
 *
 * A previously freed temp of the same type and locality is reused when the
 * matching free_temps bitmap has a bit set; otherwise a new slot is
 * allocated (two adjacent I32 slots for TCG_TYPE_I64 on a 32-bit host).
 */
TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local)
{
    TCGContext *s = tcg_ctx;
    TCGTemp *ts;
    int idx, k;

    /* bitmap index: local temps use the second TCG_TYPE_COUNT entries */
    k = type + (temp_local ? TCG_TYPE_COUNT : 0);
    idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS);
    if (idx < TCG_MAX_TEMPS) {
        /* There is already an available temp with the right type.  */
        clear_bit(idx, s->free_temps[k].l);

        ts = &s->temps[idx];
        ts->temp_allocated = 1;
        tcg_debug_assert(ts->base_type == type);
        tcg_debug_assert(ts->temp_local == temp_local);
    } else {
        ts = tcg_temp_alloc(s);
        if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) {
            TCGTemp *ts2 = tcg_temp_alloc(s);

            ts->base_type = type;
            ts->type = TCG_TYPE_I32;
            ts->temp_allocated = 1;
            ts->temp_local = temp_local;

            tcg_debug_assert(ts2 == ts + 1);
            ts2->base_type = TCG_TYPE_I64;
            ts2->type = TCG_TYPE_I32;
            ts2->temp_allocated = 1;
            ts2->temp_local = temp_local;
        } else {
            ts->base_type = type;
            ts->type = type;
            ts->temp_allocated = 1;
            ts->temp_local = temp_local;
        }
    }

#if defined(CONFIG_DEBUG_TCG)
    s->temps_in_use++;
#endif
    return ts;
}

/*
 * Return a new non-local vector temp of @type. With CONFIG_DEBUG_TCG the
 * type must be V64, V128 or V256 and the matching TCG_TARGET_HAS_v* must
 * be set.
 */
TCGv_vec tcg_temp_new_vec(TCGType type)
{
    TCGTemp *t;

#ifdef CONFIG_DEBUG_TCG
    switch (type) {
    case TCG_TYPE_V64:
        assert(TCG_TARGET_HAS_v64);
        break;
    case TCG_TYPE_V128:
        assert(TCG_TARGET_HAS_v128);
        break;
    case TCG_TYPE_V256:
        assert(TCG_TARGET_HAS_v256);
        break;
    default:
        g_assert_not_reached();
    }
#endif

    t = tcg_temp_new_internal(type, 0);
    return temp_tcgv_vec(t);
}

/* Create a new temp of the same type as an existing temp.  */
TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match)
{
    TCGTemp *t = tcgv_vec_temp(match);

    tcg_debug_assert(t->temp_allocated != 0);

    t = tcg_temp_new_internal(t->base_type, 0);
    return temp_tcgv_vec(t);
}

/*
 * Release the non-global temp @ts: clear temp_allocated and set its bit in
 * the free_temps bitmap for its base type and locality, so that
 * tcg_temp_new_internal() can hand it out again.
 */
void tcg_temp_free_internal(TCGTemp *ts)
{
    TCGContext *s = tcg_ctx;
    int k, idx;

#if defined(CONFIG_DEBUG_TCG)
    s->temps_in_use--;
    if (s->temps_in_use < 0) {
        fprintf(stderr, "More temporaries freed than allocated!\n");
    }
#endif

    tcg_debug_assert(ts->temp_global == 0);
    tcg_debug_assert(ts->temp_allocated != 0);
    ts->temp_allocated = 0;

    idx = temp_idx(ts);
    k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0);
    set_bit(idx, s->free_temps[k].l);
}

/* Return a new i32 temp with a movi of @val emitted into it. */
TCGv_i32 tcg_const_i32(int32_t val)
{
    TCGv_i32 t0;
    t0 = tcg_temp_new_i32();
    tcg_gen_movi_i32(t0, val);
    return t0;
}

/* Return a new i64 temp with a movi of @val emitted into it. */
TCGv_i64 tcg_const_i64(int64_t val)
{
    TCGv_i64 t0;
    t0 = tcg_temp_new_i64();
    tcg_gen_movi_i64(t0, val);
    return t0;
}

/* Same as tcg_const_i32(), but the temp is a local temp. */
TCGv_i32 tcg_const_local_i32(int32_t val)
{
    TCGv_i32 t0;
    t0 = tcg_temp_local_new_i32();
    tcg_gen_movi_i32(t0, val);
    return t0;
}

/* Same as tcg_const_i64(), but the temp is a local temp. */
TCGv_i64 tcg_const_local_i64(int64_t val)
{
    TCGv_i64 t0;
    t0 = tcg_temp_local_new_i64();
    tcg_gen_movi_i64(t0, val);
    return t0;
}

#if defined(CONFIG_DEBUG_TCG)
/* Reset the current context's count of temps in use to zero. */
void tcg_clear_temp_count(void)
{
    TCGContext *s = tcg_ctx;
    s->temps_in_use = 0;
}

/*
 * Return 1 if the current context's temps_in_use count is non-zero (and
 * reset it), 0 otherwise.
 */
int tcg_check_temp_count(void)
{
    TCGContext *s = tcg_ctx;
    if (s->temps_in_use) {
        /* Clear the count so that we don't give another
         * warning immediately next time around.
         */
        s->temps_in_use = 0;
        return 1;
    }
    return 0;
}
#endif

/* Return true if OP may appear in the opcode stream.
   Test the runtime variable that controls each opcode.
*/ 1356be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 1357be0f34b5SRichard Henderson { 1358d2fd745fSRichard Henderson const bool have_vec 1359d2fd745fSRichard Henderson = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256; 1360d2fd745fSRichard Henderson 1361be0f34b5SRichard Henderson switch (op) { 1362be0f34b5SRichard Henderson case INDEX_op_discard: 1363be0f34b5SRichard Henderson case INDEX_op_set_label: 1364be0f34b5SRichard Henderson case INDEX_op_call: 1365be0f34b5SRichard Henderson case INDEX_op_br: 1366be0f34b5SRichard Henderson case INDEX_op_mb: 1367be0f34b5SRichard Henderson case INDEX_op_insn_start: 1368be0f34b5SRichard Henderson case INDEX_op_exit_tb: 1369be0f34b5SRichard Henderson case INDEX_op_goto_tb: 1370be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 1371be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 1372be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 1373be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 1374be0f34b5SRichard Henderson return true; 1375be0f34b5SRichard Henderson 1376be0f34b5SRichard Henderson case INDEX_op_goto_ptr: 1377be0f34b5SRichard Henderson return TCG_TARGET_HAS_goto_ptr; 1378be0f34b5SRichard Henderson 1379be0f34b5SRichard Henderson case INDEX_op_mov_i32: 1380be0f34b5SRichard Henderson case INDEX_op_movi_i32: 1381be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 1382be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 1383be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 1384be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 1385be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 1386be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 1387be0f34b5SRichard Henderson case INDEX_op_ld_i32: 1388be0f34b5SRichard Henderson case INDEX_op_st8_i32: 1389be0f34b5SRichard Henderson case INDEX_op_st16_i32: 1390be0f34b5SRichard Henderson case INDEX_op_st_i32: 1391be0f34b5SRichard Henderson case INDEX_op_add_i32: 1392be0f34b5SRichard Henderson case INDEX_op_sub_i32: 1393be0f34b5SRichard 
Henderson case INDEX_op_mul_i32: 1394be0f34b5SRichard Henderson case INDEX_op_and_i32: 1395be0f34b5SRichard Henderson case INDEX_op_or_i32: 1396be0f34b5SRichard Henderson case INDEX_op_xor_i32: 1397be0f34b5SRichard Henderson case INDEX_op_shl_i32: 1398be0f34b5SRichard Henderson case INDEX_op_shr_i32: 1399be0f34b5SRichard Henderson case INDEX_op_sar_i32: 1400be0f34b5SRichard Henderson return true; 1401be0f34b5SRichard Henderson 1402be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 1403be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 1404be0f34b5SRichard Henderson case INDEX_op_div_i32: 1405be0f34b5SRichard Henderson case INDEX_op_divu_i32: 1406be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 1407be0f34b5SRichard Henderson case INDEX_op_rem_i32: 1408be0f34b5SRichard Henderson case INDEX_op_remu_i32: 1409be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 1410be0f34b5SRichard Henderson case INDEX_op_div2_i32: 1411be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 1412be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 1413be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 1414be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 1415be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 1416be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 1417be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 1418be0f34b5SRichard Henderson case INDEX_op_extract_i32: 1419be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 1420be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 1421be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 1422be0f34b5SRichard Henderson case INDEX_op_add2_i32: 1423be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 1424be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 1425be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 1426be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 1427be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 1428be0f34b5SRichard 
Henderson case INDEX_op_muls2_i32: 1429be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 1430be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 1431be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 1432be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 1433be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 1434be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 1435be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 1436be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 1437be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 1438be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 1439be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 1440be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 1441be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 1442be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 1443be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 1444be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 1445be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 1446be0f34b5SRichard Henderson case INDEX_op_not_i32: 1447be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 1448be0f34b5SRichard Henderson case INDEX_op_neg_i32: 1449be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 1450be0f34b5SRichard Henderson case INDEX_op_andc_i32: 1451be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 1452be0f34b5SRichard Henderson case INDEX_op_orc_i32: 1453be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 1454be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 1455be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 1456be0f34b5SRichard Henderson case INDEX_op_nand_i32: 1457be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 1458be0f34b5SRichard Henderson case INDEX_op_nor_i32: 1459be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 1460be0f34b5SRichard Henderson case INDEX_op_clz_i32: 1461be0f34b5SRichard Henderson return 
TCG_TARGET_HAS_clz_i32; 1462be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 1463be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 1464be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 1465be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 1466be0f34b5SRichard Henderson 1467be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 1468be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 1469be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 1470be0f34b5SRichard Henderson 1471be0f34b5SRichard Henderson case INDEX_op_mov_i64: 1472be0f34b5SRichard Henderson case INDEX_op_movi_i64: 1473be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 1474be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 1475be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 1476be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 1477be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 1478be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 1479be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 1480be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 1481be0f34b5SRichard Henderson case INDEX_op_ld_i64: 1482be0f34b5SRichard Henderson case INDEX_op_st8_i64: 1483be0f34b5SRichard Henderson case INDEX_op_st16_i64: 1484be0f34b5SRichard Henderson case INDEX_op_st32_i64: 1485be0f34b5SRichard Henderson case INDEX_op_st_i64: 1486be0f34b5SRichard Henderson case INDEX_op_add_i64: 1487be0f34b5SRichard Henderson case INDEX_op_sub_i64: 1488be0f34b5SRichard Henderson case INDEX_op_mul_i64: 1489be0f34b5SRichard Henderson case INDEX_op_and_i64: 1490be0f34b5SRichard Henderson case INDEX_op_or_i64: 1491be0f34b5SRichard Henderson case INDEX_op_xor_i64: 1492be0f34b5SRichard Henderson case INDEX_op_shl_i64: 1493be0f34b5SRichard Henderson case INDEX_op_shr_i64: 1494be0f34b5SRichard Henderson case INDEX_op_sar_i64: 1495be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 1496be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 1497be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 
1498be0f34b5SRichard Henderson 1499be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 1500be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 1501be0f34b5SRichard Henderson case INDEX_op_div_i64: 1502be0f34b5SRichard Henderson case INDEX_op_divu_i64: 1503be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 1504be0f34b5SRichard Henderson case INDEX_op_rem_i64: 1505be0f34b5SRichard Henderson case INDEX_op_remu_i64: 1506be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 1507be0f34b5SRichard Henderson case INDEX_op_div2_i64: 1508be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 1509be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 1510be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 1511be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 1512be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 1513be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 1514be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 1515be0f34b5SRichard Henderson case INDEX_op_extract_i64: 1516be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 1517be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 1518be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 1519be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 1520be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 1521be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 1522be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 1523be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 1524be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 1525be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 1526be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i64; 1527be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 1528be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 1529be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 1530be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 1531be0f34b5SRichard Henderson case 
INDEX_op_ext16u_i64: 1532be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 1533be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 1534be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 1535be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 1536be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 1537be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 1538be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 1539be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 1540be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 1541be0f34b5SRichard Henderson case INDEX_op_not_i64: 1542be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 1543be0f34b5SRichard Henderson case INDEX_op_neg_i64: 1544be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 1545be0f34b5SRichard Henderson case INDEX_op_andc_i64: 1546be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 1547be0f34b5SRichard Henderson case INDEX_op_orc_i64: 1548be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 1549be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 1550be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 1551be0f34b5SRichard Henderson case INDEX_op_nand_i64: 1552be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 1553be0f34b5SRichard Henderson case INDEX_op_nor_i64: 1554be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 1555be0f34b5SRichard Henderson case INDEX_op_clz_i64: 1556be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 1557be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 1558be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 1559be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 1560be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 1561be0f34b5SRichard Henderson case INDEX_op_add2_i64: 1562be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 1563be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 1564be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 
1565be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 1566be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 1567be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 1568be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 1569be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 1570be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 1571be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 1572be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 1573be0f34b5SRichard Henderson 1574d2fd745fSRichard Henderson case INDEX_op_mov_vec: 1575d2fd745fSRichard Henderson case INDEX_op_dup_vec: 1576d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 1577d2fd745fSRichard Henderson case INDEX_op_ld_vec: 1578d2fd745fSRichard Henderson case INDEX_op_st_vec: 1579d2fd745fSRichard Henderson case INDEX_op_add_vec: 1580d2fd745fSRichard Henderson case INDEX_op_sub_vec: 1581d2fd745fSRichard Henderson case INDEX_op_and_vec: 1582d2fd745fSRichard Henderson case INDEX_op_or_vec: 1583d2fd745fSRichard Henderson case INDEX_op_xor_vec: 1584212be173SRichard Henderson case INDEX_op_cmp_vec: 1585d2fd745fSRichard Henderson return have_vec; 1586d2fd745fSRichard Henderson case INDEX_op_dup2_vec: 1587d2fd745fSRichard Henderson return have_vec && TCG_TARGET_REG_BITS == 32; 1588d2fd745fSRichard Henderson case INDEX_op_not_vec: 1589d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_not_vec; 1590d2fd745fSRichard Henderson case INDEX_op_neg_vec: 1591d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_neg_vec; 1592d2fd745fSRichard Henderson case INDEX_op_andc_vec: 1593d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_andc_vec; 1594d2fd745fSRichard Henderson case INDEX_op_orc_vec: 1595d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_orc_vec; 15963774030aSRichard Henderson case INDEX_op_mul_vec: 15973774030aSRichard Henderson return have_vec && TCG_TARGET_HAS_mul_vec; 1598d0ec9796SRichard Henderson case INDEX_op_shli_vec: 
1599d0ec9796SRichard Henderson case INDEX_op_shri_vec: 1600d0ec9796SRichard Henderson case INDEX_op_sari_vec: 1601d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shi_vec; 1602d0ec9796SRichard Henderson case INDEX_op_shls_vec: 1603d0ec9796SRichard Henderson case INDEX_op_shrs_vec: 1604d0ec9796SRichard Henderson case INDEX_op_sars_vec: 1605d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shs_vec; 1606d0ec9796SRichard Henderson case INDEX_op_shlv_vec: 1607d0ec9796SRichard Henderson case INDEX_op_shrv_vec: 1608d0ec9796SRichard Henderson case INDEX_op_sarv_vec: 1609d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shv_vec; 1610d2fd745fSRichard Henderson 1611db432672SRichard Henderson default: 1612db432672SRichard Henderson tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS); 1613db432672SRichard Henderson return true; 1614be0f34b5SRichard Henderson } 1615be0f34b5SRichard Henderson } 1616be0f34b5SRichard Henderson 161739cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 161839cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 161939cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 1620ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args) 1621c896fe29Sbellard { 162275e8b9b7SRichard Henderson int i, real_args, nb_rets, pi; 1623bbb8a1b4SRichard Henderson unsigned sizemask, flags; 1624afb49896SRichard Henderson TCGHelperInfo *info; 162575e8b9b7SRichard Henderson TCGOp *op; 1626afb49896SRichard Henderson 1627619205fdSEmilio G. 
Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 1628bbb8a1b4SRichard Henderson flags = info->flags; 1629bbb8a1b4SRichard Henderson sizemask = info->sizemask; 16302bece2c8SRichard Henderson 163134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 163234b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 163334b1a49cSRichard Henderson /* We have 64-bit values in one register, but need to pass as two 163434b1a49cSRichard Henderson separate parameters. Split them. */ 163534b1a49cSRichard Henderson int orig_sizemask = sizemask; 163634b1a49cSRichard Henderson int orig_nargs = nargs; 163734b1a49cSRichard Henderson TCGv_i64 retl, reth; 1638ae8b75dcSRichard Henderson TCGTemp *split_args[MAX_OPC_PARAM]; 163934b1a49cSRichard Henderson 1640f764718dSRichard Henderson retl = NULL; 1641f764718dSRichard Henderson reth = NULL; 164234b1a49cSRichard Henderson if (sizemask != 0) { 164334b1a49cSRichard Henderson for (i = real_args = 0; i < nargs; ++i) { 164434b1a49cSRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 164534b1a49cSRichard Henderson if (is_64bit) { 1646085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 164734b1a49cSRichard Henderson TCGv_i32 h = tcg_temp_new_i32(); 164834b1a49cSRichard Henderson TCGv_i32 l = tcg_temp_new_i32(); 164934b1a49cSRichard Henderson tcg_gen_extr_i64_i32(l, h, orig); 1650ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(h); 1651ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(l); 165234b1a49cSRichard Henderson } else { 165334b1a49cSRichard Henderson split_args[real_args++] = args[i]; 165434b1a49cSRichard Henderson } 165534b1a49cSRichard Henderson } 165634b1a49cSRichard Henderson nargs = real_args; 165734b1a49cSRichard Henderson args = split_args; 165834b1a49cSRichard Henderson sizemask = 0; 165934b1a49cSRichard Henderson } 166034b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 16612bece2c8SRichard 
Henderson for (i = 0; i < nargs; ++i) { 16622bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 16632bece2c8SRichard Henderson int is_signed = sizemask & (2 << (i+1)*2); 16642bece2c8SRichard Henderson if (!is_64bit) { 16652bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 1666085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 16672bece2c8SRichard Henderson if (is_signed) { 16682bece2c8SRichard Henderson tcg_gen_ext32s_i64(temp, orig); 16692bece2c8SRichard Henderson } else { 16702bece2c8SRichard Henderson tcg_gen_ext32u_i64(temp, orig); 16712bece2c8SRichard Henderson } 1672ae8b75dcSRichard Henderson args[i] = tcgv_i64_temp(temp); 16732bece2c8SRichard Henderson } 16742bece2c8SRichard Henderson } 16752bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 16762bece2c8SRichard Henderson 167715fa08f8SRichard Henderson op = tcg_emit_op(INDEX_op_call); 167875e8b9b7SRichard Henderson 167975e8b9b7SRichard Henderson pi = 0; 1680ae8b75dcSRichard Henderson if (ret != NULL) { 168134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 168234b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 168334b1a49cSRichard Henderson if (orig_sizemask & 1) { 168434b1a49cSRichard Henderson /* The 32-bit ABI is going to return the 64-bit value in 168534b1a49cSRichard Henderson the %o0/%o1 register pair. Prepare for this by using 168634b1a49cSRichard Henderson two return temporaries, and reassemble below. 
*/ 168734b1a49cSRichard Henderson retl = tcg_temp_new_i64(); 168834b1a49cSRichard Henderson reth = tcg_temp_new_i64(); 1689ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(reth); 1690ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(retl); 169134b1a49cSRichard Henderson nb_rets = 2; 169234b1a49cSRichard Henderson } else { 1693ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 169434b1a49cSRichard Henderson nb_rets = 1; 169534b1a49cSRichard Henderson } 169634b1a49cSRichard Henderson #else 169734b1a49cSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) { 169802eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 1699ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1700ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1701a7812ae4Spbrook #else 1702ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1703ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1704a7812ae4Spbrook #endif 1705a7812ae4Spbrook nb_rets = 2; 170634b1a49cSRichard Henderson } else { 1707ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1708a7812ae4Spbrook nb_rets = 1; 1709a7812ae4Spbrook } 171034b1a49cSRichard Henderson #endif 1711a7812ae4Spbrook } else { 1712a7812ae4Spbrook nb_rets = 0; 1713a7812ae4Spbrook } 1714cd9090aaSRichard Henderson TCGOP_CALLO(op) = nb_rets; 171575e8b9b7SRichard Henderson 1716a7812ae4Spbrook real_args = 0; 1717a7812ae4Spbrook for (i = 0; i < nargs; i++) { 17182bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 1719bbb8a1b4SRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 172039cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS 172139cf05d3Sbellard /* some targets want aligned 64 bit args */ 1722ebd486d5Smalc if (real_args & 1) { 172375e8b9b7SRichard Henderson op->args[pi++] = TCG_CALL_DUMMY_ARG; 1724ebd486d5Smalc real_args++; 172539cf05d3Sbellard } 172639cf05d3Sbellard #endif 17273f90f252SRichard Henderson /* If stack grows up, then we will be placing 
successive 17283f90f252SRichard Henderson arguments at lower addresses, which means we need to 17293f90f252SRichard Henderson reverse the order compared to how we would normally 17303f90f252SRichard Henderson treat either big or little-endian. For those arguments 17313f90f252SRichard Henderson that will wind up in registers, this still works for 17323f90f252SRichard Henderson HPPA (the only current STACK_GROWSUP target) since the 17333f90f252SRichard Henderson argument registers are *also* allocated in decreasing 17343f90f252SRichard Henderson order. If another such target is added, this logic may 17353f90f252SRichard Henderson have to get more complicated to differentiate between 17363f90f252SRichard Henderson stack arguments and register arguments. */ 173702eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP) 1738ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1739ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1740c896fe29Sbellard #else 1741ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1742ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1743c896fe29Sbellard #endif 1744a7812ae4Spbrook real_args += 2; 17452bece2c8SRichard Henderson continue; 17462bece2c8SRichard Henderson } 17472bece2c8SRichard Henderson 1748ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1749a7812ae4Spbrook real_args++; 1750c896fe29Sbellard } 175175e8b9b7SRichard Henderson op->args[pi++] = (uintptr_t)func; 175275e8b9b7SRichard Henderson op->args[pi++] = flags; 1753cd9090aaSRichard Henderson TCGOP_CALLI(op) = real_args; 1754a7812ae4Spbrook 175575e8b9b7SRichard Henderson /* Make sure the fields didn't overflow. 
*/ 1756cd9090aaSRichard Henderson tcg_debug_assert(TCGOP_CALLI(op) == real_args); 175775e8b9b7SRichard Henderson tcg_debug_assert(pi <= ARRAY_SIZE(op->args)); 17582bece2c8SRichard Henderson 175934b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 176034b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 176134b1a49cSRichard Henderson /* Free all of the parts we allocated above. */ 176234b1a49cSRichard Henderson for (i = real_args = 0; i < orig_nargs; ++i) { 176334b1a49cSRichard Henderson int is_64bit = orig_sizemask & (1 << (i+1)*2); 176434b1a49cSRichard Henderson if (is_64bit) { 1765085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 1766085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 176734b1a49cSRichard Henderson } else { 176834b1a49cSRichard Henderson real_args++; 176934b1a49cSRichard Henderson } 177034b1a49cSRichard Henderson } 177134b1a49cSRichard Henderson if (orig_sizemask & 1) { 177234b1a49cSRichard Henderson /* The 32-bit ABI returned two 32-bit pieces. Re-assemble them. 177334b1a49cSRichard Henderson Note that describing these as TCGv_i64 eliminates an unnecessary 177434b1a49cSRichard Henderson zero-extension that tcg_gen_concat_i32_i64 would create. 
*/ 1775085272b3SRichard Henderson tcg_gen_concat32_i64(temp_tcgv_i64(ret), retl, reth); 177634b1a49cSRichard Henderson tcg_temp_free_i64(retl); 177734b1a49cSRichard Henderson tcg_temp_free_i64(reth); 177834b1a49cSRichard Henderson } 177934b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 17802bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 17812bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 17822bece2c8SRichard Henderson if (!is_64bit) { 1783085272b3SRichard Henderson tcg_temp_free_internal(args[i]); 17842bece2c8SRichard Henderson } 17852bece2c8SRichard Henderson } 17862bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1787a7812ae4Spbrook } 1788c896fe29Sbellard 17898fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1790c896fe29Sbellard { 1791ac3b8891SRichard Henderson int i, n; 1792c896fe29Sbellard TCGTemp *ts; 1793ac3b8891SRichard Henderson 1794ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 1795c896fe29Sbellard ts = &s->temps[i]; 1796ac3b8891SRichard Henderson ts->val_type = (ts->fixed_reg ? TEMP_VAL_REG : TEMP_VAL_MEM); 1797c896fe29Sbellard } 1798ac3b8891SRichard Henderson for (n = s->nb_temps; i < n; i++) { 1799e8996ee0Sbellard ts = &s->temps[i]; 1800ac3b8891SRichard Henderson ts->val_type = (ts->temp_local ? 
TEMP_VAL_MEM : TEMP_VAL_DEAD); 1801e8996ee0Sbellard ts->mem_allocated = 0; 1802e8996ee0Sbellard ts->fixed_reg = 0; 1803e8996ee0Sbellard } 1804f8b2f202SRichard Henderson 1805f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1806c896fe29Sbellard } 1807c896fe29Sbellard 1808f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1809f8b2f202SRichard Henderson TCGTemp *ts) 1810c896fe29Sbellard { 18111807f4c4SRichard Henderson int idx = temp_idx(ts); 1812ac56dd48Spbrook 1813fa477d25SRichard Henderson if (ts->temp_global) { 1814ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1815f8b2f202SRichard Henderson } else if (ts->temp_local) { 1816641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1817f8b2f202SRichard Henderson } else { 1818ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1819c896fe29Sbellard } 1820c896fe29Sbellard return buf; 1821c896fe29Sbellard } 1822c896fe29Sbellard 182343439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf, 182443439139SRichard Henderson int buf_size, TCGArg arg) 1825f8b2f202SRichard Henderson { 182643439139SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg)); 1827f8b2f202SRichard Henderson } 1828f8b2f202SRichard Henderson 18296e085f72SRichard Henderson /* Find helper name. */ 18306e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val) 1831e8996ee0Sbellard { 18326e085f72SRichard Henderson const char *ret = NULL; 1833619205fdSEmilio G. Cota if (helper_table) { 1834619205fdSEmilio G. 
Cota TCGHelperInfo *info = g_hash_table_lookup(helper_table, (gpointer)val); 183572866e82SRichard Henderson if (info) { 183672866e82SRichard Henderson ret = info->name; 183772866e82SRichard Henderson } 1838e8996ee0Sbellard } 18396e085f72SRichard Henderson return ret; 18404dc81f28Sbellard } 18414dc81f28Sbellard 1842f48f3edeSblueswir1 static const char * const cond_name[] = 1843f48f3edeSblueswir1 { 18440aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 18450aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1846f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1847f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1848f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1849f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1850f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1851f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1852f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1853f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1854f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1855f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1856f48f3edeSblueswir1 }; 1857f48f3edeSblueswir1 1858f713d6adSRichard Henderson static const char * const ldst_name[] = 1859f713d6adSRichard Henderson { 1860f713d6adSRichard Henderson [MO_UB] = "ub", 1861f713d6adSRichard Henderson [MO_SB] = "sb", 1862f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1863f713d6adSRichard Henderson [MO_LESW] = "lesw", 1864f713d6adSRichard Henderson [MO_LEUL] = "leul", 1865f713d6adSRichard Henderson [MO_LESL] = "lesl", 1866f713d6adSRichard Henderson [MO_LEQ] = "leq", 1867f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1868f713d6adSRichard Henderson [MO_BESW] = "besw", 1869f713d6adSRichard Henderson [MO_BEUL] = "beul", 1870f713d6adSRichard Henderson [MO_BESL] = "besl", 1871f713d6adSRichard Henderson [MO_BEQ] = "beq", 1872f713d6adSRichard Henderson }; 1873f713d6adSRichard Henderson 18741f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 18751f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY 18761f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = 
"un+", 18771f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 18781f00b27fSSergey Sorokin #else 18791f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 18801f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 18811f00b27fSSergey Sorokin #endif 18821f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 18831f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 18841f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 18851f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 18861f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 18871f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 18881f00b27fSSergey Sorokin }; 18891f00b27fSSergey Sorokin 1890*b016486eSRichard Henderson static inline bool tcg_regset_single(TCGRegSet d) 1891*b016486eSRichard Henderson { 1892*b016486eSRichard Henderson return (d & (d - 1)) == 0; 1893*b016486eSRichard Henderson } 1894*b016486eSRichard Henderson 1895*b016486eSRichard Henderson static inline TCGReg tcg_regset_first(TCGRegSet d) 1896*b016486eSRichard Henderson { 1897*b016486eSRichard Henderson if (TCG_TARGET_NB_REGS <= 32) { 1898*b016486eSRichard Henderson return ctz32(d); 1899*b016486eSRichard Henderson } else { 1900*b016486eSRichard Henderson return ctz64(d); 1901*b016486eSRichard Henderson } 1902*b016486eSRichard Henderson } 1903*b016486eSRichard Henderson 1904eeacee4dSBlue Swirl void tcg_dump_ops(TCGContext *s) 1905c896fe29Sbellard { 1906c896fe29Sbellard char buf[128]; 1907c45cb8bbSRichard Henderson TCGOp *op; 1908c896fe29Sbellard 190915fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 1910c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1911c45cb8bbSRichard Henderson const TCGOpDef *def; 1912c45cb8bbSRichard Henderson TCGOpcode c; 1913bdfb460eSRichard Henderson int col = 0; 1914c45cb8bbSRichard Henderson 1915c45cb8bbSRichard Henderson c = op->opc; 1916c896fe29Sbellard def = &tcg_op_defs[c]; 1917c45cb8bbSRichard Henderson 1918765b842aSRichard 
Henderson if (c == INDEX_op_insn_start) { 1919*b016486eSRichard Henderson nb_oargs = 0; 192015fa08f8SRichard Henderson col += qemu_log("\n ----"); 19219aef40edSRichard Henderson 19229aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 19239aef40edSRichard Henderson target_ulong a; 19247e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 1925efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 19267e4597d7Sbellard #else 1927efee3746SRichard Henderson a = op->args[i]; 19287e4597d7Sbellard #endif 1929bdfb460eSRichard Henderson col += qemu_log(" " TARGET_FMT_lx, a); 1930eeacee4dSBlue Swirl } 19317e4597d7Sbellard } else if (c == INDEX_op_call) { 1932c896fe29Sbellard /* variable number of arguments */ 1933cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 1934cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 1935c896fe29Sbellard nb_cargs = def->nb_cargs; 1936b03cce8eSbellard 1937cf066674SRichard Henderson /* function name, flags, out args */ 1938bdfb460eSRichard Henderson col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name, 1939efee3746SRichard Henderson tcg_find_helper(s, op->args[nb_oargs + nb_iargs]), 1940efee3746SRichard Henderson op->args[nb_oargs + nb_iargs + 1], nb_oargs); 1941b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 194243439139SRichard Henderson col += qemu_log(",%s", tcg_get_arg_str(s, buf, sizeof(buf), 1943efee3746SRichard Henderson op->args[i])); 1944b03cce8eSbellard } 1945cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1946efee3746SRichard Henderson TCGArg arg = op->args[nb_oargs + i]; 1947cf066674SRichard Henderson const char *t = "<dummy>"; 1948cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 194943439139SRichard Henderson t = tcg_get_arg_str(s, buf, sizeof(buf), arg); 1950b03cce8eSbellard } 1951bdfb460eSRichard Henderson col += qemu_log(",%s", t); 1952e8996ee0Sbellard } 1953b03cce8eSbellard } else { 1954bdfb460eSRichard Henderson col += 
qemu_log(" %s ", def->name); 1955c45cb8bbSRichard Henderson 1956c896fe29Sbellard nb_oargs = def->nb_oargs; 1957c896fe29Sbellard nb_iargs = def->nb_iargs; 1958c896fe29Sbellard nb_cargs = def->nb_cargs; 1959c896fe29Sbellard 1960d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 1961d2fd745fSRichard Henderson col += qemu_log("v%d,e%d,", 64 << TCGOP_VECL(op), 1962d2fd745fSRichard Henderson 8 << TCGOP_VECE(op)); 1963d2fd745fSRichard Henderson } 1964d2fd745fSRichard Henderson 1965c896fe29Sbellard k = 0; 1966c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1967eeacee4dSBlue Swirl if (k != 0) { 1968bdfb460eSRichard Henderson col += qemu_log(","); 1969eeacee4dSBlue Swirl } 197043439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1971efee3746SRichard Henderson op->args[k++])); 1972c896fe29Sbellard } 1973c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1974eeacee4dSBlue Swirl if (k != 0) { 1975bdfb460eSRichard Henderson col += qemu_log(","); 1976eeacee4dSBlue Swirl } 197743439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1978efee3746SRichard Henderson op->args[k++])); 1979c896fe29Sbellard } 1980be210acbSRichard Henderson switch (c) { 1981be210acbSRichard Henderson case INDEX_op_brcond_i32: 1982ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1983ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1984be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1985be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1986ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1987be210acbSRichard Henderson case INDEX_op_setcond_i64: 1988ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1989212be173SRichard Henderson case INDEX_op_cmp_vec: 1990efee3746SRichard Henderson if (op->args[k] < ARRAY_SIZE(cond_name) 1991efee3746SRichard Henderson && cond_name[op->args[k]]) { 1992efee3746SRichard Henderson col += qemu_log(",%s", cond_name[op->args[k++]]); 1993eeacee4dSBlue Swirl } else { 
1994efee3746SRichard Henderson col += qemu_log(",$0x%" TCG_PRIlx, op->args[k++]); 1995eeacee4dSBlue Swirl } 1996f48f3edeSblueswir1 i = 1; 1997be210acbSRichard Henderson break; 1998f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1999f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 2000f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 2001f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 200259227d5dSRichard Henderson { 2003efee3746SRichard Henderson TCGMemOpIdx oi = op->args[k++]; 200459227d5dSRichard Henderson TCGMemOp op = get_memop(oi); 200559227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 200659227d5dSRichard Henderson 200759c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 2008bdfb460eSRichard Henderson col += qemu_log(",$0x%x,%u", op, ix); 200959c4b7e8SRichard Henderson } else { 20101f00b27fSSergey Sorokin const char *s_al, *s_op; 20111f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 201259c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 2013bdfb460eSRichard Henderson col += qemu_log(",%s%s,%u", s_al, s_op, ix); 2014f713d6adSRichard Henderson } 2015f713d6adSRichard Henderson i = 1; 201659227d5dSRichard Henderson } 2017f713d6adSRichard Henderson break; 2018be210acbSRichard Henderson default: 2019f48f3edeSblueswir1 i = 0; 2020be210acbSRichard Henderson break; 2021be210acbSRichard Henderson } 202251e3972cSRichard Henderson switch (c) { 202351e3972cSRichard Henderson case INDEX_op_set_label: 202451e3972cSRichard Henderson case INDEX_op_br: 202551e3972cSRichard Henderson case INDEX_op_brcond_i32: 202651e3972cSRichard Henderson case INDEX_op_brcond_i64: 202751e3972cSRichard Henderson case INDEX_op_brcond2_i32: 2028efee3746SRichard Henderson col += qemu_log("%s$L%d", k ? 
"," : "", 2029efee3746SRichard Henderson arg_label(op->args[k])->id); 203051e3972cSRichard Henderson i++, k++; 203151e3972cSRichard Henderson break; 203251e3972cSRichard Henderson default: 203351e3972cSRichard Henderson break; 2034eeacee4dSBlue Swirl } 203551e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 2036efee3746SRichard Henderson col += qemu_log("%s$0x%" TCG_PRIlx, k ? "," : "", op->args[k]); 2037bdfb460eSRichard Henderson } 2038bdfb460eSRichard Henderson } 2039bdfb460eSRichard Henderson if (op->life) { 2040bdfb460eSRichard Henderson unsigned life = op->life; 2041bdfb460eSRichard Henderson 2042bdfb460eSRichard Henderson for (; col < 48; ++col) { 2043bdfb460eSRichard Henderson putc(' ', qemu_logfile); 2044bdfb460eSRichard Henderson } 2045bdfb460eSRichard Henderson 2046bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 2047bdfb460eSRichard Henderson qemu_log(" sync:"); 2048bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 2049bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 2050bdfb460eSRichard Henderson qemu_log(" %d", i); 2051bdfb460eSRichard Henderson } 2052bdfb460eSRichard Henderson } 2053bdfb460eSRichard Henderson } 2054bdfb460eSRichard Henderson life /= DEAD_ARG; 2055bdfb460eSRichard Henderson if (life) { 2056bdfb460eSRichard Henderson qemu_log(" dead:"); 2057bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 2058bdfb460eSRichard Henderson if (life & 1) { 2059bdfb460eSRichard Henderson qemu_log(" %d", i); 2060bdfb460eSRichard Henderson } 2061bdfb460eSRichard Henderson } 2062c896fe29Sbellard } 2063b03cce8eSbellard } 2064eeacee4dSBlue Swirl qemu_log("\n"); 2065c896fe29Sbellard } 2066c896fe29Sbellard } 2067c896fe29Sbellard 2068c896fe29Sbellard /* we give more priority to constraints with less registers */ 2069c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 2070c896fe29Sbellard { 2071c896fe29Sbellard const TCGArgConstraint *arg_ct; 2072c896fe29Sbellard 2073c896fe29Sbellard int i, n; 
2074c896fe29Sbellard arg_ct = &def->args_ct[k]; 2075c896fe29Sbellard if (arg_ct->ct & TCG_CT_ALIAS) { 2076c896fe29Sbellard /* an alias is equivalent to a single register */ 2077c896fe29Sbellard n = 1; 2078c896fe29Sbellard } else { 2079c896fe29Sbellard if (!(arg_ct->ct & TCG_CT_REG)) 2080c896fe29Sbellard return 0; 2081c896fe29Sbellard n = 0; 2082c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2083c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, i)) 2084c896fe29Sbellard n++; 2085c896fe29Sbellard } 2086c896fe29Sbellard } 2087c896fe29Sbellard return TCG_TARGET_NB_REGS - n + 1; 2088c896fe29Sbellard } 2089c896fe29Sbellard 2090c896fe29Sbellard /* sort from highest priority to lowest */ 2091c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 2092c896fe29Sbellard { 2093c896fe29Sbellard int i, j, p1, p2, tmp; 2094c896fe29Sbellard 2095c896fe29Sbellard for(i = 0; i < n; i++) 2096c896fe29Sbellard def->sorted_args[start + i] = start + i; 2097c896fe29Sbellard if (n <= 1) 2098c896fe29Sbellard return; 2099c896fe29Sbellard for(i = 0; i < n - 1; i++) { 2100c896fe29Sbellard for(j = i + 1; j < n; j++) { 2101c896fe29Sbellard p1 = get_constraint_priority(def, def->sorted_args[start + i]); 2102c896fe29Sbellard p2 = get_constraint_priority(def, def->sorted_args[start + j]); 2103c896fe29Sbellard if (p1 < p2) { 2104c896fe29Sbellard tmp = def->sorted_args[start + i]; 2105c896fe29Sbellard def->sorted_args[start + i] = def->sorted_args[start + j]; 2106c896fe29Sbellard def->sorted_args[start + j] = tmp; 2107c896fe29Sbellard } 2108c896fe29Sbellard } 2109c896fe29Sbellard } 2110c896fe29Sbellard } 2111c896fe29Sbellard 2112f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 2113c896fe29Sbellard { 2114a9751609SRichard Henderson TCGOpcode op; 2115c896fe29Sbellard 2116f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 2117f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 2118f69d277eSRichard Henderson const 
TCGTargetOpDef *tdefs; 2119069ea736SRichard Henderson TCGType type; 2120069ea736SRichard Henderson int i, nb_args; 2121f69d277eSRichard Henderson 2122f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 2123f69d277eSRichard Henderson continue; 2124f69d277eSRichard Henderson } 2125f69d277eSRichard Henderson 2126c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 2127f69d277eSRichard Henderson if (nb_args == 0) { 2128f69d277eSRichard Henderson continue; 2129f69d277eSRichard Henderson } 2130f69d277eSRichard Henderson 2131f69d277eSRichard Henderson tdefs = tcg_target_op_def(op); 2132f69d277eSRichard Henderson /* Missing TCGTargetOpDef entry. */ 2133f69d277eSRichard Henderson tcg_debug_assert(tdefs != NULL); 2134f69d277eSRichard Henderson 2135069ea736SRichard Henderson type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32); 2136c896fe29Sbellard for (i = 0; i < nb_args; i++) { 2137f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 2138f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 2139eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 2140f69d277eSRichard Henderson 2141ccb1bb66SRichard Henderson def->args_ct[i].u.regs = 0; 2142c896fe29Sbellard def->args_ct[i].ct = 0; 214317280ff4SRichard Henderson while (*ct_str != '\0') { 214417280ff4SRichard Henderson switch(*ct_str) { 214517280ff4SRichard Henderson case '0' ... '9': 214617280ff4SRichard Henderson { 214717280ff4SRichard Henderson int oarg = *ct_str - '0'; 214817280ff4SRichard Henderson tcg_debug_assert(ct_str == tdefs->args_ct_str[i]); 2149eabb7b91SAurelien Jarno tcg_debug_assert(oarg < def->nb_oargs); 2150eabb7b91SAurelien Jarno tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG); 215117280ff4SRichard Henderson /* TCG_CT_ALIAS is for the output arguments. 215217280ff4SRichard Henderson The input is tagged with TCG_CT_IALIAS. 
*/ 2153c896fe29Sbellard def->args_ct[i] = def->args_ct[oarg]; 215417280ff4SRichard Henderson def->args_ct[oarg].ct |= TCG_CT_ALIAS; 21555ff9d6a4Sbellard def->args_ct[oarg].alias_index = i; 2156c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_IALIAS; 21575ff9d6a4Sbellard def->args_ct[i].alias_index = oarg; 215817280ff4SRichard Henderson } 215917280ff4SRichard Henderson ct_str++; 2160c896fe29Sbellard break; 216182790a87SRichard Henderson case '&': 216282790a87SRichard Henderson def->args_ct[i].ct |= TCG_CT_NEWREG; 216382790a87SRichard Henderson ct_str++; 216482790a87SRichard Henderson break; 2165c896fe29Sbellard case 'i': 2166c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 2167c896fe29Sbellard ct_str++; 2168c896fe29Sbellard break; 2169c896fe29Sbellard default: 2170069ea736SRichard Henderson ct_str = target_parse_constraint(&def->args_ct[i], 2171069ea736SRichard Henderson ct_str, type); 2172f69d277eSRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 2173069ea736SRichard Henderson tcg_debug_assert(ct_str != NULL); 2174c896fe29Sbellard } 2175c896fe29Sbellard } 2176c896fe29Sbellard } 2177c896fe29Sbellard 2178c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? 
*/ 2179eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 2180c68aaa18SStefan Weil 2181c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 2182c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 2183c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 2184c896fe29Sbellard } 2185c896fe29Sbellard } 2186c896fe29Sbellard 21870c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 21880c627cdcSRichard Henderson { 2189d88a117eSRichard Henderson TCGLabel *label; 2190d88a117eSRichard Henderson 2191d88a117eSRichard Henderson switch (op->opc) { 2192d88a117eSRichard Henderson case INDEX_op_br: 2193d88a117eSRichard Henderson label = arg_label(op->args[0]); 2194d88a117eSRichard Henderson label->refs--; 2195d88a117eSRichard Henderson break; 2196d88a117eSRichard Henderson case INDEX_op_brcond_i32: 2197d88a117eSRichard Henderson case INDEX_op_brcond_i64: 2198d88a117eSRichard Henderson label = arg_label(op->args[3]); 2199d88a117eSRichard Henderson label->refs--; 2200d88a117eSRichard Henderson break; 2201d88a117eSRichard Henderson case INDEX_op_brcond2_i32: 2202d88a117eSRichard Henderson label = arg_label(op->args[5]); 2203d88a117eSRichard Henderson label->refs--; 2204d88a117eSRichard Henderson break; 2205d88a117eSRichard Henderson default: 2206d88a117eSRichard Henderson break; 2207d88a117eSRichard Henderson } 2208d88a117eSRichard Henderson 220915fa08f8SRichard Henderson QTAILQ_REMOVE(&s->ops, op, link); 221015fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&s->free_ops, op, link); 2211abebf925SRichard Henderson s->nb_ops--; 22120c627cdcSRichard Henderson 22130c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 2214c3fac113SEmilio G. 
Cota atomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1); 22150c627cdcSRichard Henderson #endif 22160c627cdcSRichard Henderson } 22170c627cdcSRichard Henderson 221815fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc) 221915fa08f8SRichard Henderson { 222015fa08f8SRichard Henderson TCGContext *s = tcg_ctx; 222115fa08f8SRichard Henderson TCGOp *op; 222215fa08f8SRichard Henderson 222315fa08f8SRichard Henderson if (likely(QTAILQ_EMPTY(&s->free_ops))) { 222415fa08f8SRichard Henderson op = tcg_malloc(sizeof(TCGOp)); 222515fa08f8SRichard Henderson } else { 222615fa08f8SRichard Henderson op = QTAILQ_FIRST(&s->free_ops); 222715fa08f8SRichard Henderson QTAILQ_REMOVE(&s->free_ops, op, link); 222815fa08f8SRichard Henderson } 222915fa08f8SRichard Henderson memset(op, 0, offsetof(TCGOp, link)); 223015fa08f8SRichard Henderson op->opc = opc; 2231abebf925SRichard Henderson s->nb_ops++; 223215fa08f8SRichard Henderson 223315fa08f8SRichard Henderson return op; 223415fa08f8SRichard Henderson } 223515fa08f8SRichard Henderson 223615fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc) 223715fa08f8SRichard Henderson { 223815fa08f8SRichard Henderson TCGOp *op = tcg_op_alloc(opc); 223915fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link); 224015fa08f8SRichard Henderson return op; 224115fa08f8SRichard Henderson } 224215fa08f8SRichard Henderson 2243ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 22445a18407fSRichard Henderson { 224515fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 224615fa08f8SRichard Henderson QTAILQ_INSERT_BEFORE(old_op, new_op, link); 22475a18407fSRichard Henderson return new_op; 22485a18407fSRichard Henderson } 22495a18407fSRichard Henderson 2250ac1043f6SEmilio G. 
Cota TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 22515a18407fSRichard Henderson { 225215fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 225315fa08f8SRichard Henderson QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link); 22545a18407fSRichard Henderson return new_op; 22555a18407fSRichard Henderson } 22565a18407fSRichard Henderson 2257b4fc67c7SRichard Henderson /* Reachable analysis : remove unreachable code. */ 2258b4fc67c7SRichard Henderson static void reachable_code_pass(TCGContext *s) 2259b4fc67c7SRichard Henderson { 2260b4fc67c7SRichard Henderson TCGOp *op, *op_next; 2261b4fc67c7SRichard Henderson bool dead = false; 2262b4fc67c7SRichard Henderson 2263b4fc67c7SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 2264b4fc67c7SRichard Henderson bool remove = dead; 2265b4fc67c7SRichard Henderson TCGLabel *label; 2266b4fc67c7SRichard Henderson int call_flags; 2267b4fc67c7SRichard Henderson 2268b4fc67c7SRichard Henderson switch (op->opc) { 2269b4fc67c7SRichard Henderson case INDEX_op_set_label: 2270b4fc67c7SRichard Henderson label = arg_label(op->args[0]); 2271b4fc67c7SRichard Henderson if (label->refs == 0) { 2272b4fc67c7SRichard Henderson /* 2273b4fc67c7SRichard Henderson * While there is an occasional backward branch, virtually 2274b4fc67c7SRichard Henderson * all branches generated by the translators are forward. 2275b4fc67c7SRichard Henderson * Which means that generally we will have already removed 2276b4fc67c7SRichard Henderson * all references to the label that will be, and there is 2277b4fc67c7SRichard Henderson * little to be gained by iterating. 2278b4fc67c7SRichard Henderson */ 2279b4fc67c7SRichard Henderson remove = true; 2280b4fc67c7SRichard Henderson } else { 2281b4fc67c7SRichard Henderson /* Once we see a label, insns become live again. 
*/ 2282b4fc67c7SRichard Henderson dead = false; 2283b4fc67c7SRichard Henderson remove = false; 2284b4fc67c7SRichard Henderson 2285b4fc67c7SRichard Henderson /* 2286b4fc67c7SRichard Henderson * Optimization can fold conditional branches to unconditional. 2287b4fc67c7SRichard Henderson * If we find a label with one reference which is preceded by 2288b4fc67c7SRichard Henderson * an unconditional branch to it, remove both. This needed to 2289b4fc67c7SRichard Henderson * wait until the dead code in between them was removed. 2290b4fc67c7SRichard Henderson */ 2291b4fc67c7SRichard Henderson if (label->refs == 1) { 2292b4fc67c7SRichard Henderson TCGOp *op_prev = QTAILQ_PREV(op, TCGOpHead, link); 2293b4fc67c7SRichard Henderson if (op_prev->opc == INDEX_op_br && 2294b4fc67c7SRichard Henderson label == arg_label(op_prev->args[0])) { 2295b4fc67c7SRichard Henderson tcg_op_remove(s, op_prev); 2296b4fc67c7SRichard Henderson remove = true; 2297b4fc67c7SRichard Henderson } 2298b4fc67c7SRichard Henderson } 2299b4fc67c7SRichard Henderson } 2300b4fc67c7SRichard Henderson break; 2301b4fc67c7SRichard Henderson 2302b4fc67c7SRichard Henderson case INDEX_op_br: 2303b4fc67c7SRichard Henderson case INDEX_op_exit_tb: 2304b4fc67c7SRichard Henderson case INDEX_op_goto_ptr: 2305b4fc67c7SRichard Henderson /* Unconditional branches; everything following is dead. */ 2306b4fc67c7SRichard Henderson dead = true; 2307b4fc67c7SRichard Henderson break; 2308b4fc67c7SRichard Henderson 2309b4fc67c7SRichard Henderson case INDEX_op_call: 2310b4fc67c7SRichard Henderson /* Notice noreturn helper calls, raising exceptions. 
*/ 2311b4fc67c7SRichard Henderson call_flags = op->args[TCGOP_CALLO(op) + TCGOP_CALLI(op) + 1]; 2312b4fc67c7SRichard Henderson if (call_flags & TCG_CALL_NO_RETURN) { 2313b4fc67c7SRichard Henderson dead = true; 2314b4fc67c7SRichard Henderson } 2315b4fc67c7SRichard Henderson break; 2316b4fc67c7SRichard Henderson 2317b4fc67c7SRichard Henderson case INDEX_op_insn_start: 2318b4fc67c7SRichard Henderson /* Never remove -- we need to keep these for unwind. */ 2319b4fc67c7SRichard Henderson remove = false; 2320b4fc67c7SRichard Henderson break; 2321b4fc67c7SRichard Henderson 2322b4fc67c7SRichard Henderson default: 2323b4fc67c7SRichard Henderson break; 2324b4fc67c7SRichard Henderson } 2325b4fc67c7SRichard Henderson 2326b4fc67c7SRichard Henderson if (remove) { 2327b4fc67c7SRichard Henderson tcg_op_remove(s, op); 2328b4fc67c7SRichard Henderson } 2329b4fc67c7SRichard Henderson } 2330b4fc67c7SRichard Henderson } 2331b4fc67c7SRichard Henderson 2332c70fbf0aSRichard Henderson #define TS_DEAD 1 2333c70fbf0aSRichard Henderson #define TS_MEM 2 2334c70fbf0aSRichard Henderson 23355a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 23365a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 23375a18407fSRichard Henderson 23389c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 23399c43b68dSAurelien Jarno should be in memory. 
*/ 2340b83eabeaSRichard Henderson static void tcg_la_func_end(TCGContext *s) 2341c896fe29Sbellard { 2342b83eabeaSRichard Henderson int ng = s->nb_globals; 2343b83eabeaSRichard Henderson int nt = s->nb_temps; 2344b83eabeaSRichard Henderson int i; 2345b83eabeaSRichard Henderson 2346b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2347b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2348b83eabeaSRichard Henderson } 2349b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2350b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD; 2351b83eabeaSRichard Henderson } 2352c896fe29Sbellard } 2353c896fe29Sbellard 23549c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 23559c43b68dSAurelien Jarno and local temps should be in memory. */ 2356b83eabeaSRichard Henderson static void tcg_la_bb_end(TCGContext *s) 2357641d5fbeSbellard { 2358b83eabeaSRichard Henderson int ng = s->nb_globals; 2359b83eabeaSRichard Henderson int nt = s->nb_temps; 2360b83eabeaSRichard Henderson int i; 2361641d5fbeSbellard 2362b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2363b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2364c70fbf0aSRichard Henderson } 2365b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2366b83eabeaSRichard Henderson s->temps[i].state = (s->temps[i].temp_local 2367b83eabeaSRichard Henderson ? TS_DEAD | TS_MEM 2368b83eabeaSRichard Henderson : TS_DEAD); 2369641d5fbeSbellard } 2370641d5fbeSbellard } 2371641d5fbeSbellard 2372a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 2373c896fe29Sbellard given input arguments is dead. Instructions updating dead 2374c896fe29Sbellard temporaries are removed. 
*/ 2375b83eabeaSRichard Henderson static void liveness_pass_1(TCGContext *s) 2376c896fe29Sbellard { 2377c70fbf0aSRichard Henderson int nb_globals = s->nb_globals; 237815fa08f8SRichard Henderson TCGOp *op, *op_prev; 2379c896fe29Sbellard 2380b83eabeaSRichard Henderson tcg_la_func_end(s); 2381c896fe29Sbellard 238215fa08f8SRichard Henderson QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, TCGOpHead, link, op_prev) { 2383c45cb8bbSRichard Henderson int i, nb_iargs, nb_oargs; 2384c45cb8bbSRichard Henderson TCGOpcode opc_new, opc_new2; 2385c45cb8bbSRichard Henderson bool have_opc_new2; 2386a1b3c48dSRichard Henderson TCGLifeData arg_life = 0; 2387b83eabeaSRichard Henderson TCGTemp *arg_ts; 2388c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 2389c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 2390c45cb8bbSRichard Henderson 2391c45cb8bbSRichard Henderson switch (opc) { 2392c896fe29Sbellard case INDEX_op_call: 2393c6e113f5Sbellard { 2394c6e113f5Sbellard int call_flags; 2395c6e113f5Sbellard 2396cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2397cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 2398efee3746SRichard Henderson call_flags = op->args[nb_oargs + nb_iargs + 1]; 2399c6e113f5Sbellard 2400c45cb8bbSRichard Henderson /* pure functions can be removed if their result is unused */ 240178505279SAurelien Jarno if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) { 2402c6e113f5Sbellard for (i = 0; i < nb_oargs; i++) { 2403b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2404b83eabeaSRichard Henderson if (arg_ts->state != TS_DEAD) { 2405c6e113f5Sbellard goto do_not_remove_call; 2406c6e113f5Sbellard } 24079c43b68dSAurelien Jarno } 2408c45cb8bbSRichard Henderson goto do_remove; 2409c6e113f5Sbellard } else { 2410c6e113f5Sbellard do_not_remove_call: 2411c896fe29Sbellard 2412c896fe29Sbellard /* output args are dead */ 2413c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2414b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2415b83eabeaSRichard 
Henderson if (arg_ts->state & TS_DEAD) { 2416a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 24176b64b624SAurelien Jarno } 2418b83eabeaSRichard Henderson if (arg_ts->state & TS_MEM) { 2419a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 24209c43b68dSAurelien Jarno } 2421b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 2422c896fe29Sbellard } 2423c896fe29Sbellard 242478505279SAurelien Jarno if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS | 242578505279SAurelien Jarno TCG_CALL_NO_READ_GLOBALS))) { 24269c43b68dSAurelien Jarno /* globals should go back to memory */ 2427b83eabeaSRichard Henderson for (i = 0; i < nb_globals; i++) { 2428b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2429b83eabeaSRichard Henderson } 2430c70fbf0aSRichard Henderson } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) { 2431c70fbf0aSRichard Henderson /* globals should be synced to memory */ 2432c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 2433b83eabeaSRichard Henderson s->temps[i].state |= TS_MEM; 2434c70fbf0aSRichard Henderson } 2435b9c18f56Saurel32 } 2436c896fe29Sbellard 2437c19f47bfSAurelien Jarno /* record arguments that die in this helper */ 2438866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2439b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2440b83eabeaSRichard Henderson if (arg_ts && arg_ts->state & TS_DEAD) { 2441a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2442c896fe29Sbellard } 2443c896fe29Sbellard } 244467cc32ebSVeres Lajos /* input arguments are live for preceding opcodes */ 2445c70fbf0aSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2446b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2447b83eabeaSRichard Henderson if (arg_ts) { 2448b83eabeaSRichard Henderson arg_ts->state &= ~TS_DEAD; 2449c70fbf0aSRichard Henderson } 2450c19f47bfSAurelien Jarno } 2451c6e113f5Sbellard } 2452c6e113f5Sbellard } 2453c896fe29Sbellard break; 2454765b842aSRichard Henderson case 
INDEX_op_insn_start: 2455c896fe29Sbellard break; 24565ff9d6a4Sbellard case INDEX_op_discard: 24575ff9d6a4Sbellard /* mark the temporary as dead */ 2458b83eabeaSRichard Henderson arg_temp(op->args[0])->state = TS_DEAD; 24595ff9d6a4Sbellard break; 24601305c451SRichard Henderson 24611305c451SRichard Henderson case INDEX_op_add2_i32: 2462c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i32; 2463f1fae40cSRichard Henderson goto do_addsub2; 24641305c451SRichard Henderson case INDEX_op_sub2_i32: 2465c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i32; 2466f1fae40cSRichard Henderson goto do_addsub2; 2467f1fae40cSRichard Henderson case INDEX_op_add2_i64: 2468c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i64; 2469f1fae40cSRichard Henderson goto do_addsub2; 2470f1fae40cSRichard Henderson case INDEX_op_sub2_i64: 2471c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i64; 2472f1fae40cSRichard Henderson do_addsub2: 24731305c451SRichard Henderson nb_iargs = 4; 24741305c451SRichard Henderson nb_oargs = 2; 24751305c451SRichard Henderson /* Test if the high part of the operation is dead, but not 24761305c451SRichard Henderson the low part. The result can be optimized to a simple 24771305c451SRichard Henderson add or sub. This happens often for x86_64 guest when the 24781305c451SRichard Henderson cpu mode is set to 32 bit. */ 2479b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2480b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 24811305c451SRichard Henderson goto do_remove; 24821305c451SRichard Henderson } 2483c45cb8bbSRichard Henderson /* Replace the opcode and adjust the args in place, 2484c45cb8bbSRichard Henderson leaving 3 unused args at the end. */ 2485c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2486efee3746SRichard Henderson op->args[1] = op->args[2]; 2487efee3746SRichard Henderson op->args[2] = op->args[4]; 24881305c451SRichard Henderson /* Fall through and mark the single-word operation live. 
*/ 24891305c451SRichard Henderson nb_iargs = 2; 24901305c451SRichard Henderson nb_oargs = 1; 24911305c451SRichard Henderson } 24921305c451SRichard Henderson goto do_not_remove; 24931305c451SRichard Henderson 24941414968aSRichard Henderson case INDEX_op_mulu2_i32: 2495c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2496c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i32; 2497c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i32; 249803271524SRichard Henderson goto do_mul2; 2499f1fae40cSRichard Henderson case INDEX_op_muls2_i32: 2500c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2501c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i32; 2502c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i32; 2503f1fae40cSRichard Henderson goto do_mul2; 2504f1fae40cSRichard Henderson case INDEX_op_mulu2_i64: 2505c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2506c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i64; 2507c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i64; 250803271524SRichard Henderson goto do_mul2; 2509f1fae40cSRichard Henderson case INDEX_op_muls2_i64: 2510c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2511c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i64; 2512c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i64; 251303271524SRichard Henderson goto do_mul2; 2514f1fae40cSRichard Henderson do_mul2: 25151414968aSRichard Henderson nb_iargs = 2; 25161414968aSRichard Henderson nb_oargs = 2; 2517b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2518b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 251903271524SRichard Henderson /* Both parts of the operation are dead. */ 25201414968aSRichard Henderson goto do_remove; 25211414968aSRichard Henderson } 252203271524SRichard Henderson /* The high part of the operation is dead; generate the low. 
*/ 2523c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2524efee3746SRichard Henderson op->args[1] = op->args[2]; 2525efee3746SRichard Henderson op->args[2] = op->args[3]; 2526b83eabeaSRichard Henderson } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) { 252703271524SRichard Henderson /* The low part of the operation is dead; generate the high. */ 2528c45cb8bbSRichard Henderson op->opc = opc = opc_new2; 2529efee3746SRichard Henderson op->args[0] = op->args[1]; 2530efee3746SRichard Henderson op->args[1] = op->args[2]; 2531efee3746SRichard Henderson op->args[2] = op->args[3]; 253203271524SRichard Henderson } else { 253303271524SRichard Henderson goto do_not_remove; 253403271524SRichard Henderson } 253503271524SRichard Henderson /* Mark the single-word operation live. */ 25361414968aSRichard Henderson nb_oargs = 1; 25371414968aSRichard Henderson goto do_not_remove; 25381414968aSRichard Henderson 2539c896fe29Sbellard default: 25401305c451SRichard Henderson /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */ 2541c896fe29Sbellard nb_iargs = def->nb_iargs; 2542c896fe29Sbellard nb_oargs = def->nb_oargs; 2543c896fe29Sbellard 2544c896fe29Sbellard /* Test if the operation can be removed because all 25455ff9d6a4Sbellard its outputs are dead. 
We assume that nb_oargs == 0 25465ff9d6a4Sbellard implies side effects */ 25475ff9d6a4Sbellard if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) { 2548c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2549b83eabeaSRichard Henderson if (arg_temp(op->args[i])->state != TS_DEAD) { 2550c896fe29Sbellard goto do_not_remove; 2551c896fe29Sbellard } 25529c43b68dSAurelien Jarno } 25531305c451SRichard Henderson do_remove: 25540c627cdcSRichard Henderson tcg_op_remove(s, op); 2555c896fe29Sbellard } else { 2556c896fe29Sbellard do_not_remove: 2557c896fe29Sbellard /* output args are dead */ 2558c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2559b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2560b83eabeaSRichard Henderson if (arg_ts->state & TS_DEAD) { 2561a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 25626b64b624SAurelien Jarno } 2563b83eabeaSRichard Henderson if (arg_ts->state & TS_MEM) { 2564a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 25659c43b68dSAurelien Jarno } 2566b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 2567c896fe29Sbellard } 2568c896fe29Sbellard 2569c896fe29Sbellard /* if end of basic block, update */ 2570c896fe29Sbellard if (def->flags & TCG_OPF_BB_END) { 2571b83eabeaSRichard Henderson tcg_la_bb_end(s); 25723d5c5f87SAurelien Jarno } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 25733d5c5f87SAurelien Jarno /* globals should be synced to memory */ 2574c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 2575b83eabeaSRichard Henderson s->temps[i].state |= TS_MEM; 2576c70fbf0aSRichard Henderson } 2577c896fe29Sbellard } 2578c896fe29Sbellard 2579c19f47bfSAurelien Jarno /* record arguments that die in this opcode */ 2580866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 2581b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2582b83eabeaSRichard Henderson if (arg_ts->state & TS_DEAD) { 2583a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2584c896fe29Sbellard } 2585c19f47bfSAurelien 
Jarno } 258667cc32ebSVeres Lajos /* input arguments are live for preceding opcodes */ 2587c19f47bfSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 2588b83eabeaSRichard Henderson arg_temp(op->args[i])->state &= ~TS_DEAD; 2589c896fe29Sbellard } 2590c896fe29Sbellard } 2591c896fe29Sbellard break; 2592c896fe29Sbellard } 2593bee158cbSRichard Henderson op->life = arg_life; 2594c896fe29Sbellard } 25951ff0a2c5SEvgeny Voevodin } 2596c896fe29Sbellard 25975a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries. */ 2598b83eabeaSRichard Henderson static bool liveness_pass_2(TCGContext *s) 25995a18407fSRichard Henderson { 26005a18407fSRichard Henderson int nb_globals = s->nb_globals; 260115fa08f8SRichard Henderson int nb_temps, i; 26025a18407fSRichard Henderson bool changes = false; 260315fa08f8SRichard Henderson TCGOp *op, *op_next; 26045a18407fSRichard Henderson 26055a18407fSRichard Henderson /* Create a temporary for each indirect global. */ 26065a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 26075a18407fSRichard Henderson TCGTemp *its = &s->temps[i]; 26085a18407fSRichard Henderson if (its->indirect_reg) { 26095a18407fSRichard Henderson TCGTemp *dts = tcg_temp_alloc(s); 26105a18407fSRichard Henderson dts->type = its->type; 26115a18407fSRichard Henderson dts->base_type = its->base_type; 2612b83eabeaSRichard Henderson its->state_ptr = dts; 2613b83eabeaSRichard Henderson } else { 2614b83eabeaSRichard Henderson its->state_ptr = NULL; 26155a18407fSRichard Henderson } 2616b83eabeaSRichard Henderson /* All globals begin dead. 
*/ 2617b83eabeaSRichard Henderson its->state = TS_DEAD; 26185a18407fSRichard Henderson } 2619b83eabeaSRichard Henderson for (nb_temps = s->nb_temps; i < nb_temps; ++i) { 2620b83eabeaSRichard Henderson TCGTemp *its = &s->temps[i]; 2621b83eabeaSRichard Henderson its->state_ptr = NULL; 2622b83eabeaSRichard Henderson its->state = TS_DEAD; 2623b83eabeaSRichard Henderson } 26245a18407fSRichard Henderson 262515fa08f8SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 26265a18407fSRichard Henderson TCGOpcode opc = op->opc; 26275a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 26285a18407fSRichard Henderson TCGLifeData arg_life = op->life; 26295a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 2630b83eabeaSRichard Henderson TCGTemp *arg_ts, *dir_ts; 26315a18407fSRichard Henderson 26325a18407fSRichard Henderson if (opc == INDEX_op_call) { 2633cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2634cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 2635efee3746SRichard Henderson call_flags = op->args[nb_oargs + nb_iargs + 1]; 26365a18407fSRichard Henderson } else { 26375a18407fSRichard Henderson nb_iargs = def->nb_iargs; 26385a18407fSRichard Henderson nb_oargs = def->nb_oargs; 26395a18407fSRichard Henderson 26405a18407fSRichard Henderson /* Set flags similar to how calls require. */ 26415a18407fSRichard Henderson if (def->flags & TCG_OPF_BB_END) { 26425a18407fSRichard Henderson /* Like writing globals: save_globals */ 26435a18407fSRichard Henderson call_flags = 0; 26445a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 26455a18407fSRichard Henderson /* Like reading globals: sync_globals */ 26465a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 26475a18407fSRichard Henderson } else { 26485a18407fSRichard Henderson /* No effect on globals. 
*/ 26495a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 26505a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 26515a18407fSRichard Henderson } 26525a18407fSRichard Henderson } 26535a18407fSRichard Henderson 26545a18407fSRichard Henderson /* Make sure that input arguments are available. */ 26555a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2656b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2657b83eabeaSRichard Henderson if (arg_ts) { 2658b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2659b83eabeaSRichard Henderson if (dir_ts && arg_ts->state == TS_DEAD) { 2660b83eabeaSRichard Henderson TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32 26615a18407fSRichard Henderson ? INDEX_op_ld_i32 26625a18407fSRichard Henderson : INDEX_op_ld_i64); 2663ac1043f6SEmilio G. Cota TCGOp *lop = tcg_op_insert_before(s, op, lopc); 26645a18407fSRichard Henderson 2665b83eabeaSRichard Henderson lop->args[0] = temp_arg(dir_ts); 2666b83eabeaSRichard Henderson lop->args[1] = temp_arg(arg_ts->mem_base); 2667b83eabeaSRichard Henderson lop->args[2] = arg_ts->mem_offset; 26685a18407fSRichard Henderson 26695a18407fSRichard Henderson /* Loaded, but synced with memory. */ 2670b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 26715a18407fSRichard Henderson } 26725a18407fSRichard Henderson } 26735a18407fSRichard Henderson } 26745a18407fSRichard Henderson 26755a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 26765a18407fSRichard Henderson No action is required except keeping temp_state up to date 26775a18407fSRichard Henderson so that we reload when needed. 
*/ 26785a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2679b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2680b83eabeaSRichard Henderson if (arg_ts) { 2681b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2682b83eabeaSRichard Henderson if (dir_ts) { 2683b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 26845a18407fSRichard Henderson changes = true; 26855a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2686b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 26875a18407fSRichard Henderson } 26885a18407fSRichard Henderson } 26895a18407fSRichard Henderson } 26905a18407fSRichard Henderson } 26915a18407fSRichard Henderson 26925a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 26935a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 26945a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 26955a18407fSRichard Henderson /* Nothing to do */ 26965a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 26975a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 26985a18407fSRichard Henderson /* Liveness should see that globals are synced back, 26995a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. */ 2700b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2701b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2702b83eabeaSRichard Henderson || arg_ts->state != 0); 27035a18407fSRichard Henderson } 27045a18407fSRichard Henderson } else { 27055a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 27065a18407fSRichard Henderson /* Liveness should see that globals are saved back, 27075a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. 
*/ 2708b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2709b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2710b83eabeaSRichard Henderson || arg_ts->state == TS_DEAD); 27115a18407fSRichard Henderson } 27125a18407fSRichard Henderson } 27135a18407fSRichard Henderson 27145a18407fSRichard Henderson /* Outputs become available. */ 27155a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 2716b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2717b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2718b83eabeaSRichard Henderson if (!dir_ts) { 27195a18407fSRichard Henderson continue; 27205a18407fSRichard Henderson } 2721b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 27225a18407fSRichard Henderson changes = true; 27235a18407fSRichard Henderson 27245a18407fSRichard Henderson /* The output is now live and modified. */ 2725b83eabeaSRichard Henderson arg_ts->state = 0; 27265a18407fSRichard Henderson 27275a18407fSRichard Henderson /* Sync outputs upon their last write. */ 27285a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 2729b83eabeaSRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 27305a18407fSRichard Henderson ? INDEX_op_st_i32 27315a18407fSRichard Henderson : INDEX_op_st_i64); 2732ac1043f6SEmilio G. Cota TCGOp *sop = tcg_op_insert_after(s, op, sopc); 27335a18407fSRichard Henderson 2734b83eabeaSRichard Henderson sop->args[0] = temp_arg(dir_ts); 2735b83eabeaSRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 2736b83eabeaSRichard Henderson sop->args[2] = arg_ts->mem_offset; 27375a18407fSRichard Henderson 2738b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 27395a18407fSRichard Henderson } 27405a18407fSRichard Henderson /* Drop outputs that are dead. 
*/ 27415a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2742b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 27435a18407fSRichard Henderson } 27445a18407fSRichard Henderson } 27455a18407fSRichard Henderson } 27465a18407fSRichard Henderson 27475a18407fSRichard Henderson return changes; 27485a18407fSRichard Henderson } 27495a18407fSRichard Henderson 27508d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2751c896fe29Sbellard static void dump_regs(TCGContext *s) 2752c896fe29Sbellard { 2753c896fe29Sbellard TCGTemp *ts; 2754c896fe29Sbellard int i; 2755c896fe29Sbellard char buf[64]; 2756c896fe29Sbellard 2757c896fe29Sbellard for(i = 0; i < s->nb_temps; i++) { 2758c896fe29Sbellard ts = &s->temps[i]; 275943439139SRichard Henderson printf(" %10s: ", tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2760c896fe29Sbellard switch(ts->val_type) { 2761c896fe29Sbellard case TEMP_VAL_REG: 2762c896fe29Sbellard printf("%s", tcg_target_reg_names[ts->reg]); 2763c896fe29Sbellard break; 2764c896fe29Sbellard case TEMP_VAL_MEM: 2765b3a62939SRichard Henderson printf("%d(%s)", (int)ts->mem_offset, 2766b3a62939SRichard Henderson tcg_target_reg_names[ts->mem_base->reg]); 2767c896fe29Sbellard break; 2768c896fe29Sbellard case TEMP_VAL_CONST: 2769c896fe29Sbellard printf("$0x%" TCG_PRIlx, ts->val); 2770c896fe29Sbellard break; 2771c896fe29Sbellard case TEMP_VAL_DEAD: 2772c896fe29Sbellard printf("D"); 2773c896fe29Sbellard break; 2774c896fe29Sbellard default: 2775c896fe29Sbellard printf("???"); 2776c896fe29Sbellard break; 2777c896fe29Sbellard } 2778c896fe29Sbellard printf("\n"); 2779c896fe29Sbellard } 2780c896fe29Sbellard 2781c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2782f8b2f202SRichard Henderson if (s->reg_to_temp[i] != NULL) { 2783c896fe29Sbellard printf("%s: %s\n", 2784c896fe29Sbellard tcg_target_reg_names[i], 2785f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i])); 2786c896fe29Sbellard } 2787c896fe29Sbellard } 2788c896fe29Sbellard } 
2789c896fe29Sbellard 2790c896fe29Sbellard static void check_regs(TCGContext *s) 2791c896fe29Sbellard { 2792869938aeSRichard Henderson int reg; 2793b6638662SRichard Henderson int k; 2794c896fe29Sbellard TCGTemp *ts; 2795c896fe29Sbellard char buf[64]; 2796c896fe29Sbellard 2797c896fe29Sbellard for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) { 2798f8b2f202SRichard Henderson ts = s->reg_to_temp[reg]; 2799f8b2f202SRichard Henderson if (ts != NULL) { 2800f8b2f202SRichard Henderson if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) { 2801c896fe29Sbellard printf("Inconsistency for register %s:\n", 2802c896fe29Sbellard tcg_target_reg_names[reg]); 2803b03cce8eSbellard goto fail; 2804c896fe29Sbellard } 2805c896fe29Sbellard } 2806c896fe29Sbellard } 2807c896fe29Sbellard for (k = 0; k < s->nb_temps; k++) { 2808c896fe29Sbellard ts = &s->temps[k]; 2809f8b2f202SRichard Henderson if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg 2810f8b2f202SRichard Henderson && s->reg_to_temp[ts->reg] != ts) { 2811c896fe29Sbellard printf("Inconsistency for temp %s:\n", 2812f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2813b03cce8eSbellard fail: 2814c896fe29Sbellard printf("reg state:\n"); 2815c896fe29Sbellard dump_regs(s); 2816c896fe29Sbellard tcg_abort(); 2817c896fe29Sbellard } 2818c896fe29Sbellard } 2819c896fe29Sbellard } 2820c896fe29Sbellard #endif 2821c896fe29Sbellard 28222272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts) 2823c896fe29Sbellard { 28249b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64) 28259b9c37c3SRichard Henderson /* Sparc64 stack is accessed with offset of 2047 */ 2826b591dc59SBlue Swirl s->current_frame_offset = (s->current_frame_offset + 2827b591dc59SBlue Swirl (tcg_target_long)sizeof(tcg_target_long) - 1) & 2828b591dc59SBlue Swirl ~(sizeof(tcg_target_long) - 1); 2829f44c9960SBlue Swirl #endif 2830b591dc59SBlue Swirl if (s->current_frame_offset + 
(tcg_target_long)sizeof(tcg_target_long) > 2831b591dc59SBlue Swirl s->frame_end) { 28325ff9d6a4Sbellard tcg_abort(); 2833b591dc59SBlue Swirl } 2834c896fe29Sbellard ts->mem_offset = s->current_frame_offset; 2835b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 2836c896fe29Sbellard ts->mem_allocated = 1; 2837e2c6d1b4SRichard Henderson s->current_frame_offset += sizeof(tcg_target_long); 2838c896fe29Sbellard } 2839c896fe29Sbellard 2840b3915dbbSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet); 2841b3915dbbSRichard Henderson 284259d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 284359d7c14eSRichard Henderson mark it free; otherwise mark it dead. */ 284459d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 2845c896fe29Sbellard { 284659d7c14eSRichard Henderson if (ts->fixed_reg) { 284759d7c14eSRichard Henderson return; 284859d7c14eSRichard Henderson } 284959d7c14eSRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 285059d7c14eSRichard Henderson s->reg_to_temp[ts->reg] = NULL; 285159d7c14eSRichard Henderson } 285259d7c14eSRichard Henderson ts->val_type = (free_or_dead < 0 285359d7c14eSRichard Henderson || ts->temp_local 2854fa477d25SRichard Henderson || ts->temp_global 285559d7c14eSRichard Henderson ? TEMP_VAL_MEM : TEMP_VAL_DEAD); 285659d7c14eSRichard Henderson } 2857c896fe29Sbellard 285859d7c14eSRichard Henderson /* Mark a temporary as dead. */ 285959d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 286059d7c14eSRichard Henderson { 286159d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 286259d7c14eSRichard Henderson } 286359d7c14eSRichard Henderson 286459d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 286559d7c14eSRichard Henderson registers needs to be allocated to store a constant. 
If 'free_or_dead' 286659d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 286759d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. */ 286859d7c14eSRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, 286959d7c14eSRichard Henderson TCGRegSet allocated_regs, int free_or_dead) 287059d7c14eSRichard Henderson { 287159d7c14eSRichard Henderson if (ts->fixed_reg) { 287259d7c14eSRichard Henderson return; 287359d7c14eSRichard Henderson } 287459d7c14eSRichard Henderson if (!ts->mem_coherent) { 28757f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 28762272e4a7SRichard Henderson temp_allocate_frame(s, ts); 287759d7c14eSRichard Henderson } 287859d7c14eSRichard Henderson switch (ts->val_type) { 287959d7c14eSRichard Henderson case TEMP_VAL_CONST: 288059d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 288159d7c14eSRichard Henderson require it later in a register, so attempt to store the 288259d7c14eSRichard Henderson constant to memory directly. 
*/ 288359d7c14eSRichard Henderson if (free_or_dead 288459d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 288559d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 288659d7c14eSRichard Henderson break; 288759d7c14eSRichard Henderson } 288859d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 288959d7c14eSRichard Henderson allocated_regs); 289059d7c14eSRichard Henderson /* fallthrough */ 289159d7c14eSRichard Henderson 289259d7c14eSRichard Henderson case TEMP_VAL_REG: 289359d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 289459d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 289559d7c14eSRichard Henderson break; 289659d7c14eSRichard Henderson 289759d7c14eSRichard Henderson case TEMP_VAL_MEM: 289859d7c14eSRichard Henderson break; 289959d7c14eSRichard Henderson 290059d7c14eSRichard Henderson case TEMP_VAL_DEAD: 290159d7c14eSRichard Henderson default: 290259d7c14eSRichard Henderson tcg_abort(); 2903c896fe29Sbellard } 29047f6ceedfSAurelien Jarno ts->mem_coherent = 1; 29057f6ceedfSAurelien Jarno } 290659d7c14eSRichard Henderson if (free_or_dead) { 290759d7c14eSRichard Henderson temp_free_or_dead(s, ts, free_or_dead); 290859d7c14eSRichard Henderson } 290959d7c14eSRichard Henderson } 29107f6ceedfSAurelien Jarno 29117f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 2912b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 29137f6ceedfSAurelien Jarno { 2914f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 2915f8b2f202SRichard Henderson if (ts != NULL) { 291659d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, -1); 2917c896fe29Sbellard } 2918c896fe29Sbellard } 2919c896fe29Sbellard 2920*b016486eSRichard Henderson /** 2921*b016486eSRichard Henderson * tcg_reg_alloc: 2922*b016486eSRichard Henderson * @required_regs: Set of registers in which we must allocate. 
2923*b016486eSRichard Henderson * @allocated_regs: Set of registers which must be avoided. 2924*b016486eSRichard Henderson * @preferred_regs: Set of registers we should prefer. 2925*b016486eSRichard Henderson * @rev: True if we search the registers in "indirect" order. 2926*b016486eSRichard Henderson * 2927*b016486eSRichard Henderson * The allocated register must be in @required_regs & ~@allocated_regs, 2928*b016486eSRichard Henderson * but if we can put it in @preferred_regs we may save a move later. 2929*b016486eSRichard Henderson */ 2930*b016486eSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet required_regs, 2931*b016486eSRichard Henderson TCGRegSet allocated_regs, 2932*b016486eSRichard Henderson TCGRegSet preferred_regs, bool rev) 2933c896fe29Sbellard { 2934*b016486eSRichard Henderson int i, j, f, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 2935*b016486eSRichard Henderson TCGRegSet reg_ct[2]; 293691478cefSRichard Henderson const int *order; 2937c896fe29Sbellard 2938*b016486eSRichard Henderson reg_ct[1] = required_regs & ~allocated_regs; 2939*b016486eSRichard Henderson tcg_debug_assert(reg_ct[1] != 0); 2940*b016486eSRichard Henderson reg_ct[0] = reg_ct[1] & preferred_regs; 2941*b016486eSRichard Henderson 2942*b016486eSRichard Henderson /* Skip the preferred_regs option if it cannot be satisfied, 2943*b016486eSRichard Henderson or if the preference made no difference. */ 2944*b016486eSRichard Henderson f = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1]; 2945*b016486eSRichard Henderson 294691478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 2947c896fe29Sbellard 2948*b016486eSRichard Henderson /* Try free registers, preferences first. */ 2949*b016486eSRichard Henderson for (j = f; j < 2; j++) { 2950*b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 2951*b016486eSRichard Henderson 2952*b016486eSRichard Henderson if (tcg_regset_single(set)) { 2953*b016486eSRichard Henderson /* One register in the set. 
*/ 2954*b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 2955*b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL) { 2956c896fe29Sbellard return reg; 2957c896fe29Sbellard } 2958*b016486eSRichard Henderson } else { 295991478cefSRichard Henderson for (i = 0; i < n; i++) { 2960*b016486eSRichard Henderson TCGReg reg = order[i]; 2961*b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL && 2962*b016486eSRichard Henderson tcg_regset_test_reg(set, reg)) { 2963*b016486eSRichard Henderson return reg; 2964*b016486eSRichard Henderson } 2965*b016486eSRichard Henderson } 2966*b016486eSRichard Henderson } 2967*b016486eSRichard Henderson } 2968*b016486eSRichard Henderson 2969*b016486eSRichard Henderson /* We must spill something. */ 2970*b016486eSRichard Henderson for (j = f; j < 2; j++) { 2971*b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 2972*b016486eSRichard Henderson 2973*b016486eSRichard Henderson if (tcg_regset_single(set)) { 2974*b016486eSRichard Henderson /* One register in the set. */ 2975*b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 2976b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 2977c896fe29Sbellard return reg; 2978*b016486eSRichard Henderson } else { 2979*b016486eSRichard Henderson for (i = 0; i < n; i++) { 2980*b016486eSRichard Henderson TCGReg reg = order[i]; 2981*b016486eSRichard Henderson if (tcg_regset_test_reg(set, reg)) { 2982*b016486eSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 2983*b016486eSRichard Henderson return reg; 2984*b016486eSRichard Henderson } 2985*b016486eSRichard Henderson } 2986c896fe29Sbellard } 2987c896fe29Sbellard } 2988c896fe29Sbellard 2989c896fe29Sbellard tcg_abort(); 2990c896fe29Sbellard } 2991c896fe29Sbellard 299240ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 299340ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. 
*/ 299440ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 299540ae5c62SRichard Henderson TCGRegSet allocated_regs) 299640ae5c62SRichard Henderson { 299740ae5c62SRichard Henderson TCGReg reg; 299840ae5c62SRichard Henderson 299940ae5c62SRichard Henderson switch (ts->val_type) { 300040ae5c62SRichard Henderson case TEMP_VAL_REG: 300140ae5c62SRichard Henderson return; 300240ae5c62SRichard Henderson case TEMP_VAL_CONST: 3003*b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3004*b016486eSRichard Henderson 0, ts->indirect_base); 300540ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 300640ae5c62SRichard Henderson ts->mem_coherent = 0; 300740ae5c62SRichard Henderson break; 300840ae5c62SRichard Henderson case TEMP_VAL_MEM: 3009*b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3010*b016486eSRichard Henderson 0, ts->indirect_base); 301140ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 301240ae5c62SRichard Henderson ts->mem_coherent = 1; 301340ae5c62SRichard Henderson break; 301440ae5c62SRichard Henderson case TEMP_VAL_DEAD: 301540ae5c62SRichard Henderson default: 301640ae5c62SRichard Henderson tcg_abort(); 301740ae5c62SRichard Henderson } 301840ae5c62SRichard Henderson ts->reg = reg; 301940ae5c62SRichard Henderson ts->val_type = TEMP_VAL_REG; 302040ae5c62SRichard Henderson s->reg_to_temp[reg] = ts; 302140ae5c62SRichard Henderson } 302240ae5c62SRichard Henderson 302359d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 3024e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 302559d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 30261ad80729SAurelien Jarno { 30272c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 3028eabb7b91SAurelien Jarno in memory. 
Keep an tcg_debug_assert for safety. */ 3029f8bf00f1SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg); 30301ad80729SAurelien Jarno } 30311ad80729SAurelien Jarno 30329814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 3033641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 3034641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 3035641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 3036641d5fbeSbellard { 3037ac3b8891SRichard Henderson int i, n; 3038641d5fbeSbellard 3039ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 3040b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 3041641d5fbeSbellard } 3042e5097dc8Sbellard } 3043e5097dc8Sbellard 30443d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 30453d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 30463d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 30473d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 30483d5c5f87SAurelien Jarno { 3049ac3b8891SRichard Henderson int i, n; 30503d5c5f87SAurelien Jarno 3051ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 305212b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 305312b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 305412b9b11aSRichard Henderson || ts->fixed_reg 305512b9b11aSRichard Henderson || ts->mem_coherent); 30563d5c5f87SAurelien Jarno } 30573d5c5f87SAurelien Jarno } 30583d5c5f87SAurelien Jarno 3059e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 3060e8996ee0Sbellard all globals are stored at their canonical location. 
*/ 3061e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 3062e5097dc8Sbellard { 3063e5097dc8Sbellard int i; 3064e5097dc8Sbellard 3065c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 3066b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 3067641d5fbeSbellard if (ts->temp_local) { 3068b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 3069641d5fbeSbellard } else { 30702c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 3071eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 3072eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3073c896fe29Sbellard } 3074641d5fbeSbellard } 3075e8996ee0Sbellard 3076e8996ee0Sbellard save_globals(s, allocated_regs); 3077c896fe29Sbellard } 3078c896fe29Sbellard 30790fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 30800fe4fca4SPaolo Bonzini tcg_target_ulong val, TCGLifeData arg_life) 3081e8996ee0Sbellard { 3082e8996ee0Sbellard if (ots->fixed_reg) { 308359d7c14eSRichard Henderson /* For fixed registers, we do not do any constant propagation. */ 3084e8996ee0Sbellard tcg_out_movi(s, ots->type, ots->reg, val); 308559d7c14eSRichard Henderson return; 308659d7c14eSRichard Henderson } 308759d7c14eSRichard Henderson 308859d7c14eSRichard Henderson /* The movi is not explicitly generated here. 
*/ 3089f8b2f202SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 3090f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 3091f8b2f202SRichard Henderson } 3092e8996ee0Sbellard ots->val_type = TEMP_VAL_CONST; 3093e8996ee0Sbellard ots->val = val; 309459d7c14eSRichard Henderson ots->mem_coherent = 0; 3095ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 309659d7c14eSRichard Henderson temp_sync(s, ots, s->reserved_regs, IS_DEAD_ARG(0)); 309759d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 3098f8bf00f1SRichard Henderson temp_dead(s, ots); 30994c4e1ab2SAurelien Jarno } 3100e8996ee0Sbellard } 3101e8996ee0Sbellard 3102dd186292SRichard Henderson static void tcg_reg_alloc_movi(TCGContext *s, const TCGOp *op) 31030fe4fca4SPaolo Bonzini { 310443439139SRichard Henderson TCGTemp *ots = arg_temp(op->args[0]); 3105dd186292SRichard Henderson tcg_target_ulong val = op->args[1]; 31060fe4fca4SPaolo Bonzini 3107dd186292SRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, op->life); 31080fe4fca4SPaolo Bonzini } 31090fe4fca4SPaolo Bonzini 3110dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op) 3111c896fe29Sbellard { 3112dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3113c29c1d7eSAurelien Jarno TCGRegSet allocated_regs; 3114c896fe29Sbellard TCGTemp *ts, *ots; 3115450445d5SRichard Henderson TCGType otype, itype; 3116c896fe29Sbellard 3117d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 311843439139SRichard Henderson ots = arg_temp(op->args[0]); 311943439139SRichard Henderson ts = arg_temp(op->args[1]); 3120450445d5SRichard Henderson 3121450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. 
*/ 3122450445d5SRichard Henderson otype = ots->type; 3123450445d5SRichard Henderson itype = ts->type; 3124c896fe29Sbellard 31250fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 31260fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 31270fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 31280fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 31290fe4fca4SPaolo Bonzini temp_dead(s, ts); 31300fe4fca4SPaolo Bonzini } 31310fe4fca4SPaolo Bonzini tcg_reg_alloc_do_movi(s, ots, val, arg_life); 31320fe4fca4SPaolo Bonzini return; 31330fe4fca4SPaolo Bonzini } 31340fe4fca4SPaolo Bonzini 31350fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 31360fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 31370fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 31380fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 31390fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 314040ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], allocated_regs); 3141c29c1d7eSAurelien Jarno } 3142c29c1d7eSAurelien Jarno 31430fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 3144c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(0) && !ots->fixed_reg) { 3145c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 3146c29c1d7eSAurelien Jarno liveness analysis disabled). 
*/ 3147eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 3148c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 31492272e4a7SRichard Henderson temp_allocate_frame(s, ots); 3150c29c1d7eSAurelien Jarno } 3151b3a62939SRichard Henderson tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset); 3152c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 3153f8bf00f1SRichard Henderson temp_dead(s, ts); 3154c29c1d7eSAurelien Jarno } 3155f8bf00f1SRichard Henderson temp_dead(s, ots); 3156e8996ee0Sbellard } else { 3157c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) { 3158c29c1d7eSAurelien Jarno /* the mov can be suppressed */ 3159c29c1d7eSAurelien Jarno if (ots->val_type == TEMP_VAL_REG) { 3160f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 3161c896fe29Sbellard } 3162c29c1d7eSAurelien Jarno ots->reg = ts->reg; 3163f8bf00f1SRichard Henderson temp_dead(s, ts); 3164c29c1d7eSAurelien Jarno } else { 3165c29c1d7eSAurelien Jarno if (ots->val_type != TEMP_VAL_REG) { 3166c29c1d7eSAurelien Jarno /* When allocating a new register, make sure to not spill the 3167c29c1d7eSAurelien Jarno input one. 
*/ 3168c29c1d7eSAurelien Jarno tcg_regset_set_reg(allocated_regs, ts->reg); 3169450445d5SRichard Henderson ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 3170*b016486eSRichard Henderson allocated_regs, 0, 3171*b016486eSRichard Henderson ots->indirect_base); 3172c29c1d7eSAurelien Jarno } 3173450445d5SRichard Henderson tcg_out_mov(s, otype, ots->reg, ts->reg); 3174c29c1d7eSAurelien Jarno } 3175c896fe29Sbellard ots->val_type = TEMP_VAL_REG; 3176c896fe29Sbellard ots->mem_coherent = 0; 3177f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = ots; 3178ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 317959d7c14eSRichard Henderson temp_sync(s, ots, allocated_regs, 0); 3180c29c1d7eSAurelien Jarno } 3181ec7a869dSAurelien Jarno } 3182c896fe29Sbellard } 3183c896fe29Sbellard 3184dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op) 3185c896fe29Sbellard { 3186dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3187dd186292SRichard Henderson const TCGOpDef * const def = &tcg_op_defs[op->opc]; 318882790a87SRichard Henderson TCGRegSet i_allocated_regs; 318982790a87SRichard Henderson TCGRegSet o_allocated_regs; 3190b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 3191b6638662SRichard Henderson TCGReg reg; 3192c896fe29Sbellard TCGArg arg; 3193c896fe29Sbellard const TCGArgConstraint *arg_ct; 3194c896fe29Sbellard TCGTemp *ts; 3195c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 3196c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 3197c896fe29Sbellard 3198c896fe29Sbellard nb_oargs = def->nb_oargs; 3199c896fe29Sbellard nb_iargs = def->nb_iargs; 3200c896fe29Sbellard 3201c896fe29Sbellard /* copy constants */ 3202c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 3203dd186292SRichard Henderson op->args + nb_oargs + nb_iargs, 3204c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 3205c896fe29Sbellard 3206d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 3207d21369f5SRichard Henderson o_allocated_regs 
= s->reserved_regs; 320882790a87SRichard Henderson 3209c896fe29Sbellard /* satisfy input constraints */ 3210c896fe29Sbellard for (k = 0; k < nb_iargs; k++) { 3211c896fe29Sbellard i = def->sorted_args[nb_oargs + k]; 3212dd186292SRichard Henderson arg = op->args[i]; 3213c896fe29Sbellard arg_ct = &def->args_ct[i]; 321443439139SRichard Henderson ts = arg_temp(arg); 321540ae5c62SRichard Henderson 321640ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 321740ae5c62SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct)) { 3218c896fe29Sbellard /* constant is OK for instruction */ 3219c896fe29Sbellard const_args[i] = 1; 3220c896fe29Sbellard new_args[i] = ts->val; 3221c896fe29Sbellard goto iarg_end; 3222c896fe29Sbellard } 322340ae5c62SRichard Henderson 322482790a87SRichard Henderson temp_load(s, ts, arg_ct->u.regs, i_allocated_regs); 322540ae5c62SRichard Henderson 32265ff9d6a4Sbellard if (arg_ct->ct & TCG_CT_IALIAS) { 32275ff9d6a4Sbellard if (ts->fixed_reg) { 32285ff9d6a4Sbellard /* if fixed register, we must allocate a new register 32295ff9d6a4Sbellard if the alias is not the same register */ 3230dd186292SRichard Henderson if (arg != op->args[arg_ct->alias_index]) 32315ff9d6a4Sbellard goto allocate_in_reg; 32325ff9d6a4Sbellard } else { 3233c896fe29Sbellard /* if the input is aliased to an output and if it is 3234c896fe29Sbellard not dead after the instruction, we must allocate 3235c896fe29Sbellard a new register and move it */ 3236866cb6cbSAurelien Jarno if (!IS_DEAD_ARG(i)) { 3237c896fe29Sbellard goto allocate_in_reg; 3238c896fe29Sbellard } 32397e1df267SAurelien Jarno /* check if the current register has already been allocated 32407e1df267SAurelien Jarno for another input aliased to an output */ 32417e1df267SAurelien Jarno int k2, i2; 32427e1df267SAurelien Jarno for (k2 = 0 ; k2 < k ; k2++) { 32437e1df267SAurelien Jarno i2 = def->sorted_args[nb_oargs + k2]; 32447e1df267SAurelien Jarno if ((def->args_ct[i2].ct & TCG_CT_IALIAS) && 
32457e1df267SAurelien Jarno (new_args[i2] == ts->reg)) { 32467e1df267SAurelien Jarno goto allocate_in_reg; 32477e1df267SAurelien Jarno } 32487e1df267SAurelien Jarno } 32495ff9d6a4Sbellard } 3250866cb6cbSAurelien Jarno } 3251c896fe29Sbellard reg = ts->reg; 3252c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3253c896fe29Sbellard /* nothing to do : the constraint is satisfied */ 3254c896fe29Sbellard } else { 3255c896fe29Sbellard allocate_in_reg: 3256c896fe29Sbellard /* allocate a new register matching the constraint 3257c896fe29Sbellard and move the temporary register into it */ 325882790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs, 3259*b016486eSRichard Henderson 0, ts->indirect_base); 32603b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3261c896fe29Sbellard } 3262c896fe29Sbellard new_args[i] = reg; 3263c896fe29Sbellard const_args[i] = 0; 326482790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 3265c896fe29Sbellard iarg_end: ; 3266c896fe29Sbellard } 3267c896fe29Sbellard 3268c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3269866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 3270866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 327143439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3272c896fe29Sbellard } 3273c896fe29Sbellard } 3274c896fe29Sbellard 3275a52ad07eSAurelien Jarno if (def->flags & TCG_OPF_BB_END) { 327682790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 3277a52ad07eSAurelien Jarno } else { 3278c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 3279b03cce8eSbellard /* XXX: permit generic clobber register list ? 
*/ 3280c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3281c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 328282790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 3283c896fe29Sbellard } 3284c896fe29Sbellard } 32853d5c5f87SAurelien Jarno } 32863d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 32873d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 32883d5c5f87SAurelien Jarno an exception. */ 328982790a87SRichard Henderson sync_globals(s, i_allocated_regs); 3290c896fe29Sbellard } 3291c896fe29Sbellard 3292c896fe29Sbellard /* satisfy the output constraints */ 3293c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 3294c896fe29Sbellard i = def->sorted_args[k]; 3295dd186292SRichard Henderson arg = op->args[i]; 3296c896fe29Sbellard arg_ct = &def->args_ct[i]; 329743439139SRichard Henderson ts = arg_temp(arg); 329817280ff4SRichard Henderson if ((arg_ct->ct & TCG_CT_ALIAS) 329917280ff4SRichard Henderson && !const_args[arg_ct->alias_index]) { 33005ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 330182790a87SRichard Henderson } else if (arg_ct->ct & TCG_CT_NEWREG) { 330282790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, 330382790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 3304*b016486eSRichard Henderson 0, ts->indirect_base); 3305c896fe29Sbellard } else { 3306c896fe29Sbellard /* if fixed register, we try to use it */ 3307c896fe29Sbellard reg = ts->reg; 3308c896fe29Sbellard if (ts->fixed_reg && 3309c896fe29Sbellard tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3310c896fe29Sbellard goto oarg_end; 3311c896fe29Sbellard } 331282790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs, 3313*b016486eSRichard Henderson 0, ts->indirect_base); 3314c896fe29Sbellard } 331582790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 3316c896fe29Sbellard /* if a fixed register is used, then a move will be 
done afterwards */ 3317c896fe29Sbellard if (!ts->fixed_reg) { 3318639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3319f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3320639368ddSAurelien Jarno } 3321c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3322c896fe29Sbellard ts->reg = reg; 3323c896fe29Sbellard /* temp value is modified, so the value kept in memory is 3324c896fe29Sbellard potentially not the same */ 3325c896fe29Sbellard ts->mem_coherent = 0; 3326f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3327c896fe29Sbellard } 3328c896fe29Sbellard oarg_end: 3329c896fe29Sbellard new_args[i] = reg; 3330c896fe29Sbellard } 3331e8996ee0Sbellard } 3332c896fe29Sbellard 3333c896fe29Sbellard /* emit instruction */ 3334d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 3335d2fd745fSRichard Henderson tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op), 3336d2fd745fSRichard Henderson new_args, const_args); 3337d2fd745fSRichard Henderson } else { 3338dd186292SRichard Henderson tcg_out_op(s, op->opc, new_args, const_args); 3339d2fd745fSRichard Henderson } 3340c896fe29Sbellard 3341c896fe29Sbellard /* move the outputs in the correct register if needed */ 3342c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 334343439139SRichard Henderson ts = arg_temp(op->args[i]); 3344c896fe29Sbellard reg = new_args[i]; 3345c896fe29Sbellard if (ts->fixed_reg && ts->reg != reg) { 33463b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3347c896fe29Sbellard } 3348ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 334982790a87SRichard Henderson temp_sync(s, ts, o_allocated_regs, IS_DEAD_ARG(i)); 335059d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3351f8bf00f1SRichard Henderson temp_dead(s, ts); 3352ec7a869dSAurelien Jarno } 3353c896fe29Sbellard } 3354c896fe29Sbellard } 3355c896fe29Sbellard 3356b03cce8eSbellard #ifdef TCG_TARGET_STACK_GROWSUP 3357b03cce8eSbellard #define STACK_DIR(x) (-(x)) 3358b03cce8eSbellard #else 3359b03cce8eSbellard 
#define STACK_DIR(x) (x) 3360b03cce8eSbellard #endif 3361b03cce8eSbellard 3362dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op) 3363c896fe29Sbellard { 3364cd9090aaSRichard Henderson const int nb_oargs = TCGOP_CALLO(op); 3365cd9090aaSRichard Henderson const int nb_iargs = TCGOP_CALLI(op); 3366dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3367b6638662SRichard Henderson int flags, nb_regs, i; 3368b6638662SRichard Henderson TCGReg reg; 3369cf066674SRichard Henderson TCGArg arg; 3370c896fe29Sbellard TCGTemp *ts; 3371d3452f1fSRichard Henderson intptr_t stack_offset; 3372d3452f1fSRichard Henderson size_t call_stack_size; 3373cf066674SRichard Henderson tcg_insn_unit *func_addr; 3374cf066674SRichard Henderson int allocate_args; 3375c896fe29Sbellard TCGRegSet allocated_regs; 3376c896fe29Sbellard 3377dd186292SRichard Henderson func_addr = (tcg_insn_unit *)(intptr_t)op->args[nb_oargs + nb_iargs]; 3378dd186292SRichard Henderson flags = op->args[nb_oargs + nb_iargs + 1]; 3379c896fe29Sbellard 33806e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 3381c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 3382c45cb8bbSRichard Henderson nb_regs = nb_iargs; 3383cf066674SRichard Henderson } 3384c896fe29Sbellard 3385c896fe29Sbellard /* assign stack slots first */ 3386c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 3387c896fe29Sbellard call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) & 3388c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 3389b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 3390b03cce8eSbellard if (allocate_args) { 3391345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 3392345649c0SBlue Swirl preallocate call stack */ 3393345649c0SBlue Swirl tcg_abort(); 3394b03cce8eSbellard } 339539cf05d3Sbellard 339639cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 3397c45cb8bbSRichard 
Henderson for (i = nb_regs; i < nb_iargs; i++) { 3398dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 339939cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP 340039cf05d3Sbellard stack_offset -= sizeof(tcg_target_long); 340139cf05d3Sbellard #endif 340239cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 340343439139SRichard Henderson ts = arg_temp(arg); 340440ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 340540ae5c62SRichard Henderson s->reserved_regs); 3406e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 340739cf05d3Sbellard } 340839cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP 340939cf05d3Sbellard stack_offset += sizeof(tcg_target_long); 341039cf05d3Sbellard #endif 3411c896fe29Sbellard } 3412c896fe29Sbellard 3413c896fe29Sbellard /* assign input registers */ 3414d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 3415c896fe29Sbellard for (i = 0; i < nb_regs; i++) { 3416dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 341739cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 341843439139SRichard Henderson ts = arg_temp(arg); 3419c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 3420b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 342140ae5c62SRichard Henderson 3422c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 3423c896fe29Sbellard if (ts->reg != reg) { 34243b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3425c896fe29Sbellard } 3426c896fe29Sbellard } else { 3427ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 342840ae5c62SRichard Henderson 342940ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 343040ae5c62SRichard Henderson temp_load(s, ts, arg_set, allocated_regs); 3431c896fe29Sbellard } 343240ae5c62SRichard Henderson 3433c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 3434c896fe29Sbellard } 343539cf05d3Sbellard } 3436c896fe29Sbellard 3437c896fe29Sbellard /* mark dead temporaries and free the associated registers 
*/ 3438866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 3439866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 344043439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3441c896fe29Sbellard } 3442c896fe29Sbellard } 3443c896fe29Sbellard 3444c896fe29Sbellard /* clobber call registers */ 3445c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3446c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 3447b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 3448c896fe29Sbellard } 3449c896fe29Sbellard } 3450c896fe29Sbellard 345178505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 345278505279SAurelien Jarno they might be read. */ 345378505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 345478505279SAurelien Jarno /* Nothing to do */ 345578505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 345678505279SAurelien Jarno sync_globals(s, allocated_regs); 345778505279SAurelien Jarno } else { 3458e8996ee0Sbellard save_globals(s, allocated_regs); 3459b9c18f56Saurel32 } 3460c896fe29Sbellard 3461cf066674SRichard Henderson tcg_out_call(s, func_addr); 3462c896fe29Sbellard 3463c896fe29Sbellard /* assign output registers and emit moves if needed */ 3464c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 3465dd186292SRichard Henderson arg = op->args[i]; 346643439139SRichard Henderson ts = arg_temp(arg); 3467c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 3468eabb7b91SAurelien Jarno tcg_debug_assert(s->reg_to_temp[reg] == NULL); 346934b1a49cSRichard Henderson 3470c896fe29Sbellard if (ts->fixed_reg) { 3471c896fe29Sbellard if (ts->reg != reg) { 34723b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3473c896fe29Sbellard } 3474c896fe29Sbellard } else { 3475639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3476f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3477639368ddSAurelien Jarno } 
3478c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3479c896fe29Sbellard ts->reg = reg; 3480c896fe29Sbellard ts->mem_coherent = 0; 3481f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3482ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 348359d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i)); 348459d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3485f8bf00f1SRichard Henderson temp_dead(s, ts); 3486c896fe29Sbellard } 3487c896fe29Sbellard } 34888c11ad25SAurelien Jarno } 3489c896fe29Sbellard } 3490c896fe29Sbellard 3491c896fe29Sbellard #ifdef CONFIG_PROFILER 3492c896fe29Sbellard 3493c3fac113SEmilio G. Cota /* avoid copy/paste errors */ 3494c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field) \ 3495c3fac113SEmilio G. Cota do { \ 3496c3fac113SEmilio G. Cota (to)->field += atomic_read(&((from)->field)); \ 3497c3fac113SEmilio G. Cota } while (0) 3498c896fe29Sbellard 3499c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field) \ 3500c3fac113SEmilio G. Cota do { \ 3501c3fac113SEmilio G. Cota typeof((from)->field) val__ = atomic_read(&((from)->field)); \ 3502c3fac113SEmilio G. Cota if (val__ > (to)->field) { \ 3503c3fac113SEmilio G. Cota (to)->field = val__; \ 3504c3fac113SEmilio G. Cota } \ 3505c3fac113SEmilio G. Cota } while (0) 3506c3fac113SEmilio G. Cota 3507c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */ 3508c3fac113SEmilio G. Cota static inline 3509c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table) 3510c896fe29Sbellard { 35113468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 3512c3fac113SEmilio G. Cota unsigned int i; 3513c3fac113SEmilio G. Cota 35143468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 35153468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 35163468b59eSEmilio G. Cota const TCGProfile *orig = &s->prof; 3517c3fac113SEmilio G. Cota 3518c3fac113SEmilio G. Cota if (counters) { 351972fd2efbSEmilio G. 
Cota PROF_ADD(prof, orig, cpu_exec_time); 3520c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count1); 3521c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count); 3522c3fac113SEmilio G. Cota PROF_ADD(prof, orig, op_count); 3523c3fac113SEmilio G. Cota PROF_MAX(prof, orig, op_count_max); 3524c3fac113SEmilio G. Cota PROF_ADD(prof, orig, temp_count); 3525c3fac113SEmilio G. Cota PROF_MAX(prof, orig, temp_count_max); 3526c3fac113SEmilio G. Cota PROF_ADD(prof, orig, del_op_count); 3527c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_in_len); 3528c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_out_len); 3529c3fac113SEmilio G. Cota PROF_ADD(prof, orig, search_out_len); 3530c3fac113SEmilio G. Cota PROF_ADD(prof, orig, interm_time); 3531c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_time); 3532c3fac113SEmilio G. Cota PROF_ADD(prof, orig, la_time); 3533c3fac113SEmilio G. Cota PROF_ADD(prof, orig, opt_time); 3534c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_count); 3535c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_time); 3536c3fac113SEmilio G. Cota } 3537c3fac113SEmilio G. Cota if (table) { 3538c896fe29Sbellard int i; 3539d70724ceSzhanghailiang 354015fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 3541c3fac113SEmilio G. Cota PROF_ADD(prof, orig, table_op_count[i]); 3542c3fac113SEmilio G. Cota } 3543c3fac113SEmilio G. Cota } 3544c3fac113SEmilio G. Cota } 3545c3fac113SEmilio G. Cota } 3546c3fac113SEmilio G. Cota 3547c3fac113SEmilio G. Cota #undef PROF_ADD 3548c3fac113SEmilio G. Cota #undef PROF_MAX 3549c3fac113SEmilio G. Cota 3550c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof) 3551c3fac113SEmilio G. Cota { 3552c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, true, false); 3553c3fac113SEmilio G. Cota } 3554c3fac113SEmilio G. Cota 3555c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof) 3556c3fac113SEmilio G. Cota { 3557c3fac113SEmilio G. 
Cota tcg_profile_snapshot(prof, false, true); 3558c3fac113SEmilio G. Cota } 3559c3fac113SEmilio G. Cota 3560c3fac113SEmilio G. Cota void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3561c3fac113SEmilio G. Cota { 3562c3fac113SEmilio G. Cota TCGProfile prof = {}; 3563c3fac113SEmilio G. Cota int i; 3564c3fac113SEmilio G. Cota 3565c3fac113SEmilio G. Cota tcg_profile_snapshot_table(&prof); 3566c3fac113SEmilio G. Cota for (i = 0; i < NB_OPS; i++) { 3567246ae24dSMax Filippov cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, 3568c3fac113SEmilio G. Cota prof.table_op_count[i]); 3569c896fe29Sbellard } 3570c896fe29Sbellard } 357172fd2efbSEmilio G. Cota 357272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 357372fd2efbSEmilio G. Cota { 357472fd2efbSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 357572fd2efbSEmilio G. Cota unsigned int i; 357672fd2efbSEmilio G. Cota int64_t ret = 0; 357772fd2efbSEmilio G. Cota 357872fd2efbSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 357972fd2efbSEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 358072fd2efbSEmilio G. Cota const TCGProfile *prof = &s->prof; 358172fd2efbSEmilio G. Cota 358272fd2efbSEmilio G. Cota ret += atomic_read(&prof->cpu_exec_time); 358372fd2efbSEmilio G. Cota } 358472fd2efbSEmilio G. Cota return ret; 358572fd2efbSEmilio G. Cota } 3586246ae24dSMax Filippov #else 3587246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3588246ae24dSMax Filippov { 3589246ae24dSMax Filippov cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3590246ae24dSMax Filippov } 359172fd2efbSEmilio G. Cota 359272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 359372fd2efbSEmilio G. Cota { 359472fd2efbSEmilio G. Cota error_report("%s: TCG profiler not compiled", __func__); 359572fd2efbSEmilio G. Cota exit(EXIT_FAILURE); 359672fd2efbSEmilio G. 
Cota } 3597c896fe29Sbellard #endif 3598c896fe29Sbellard 3599c896fe29Sbellard 36005bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb) 3601c896fe29Sbellard { 3602c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER 3603c3fac113SEmilio G. Cota TCGProfile *prof = &s->prof; 3604c3fac113SEmilio G. Cota #endif 360515fa08f8SRichard Henderson int i, num_insns; 360615fa08f8SRichard Henderson TCGOp *op; 3607c896fe29Sbellard 360804fe6400SRichard Henderson #ifdef CONFIG_PROFILER 360904fe6400SRichard Henderson { 3610c1f543b7SEmilio G. Cota int n = 0; 361104fe6400SRichard Henderson 361215fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 361315fa08f8SRichard Henderson n++; 361415fa08f8SRichard Henderson } 3615c3fac113SEmilio G. Cota atomic_set(&prof->op_count, prof->op_count + n); 3616c3fac113SEmilio G. Cota if (n > prof->op_count_max) { 3617c3fac113SEmilio G. Cota atomic_set(&prof->op_count_max, n); 361804fe6400SRichard Henderson } 361904fe6400SRichard Henderson 362004fe6400SRichard Henderson n = s->nb_temps; 3621c3fac113SEmilio G. Cota atomic_set(&prof->temp_count, prof->temp_count + n); 3622c3fac113SEmilio G. Cota if (n > prof->temp_count_max) { 3623c3fac113SEmilio G. Cota atomic_set(&prof->temp_count_max, n); 362404fe6400SRichard Henderson } 362504fe6400SRichard Henderson } 362604fe6400SRichard Henderson #endif 362704fe6400SRichard Henderson 3628c896fe29Sbellard #ifdef DEBUG_DISAS 3629d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 3630d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 36311ee73216SRichard Henderson qemu_log_lock(); 363293fcfe39Saliguori qemu_log("OP:\n"); 3633eeacee4dSBlue Swirl tcg_dump_ops(s); 363493fcfe39Saliguori qemu_log("\n"); 36351ee73216SRichard Henderson qemu_log_unlock(); 3636c896fe29Sbellard } 3637c896fe29Sbellard #endif 3638c896fe29Sbellard 3639c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 3640c3fac113SEmilio G. 
Cota atomic_set(&prof->opt_time, prof->opt_time - profile_getclock()); 3641c5cc28ffSAurelien Jarno #endif 3642c5cc28ffSAurelien Jarno 36438f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 3644c45cb8bbSRichard Henderson tcg_optimize(s); 36458f2e8c07SKirill Batuzov #endif 36468f2e8c07SKirill Batuzov 3647a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3648c3fac113SEmilio G. Cota atomic_set(&prof->opt_time, prof->opt_time + profile_getclock()); 3649c3fac113SEmilio G. Cota atomic_set(&prof->la_time, prof->la_time - profile_getclock()); 3650a23a9ec6Sbellard #endif 3651c5cc28ffSAurelien Jarno 3652b4fc67c7SRichard Henderson reachable_code_pass(s); 3653b83eabeaSRichard Henderson liveness_pass_1(s); 36545a18407fSRichard Henderson 36555a18407fSRichard Henderson if (s->nb_indirects > 0) { 36565a18407fSRichard Henderson #ifdef DEBUG_DISAS 36575a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 36585a18407fSRichard Henderson && qemu_log_in_addr_range(tb->pc))) { 36591ee73216SRichard Henderson qemu_log_lock(); 36605a18407fSRichard Henderson qemu_log("OP before indirect lowering:\n"); 36615a18407fSRichard Henderson tcg_dump_ops(s); 36625a18407fSRichard Henderson qemu_log("\n"); 36631ee73216SRichard Henderson qemu_log_unlock(); 36645a18407fSRichard Henderson } 36655a18407fSRichard Henderson #endif 36665a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 3667b83eabeaSRichard Henderson if (liveness_pass_2(s)) { 36685a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 3669b83eabeaSRichard Henderson liveness_pass_1(s); 36705a18407fSRichard Henderson } 36715a18407fSRichard Henderson } 3672c5cc28ffSAurelien Jarno 3673a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3674c3fac113SEmilio G. 
Cota atomic_set(&prof->la_time, prof->la_time + profile_getclock()); 3675a23a9ec6Sbellard #endif 3676c896fe29Sbellard 3677c896fe29Sbellard #ifdef DEBUG_DISAS 3678d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 3679d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 36801ee73216SRichard Henderson qemu_log_lock(); 3681c5cc28ffSAurelien Jarno qemu_log("OP after optimization and liveness analysis:\n"); 3682eeacee4dSBlue Swirl tcg_dump_ops(s); 368393fcfe39Saliguori qemu_log("\n"); 36841ee73216SRichard Henderson qemu_log_unlock(); 3685c896fe29Sbellard } 3686c896fe29Sbellard #endif 3687c896fe29Sbellard 3688c896fe29Sbellard tcg_reg_alloc_start(s); 3689c896fe29Sbellard 3690e7e168f4SEmilio G. Cota s->code_buf = tb->tc.ptr; 3691e7e168f4SEmilio G. Cota s->code_ptr = tb->tc.ptr; 3692c896fe29Sbellard 3693659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 36946001f772SLaurent Vivier QSIMPLEQ_INIT(&s->ldst_labels); 3695659ef5cbSRichard Henderson #endif 369657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 369757a26946SRichard Henderson s->pool_labels = NULL; 369857a26946SRichard Henderson #endif 36999ecefc84SRichard Henderson 3700fca8a500SRichard Henderson num_insns = -1; 370115fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 3702c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 3703b3db8758Sblueswir1 3704c896fe29Sbellard #ifdef CONFIG_PROFILER 3705c3fac113SEmilio G. 
Cota atomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1); 3706c896fe29Sbellard #endif 3707c45cb8bbSRichard Henderson 3708c896fe29Sbellard switch (opc) { 3709c896fe29Sbellard case INDEX_op_mov_i32: 3710c896fe29Sbellard case INDEX_op_mov_i64: 3711d2fd745fSRichard Henderson case INDEX_op_mov_vec: 3712dd186292SRichard Henderson tcg_reg_alloc_mov(s, op); 3713c896fe29Sbellard break; 3714e8996ee0Sbellard case INDEX_op_movi_i32: 3715e8996ee0Sbellard case INDEX_op_movi_i64: 3716d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 3717dd186292SRichard Henderson tcg_reg_alloc_movi(s, op); 3718e8996ee0Sbellard break; 3719765b842aSRichard Henderson case INDEX_op_insn_start: 3720fca8a500SRichard Henderson if (num_insns >= 0) { 37219f754620SRichard Henderson size_t off = tcg_current_code_size(s); 37229f754620SRichard Henderson s->gen_insn_end_off[num_insns] = off; 37239f754620SRichard Henderson /* Assert that we do not overflow our stored offset. */ 37249f754620SRichard Henderson assert(s->gen_insn_end_off[num_insns] == off); 3725fca8a500SRichard Henderson } 3726fca8a500SRichard Henderson num_insns++; 3727bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 3728bad729e2SRichard Henderson target_ulong a; 3729bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 3730efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 3731bad729e2SRichard Henderson #else 3732efee3746SRichard Henderson a = op->args[i]; 3733bad729e2SRichard Henderson #endif 3734fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 3735bad729e2SRichard Henderson } 3736c896fe29Sbellard break; 37375ff9d6a4Sbellard case INDEX_op_discard: 373843439139SRichard Henderson temp_dead(s, arg_temp(op->args[0])); 37395ff9d6a4Sbellard break; 3740c896fe29Sbellard case INDEX_op_set_label: 3741e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 3742efee3746SRichard Henderson tcg_out_label(s, arg_label(op->args[0]), s->code_ptr); 
3743c896fe29Sbellard break; 3744c896fe29Sbellard case INDEX_op_call: 3745dd186292SRichard Henderson tcg_reg_alloc_call(s, op); 3746c45cb8bbSRichard Henderson break; 3747c896fe29Sbellard default: 374825c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. */ 3749be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 3750c896fe29Sbellard /* Note: in order to speed up the code, it would be much 3751c896fe29Sbellard faster to have specialized register allocator functions for 3752c896fe29Sbellard some common argument patterns */ 3753dd186292SRichard Henderson tcg_reg_alloc_op(s, op); 3754c896fe29Sbellard break; 3755c896fe29Sbellard } 37568d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 3757c896fe29Sbellard check_regs(s); 3758c896fe29Sbellard #endif 3759b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. The assumption is that any 3760b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 3761b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 3762b125f9dcSRichard Henderson generating code without having to check during generation. 
*/ 3763644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 3764b125f9dcSRichard Henderson return -1; 3765b125f9dcSRichard Henderson } 3766c896fe29Sbellard } 3767fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 3768fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 3769c45cb8bbSRichard Henderson 3770b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 3771659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 3772659ef5cbSRichard Henderson if (!tcg_out_ldst_finalize(s)) { 377323dceda6SRichard Henderson return -1; 377423dceda6SRichard Henderson } 3775659ef5cbSRichard Henderson #endif 377657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 377757a26946SRichard Henderson if (!tcg_out_pool_finalize(s)) { 377857a26946SRichard Henderson return -1; 377957a26946SRichard Henderson } 378057a26946SRichard Henderson #endif 3781c896fe29Sbellard 3782c896fe29Sbellard /* flush instruction cache */ 37831813e175SRichard Henderson flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr); 37842aeabc08SStefan Weil 37851813e175SRichard Henderson return tcg_current_code_size(s); 3786c896fe29Sbellard } 3787c896fe29Sbellard 3788a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3789405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3790a23a9ec6Sbellard { 3791c3fac113SEmilio G. Cota TCGProfile prof = {}; 3792c3fac113SEmilio G. Cota const TCGProfile *s; 3793c3fac113SEmilio G. Cota int64_t tb_count; 3794c3fac113SEmilio G. Cota int64_t tb_div_count; 3795c3fac113SEmilio G. Cota int64_t tot; 3796c3fac113SEmilio G. Cota 3797c3fac113SEmilio G. Cota tcg_profile_snapshot_counters(&prof); 3798c3fac113SEmilio G. Cota s = &prof; 3799c3fac113SEmilio G. Cota tb_count = s->tb_count; 3800c3fac113SEmilio G. Cota tb_div_count = tb_count ? tb_count : 1; 3801c3fac113SEmilio G. 
Cota tot = s->interm_time + s->code_time; 3802a23a9ec6Sbellard 3803a23a9ec6Sbellard cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n", 3804a23a9ec6Sbellard tot, tot / 2.4e9); 3805a23a9ec6Sbellard cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n", 3806fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 3807fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 3808fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 3809a23a9ec6Sbellard cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n", 3810fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 3811a23a9ec6Sbellard cpu_fprintf(f, "deleted ops/TB %0.2f\n", 3812fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 3813a23a9ec6Sbellard cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n", 3814fca8a500SRichard Henderson (double)s->temp_count / tb_div_count, s->temp_count_max); 3815fca8a500SRichard Henderson cpu_fprintf(f, "avg host code/TB %0.1f\n", 3816fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 3817fca8a500SRichard Henderson cpu_fprintf(f, "avg search data/TB %0.1f\n", 3818fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 3819a23a9ec6Sbellard 3820a23a9ec6Sbellard cpu_fprintf(f, "cycles/op %0.1f\n", 3821a23a9ec6Sbellard s->op_count ? (double)tot / s->op_count : 0); 3822a23a9ec6Sbellard cpu_fprintf(f, "cycles/in byte %0.1f\n", 3823a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 3824a23a9ec6Sbellard cpu_fprintf(f, "cycles/out byte %0.1f\n", 3825a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 3826fca8a500SRichard Henderson cpu_fprintf(f, "cycles/search byte %0.1f\n", 3827fca8a500SRichard Henderson s->search_out_len ? 
(double)tot / s->search_out_len : 0); 3828fca8a500SRichard Henderson if (tot == 0) { 3829a23a9ec6Sbellard tot = 1; 3830fca8a500SRichard Henderson } 3831a23a9ec6Sbellard cpu_fprintf(f, " gen_interm time %0.1f%%\n", 3832a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 3833a23a9ec6Sbellard cpu_fprintf(f, " gen_code time %0.1f%%\n", 3834a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 3835c5cc28ffSAurelien Jarno cpu_fprintf(f, "optim./code time %0.1f%%\n", 3836c5cc28ffSAurelien Jarno (double)s->opt_time / (s->code_time ? s->code_time : 1) 3837c5cc28ffSAurelien Jarno * 100.0); 3838a23a9ec6Sbellard cpu_fprintf(f, "liveness/code time %0.1f%%\n", 3839a23a9ec6Sbellard (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0); 3840a23a9ec6Sbellard cpu_fprintf(f, "cpu_restore count %" PRId64 "\n", 3841a23a9ec6Sbellard s->restore_count); 3842a23a9ec6Sbellard cpu_fprintf(f, " avg cycles %0.1f\n", 3843a23a9ec6Sbellard s->restore_count ? (double)s->restore_time / s->restore_count : 0); 3844a23a9ec6Sbellard } 3845a23a9ec6Sbellard #else 3846405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3847a23a9ec6Sbellard { 384824bf7b3aSbellard cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3849a23a9ec6Sbellard } 3850a23a9ec6Sbellard #endif 3851813da627SRichard Henderson 3852813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 38535872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 38545872bbf2SRichard Henderson 38555872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 38565872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 38575872bbf2SRichard Henderson 38585872bbf2SRichard Henderson (2) Define tcg_register_jit. This should create a buffer containing 38595872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 38605872bbf2SRichard Henderson prologue unwind info for the tcg machine. 
38615872bbf2SRichard Henderson 38625872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 38635872bbf2SRichard Henderson */ 3864813da627SRichard Henderson 3865813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */ 3866813da627SRichard Henderson typedef enum { 3867813da627SRichard Henderson JIT_NOACTION = 0, 3868813da627SRichard Henderson JIT_REGISTER_FN, 3869813da627SRichard Henderson JIT_UNREGISTER_FN 3870813da627SRichard Henderson } jit_actions_t; 3871813da627SRichard Henderson 3872813da627SRichard Henderson struct jit_code_entry { 3873813da627SRichard Henderson struct jit_code_entry *next_entry; 3874813da627SRichard Henderson struct jit_code_entry *prev_entry; 3875813da627SRichard Henderson const void *symfile_addr; 3876813da627SRichard Henderson uint64_t symfile_size; 3877813da627SRichard Henderson }; 3878813da627SRichard Henderson 3879813da627SRichard Henderson struct jit_descriptor { 3880813da627SRichard Henderson uint32_t version; 3881813da627SRichard Henderson uint32_t action_flag; 3882813da627SRichard Henderson struct jit_code_entry *relevant_entry; 3883813da627SRichard Henderson struct jit_code_entry *first_entry; 3884813da627SRichard Henderson }; 3885813da627SRichard Henderson 3886813da627SRichard Henderson void __jit_debug_register_code(void) __attribute__((noinline)); 3887813da627SRichard Henderson void __jit_debug_register_code(void) 3888813da627SRichard Henderson { 3889813da627SRichard Henderson asm(""); 3890813da627SRichard Henderson } 3891813da627SRichard Henderson 3892813da627SRichard Henderson /* Must statically initialize the version, because GDB may check 3893813da627SRichard Henderson the version before we can set it. */ 3894813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 }; 3895813da627SRichard Henderson 3896813da627SRichard Henderson /* End GDB interface. 
*/ 3897813da627SRichard Henderson 3898813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 3899813da627SRichard Henderson { 3900813da627SRichard Henderson const char *p = strtab + 1; 3901813da627SRichard Henderson 3902813da627SRichard Henderson while (1) { 3903813da627SRichard Henderson if (strcmp(p, str) == 0) { 3904813da627SRichard Henderson return p - strtab; 3905813da627SRichard Henderson } 3906813da627SRichard Henderson p += strlen(p) + 1; 3907813da627SRichard Henderson } 3908813da627SRichard Henderson } 3909813da627SRichard Henderson 39105872bbf2SRichard Henderson static void tcg_register_jit_int(void *buf_ptr, size_t buf_size, 39112c90784aSRichard Henderson const void *debug_frame, 39122c90784aSRichard Henderson size_t debug_frame_size) 3913813da627SRichard Henderson { 39145872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 39155872bbf2SRichard Henderson uint32_t len; 39165872bbf2SRichard Henderson uint16_t version; 39175872bbf2SRichard Henderson uint32_t abbrev; 39185872bbf2SRichard Henderson uint8_t ptr_size; 39195872bbf2SRichard Henderson uint8_t cu_die; 39205872bbf2SRichard Henderson uint16_t cu_lang; 39215872bbf2SRichard Henderson uintptr_t cu_low_pc; 39225872bbf2SRichard Henderson uintptr_t cu_high_pc; 39235872bbf2SRichard Henderson uint8_t fn_die; 39245872bbf2SRichard Henderson char fn_name[16]; 39255872bbf2SRichard Henderson uintptr_t fn_low_pc; 39265872bbf2SRichard Henderson uintptr_t fn_high_pc; 39275872bbf2SRichard Henderson uint8_t cu_eoc; 39285872bbf2SRichard Henderson }; 3929813da627SRichard Henderson 3930813da627SRichard Henderson struct ElfImage { 3931813da627SRichard Henderson ElfW(Ehdr) ehdr; 3932813da627SRichard Henderson ElfW(Phdr) phdr; 39335872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 39345872bbf2SRichard Henderson ElfW(Sym) sym[2]; 39355872bbf2SRichard Henderson struct DebugInfo di; 39365872bbf2SRichard Henderson uint8_t da[24]; 39375872bbf2SRichard Henderson char str[80]; 
39385872bbf2SRichard Henderson }; 39395872bbf2SRichard Henderson 39405872bbf2SRichard Henderson struct ElfImage *img; 39415872bbf2SRichard Henderson 39425872bbf2SRichard Henderson static const struct ElfImage img_template = { 39435872bbf2SRichard Henderson .ehdr = { 39445872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 39455872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 39465872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 39475872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 39485872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 39495872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 39505872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 39515872bbf2SRichard Henderson .e_type = ET_EXEC, 39525872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 39535872bbf2SRichard Henderson .e_version = EV_CURRENT, 39545872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 39555872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 39565872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 39575872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 39585872bbf2SRichard Henderson .e_phnum = 1, 39595872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 39605872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 39615872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 3962abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 3963abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 3964abbb3eaeSRichard Henderson #endif 3965abbb3eaeSRichard Henderson #ifdef ELF_OSABI 3966abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 3967abbb3eaeSRichard Henderson #endif 39685872bbf2SRichard Henderson }, 39695872bbf2SRichard Henderson .phdr = { 39705872bbf2SRichard Henderson .p_type = PT_LOAD, 39715872bbf2SRichard Henderson .p_flags = PF_X, 39725872bbf2SRichard Henderson }, 39735872bbf2SRichard Henderson .shdr = { 39745872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 
39755872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 39765872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 39775872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 39785872bbf2SRichard Henderson will not look for contents. We can record any address. */ 39795872bbf2SRichard Henderson [1] = { /* .text */ 39805872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 39815872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 39825872bbf2SRichard Henderson }, 39835872bbf2SRichard Henderson [2] = { /* .debug_info */ 39845872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 39855872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 39865872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 39875872bbf2SRichard Henderson }, 39885872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 39895872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 39905872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 39915872bbf2SRichard Henderson .sh_size = sizeof(img->da), 39925872bbf2SRichard Henderson }, 39935872bbf2SRichard Henderson [4] = { /* .debug_frame */ 39945872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 39955872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 39965872bbf2SRichard Henderson }, 39975872bbf2SRichard Henderson [5] = { /* .symtab */ 39985872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 39995872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 40005872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 40015872bbf2SRichard Henderson .sh_info = 1, 40025872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 40035872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 40045872bbf2SRichard Henderson }, 40055872bbf2SRichard Henderson [6] = { /* .strtab */ 40065872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 40075872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, 
str), 40085872bbf2SRichard Henderson .sh_size = sizeof(img->str), 40095872bbf2SRichard Henderson } 40105872bbf2SRichard Henderson }, 40115872bbf2SRichard Henderson .sym = { 40125872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 40135872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 40145872bbf2SRichard Henderson .st_shndx = 1, 40155872bbf2SRichard Henderson } 40165872bbf2SRichard Henderson }, 40175872bbf2SRichard Henderson .di = { 40185872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 40195872bbf2SRichard Henderson .version = 2, 40205872bbf2SRichard Henderson .ptr_size = sizeof(void *), 40215872bbf2SRichard Henderson .cu_die = 1, 40225872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 40235872bbf2SRichard Henderson .fn_die = 2, 40245872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 40255872bbf2SRichard Henderson }, 40265872bbf2SRichard Henderson .da = { 40275872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 40285872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 40295872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 40305872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 40315872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 40325872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 40335872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 40345872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 40355872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 40365872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 40375872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 40385872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 40395872bbf2SRichard Henderson 0 /* no more abbrev */ 40405872bbf2SRichard Henderson }, 40415872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 40425872bbf2SRichard Henderson 
".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 4043813da627SRichard Henderson }; 4044813da627SRichard Henderson 4045813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 4046813da627SRichard Henderson static struct jit_code_entry one_entry; 4047813da627SRichard Henderson 40485872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 4049813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 40502c90784aSRichard Henderson DebugFrameHeader *dfh; 4051813da627SRichard Henderson 40525872bbf2SRichard Henderson img = g_malloc(img_size); 40535872bbf2SRichard Henderson *img = img_template; 4054813da627SRichard Henderson 40555872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 40565872bbf2SRichard Henderson img->phdr.p_paddr = buf; 40575872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 4058813da627SRichard Henderson 40595872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 40605872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 40615872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 4062813da627SRichard Henderson 40635872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 40645872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 40655872bbf2SRichard Henderson 40665872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 40675872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 40685872bbf2SRichard Henderson 40695872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 40705872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 40715872bbf2SRichard Henderson 40725872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 40735872bbf2SRichard Henderson img->sym[1].st_value = buf; 40745872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 
40755872bbf2SRichard Henderson 40765872bbf2SRichard Henderson img->di.cu_low_pc = buf; 407745aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 40785872bbf2SRichard Henderson img->di.fn_low_pc = buf; 407945aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 4080813da627SRichard Henderson 40812c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 40822c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 40832c90784aSRichard Henderson dfh->fde.func_start = buf; 40842c90784aSRichard Henderson dfh->fde.func_len = buf_size; 40852c90784aSRichard Henderson 4086813da627SRichard Henderson #ifdef DEBUG_JIT 4087813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 4088813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 4089813da627SRichard Henderson { 4090813da627SRichard Henderson FILE *f = fopen("/tmp/qemu.jit", "w+b"); 4091813da627SRichard Henderson if (f) { 40925872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 4093813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. */ 4094813da627SRichard Henderson } 4095813da627SRichard Henderson fclose(f); 4096813da627SRichard Henderson } 4097813da627SRichard Henderson } 4098813da627SRichard Henderson #endif 4099813da627SRichard Henderson 4100813da627SRichard Henderson one_entry.symfile_addr = img; 4101813da627SRichard Henderson one_entry.symfile_size = img_size; 4102813da627SRichard Henderson 4103813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 4104813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 4105813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 4106813da627SRichard Henderson __jit_debug_register_code(); 4107813da627SRichard Henderson } 4108813da627SRichard Henderson #else 41095872bbf2SRichard Henderson /* No support for the feature. 
Provide the entry point expected by exec.c, 41105872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 4111813da627SRichard Henderson 4112813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 41132c90784aSRichard Henderson const void *debug_frame, 41142c90784aSRichard Henderson size_t debug_frame_size) 4115813da627SRichard Henderson { 4116813da627SRichard Henderson } 4117813da627SRichard Henderson 4118813da627SRichard Henderson void tcg_register_jit(void *buf, size_t buf_size) 4119813da627SRichard Henderson { 4120813da627SRichard Henderson } 4121813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 4122db432672SRichard Henderson 4123db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec 4124db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...) 4125db432672SRichard Henderson { 4126db432672SRichard Henderson g_assert_not_reached(); 4127db432672SRichard Henderson } 4128db432672SRichard Henderson #endif 4129