1c896fe29Sbellard /* 2c896fe29Sbellard * Tiny Code Generator for QEMU 3c896fe29Sbellard * 4c896fe29Sbellard * Copyright (c) 2008 Fabrice Bellard 5c896fe29Sbellard * 6c896fe29Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7c896fe29Sbellard * of this software and associated documentation files (the "Software"), to deal 8c896fe29Sbellard * in the Software without restriction, including without limitation the rights 9c896fe29Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10c896fe29Sbellard * copies of the Software, and to permit persons to whom the Software is 11c896fe29Sbellard * furnished to do so, subject to the following conditions: 12c896fe29Sbellard * 13c896fe29Sbellard * The above copyright notice and this permission notice shall be included in 14c896fe29Sbellard * all copies or substantial portions of the Software. 15c896fe29Sbellard * 16c896fe29Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17c896fe29Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18c896fe29Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19c896fe29Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20c896fe29Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21c896fe29Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22c896fe29Sbellard * THE SOFTWARE. 23c896fe29Sbellard */ 24c896fe29Sbellard 25c896fe29Sbellard /* define it to use liveness analysis (better code) */ 268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS 27c896fe29Sbellard 28757e725bSPeter Maydell #include "qemu/osdep.h" 29cca82982Saurel32 30813da627SRichard Henderson /* Define to dump the ELF file used to communicate with GDB. */ 31813da627SRichard Henderson #undef DEBUG_JIT 32813da627SRichard Henderson 3372fd2efbSEmilio G.
Cota #include "qemu/error-report.h" 34f348b6d1SVeronia Bahaa #include "qemu/cutils.h" 351de7afc9SPaolo Bonzini #include "qemu/host-utils.h" 361de7afc9SPaolo Bonzini #include "qemu/timer.h" 37c896fe29Sbellard 38c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU 39c896fe29Sbellard CPU definitions. Currently they are used for qemu_ld/st 40c896fe29Sbellard instructions */ 41c896fe29Sbellard #define NO_CPU_IO_DEFS 42c896fe29Sbellard #include "cpu.h" 43c896fe29Sbellard 4463c91552SPaolo Bonzini #include "exec/cpu-common.h" 4563c91552SPaolo Bonzini #include "exec/exec-all.h" 4663c91552SPaolo Bonzini 47c896fe29Sbellard #include "tcg-op.h" 48813da627SRichard Henderson 49edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX 50813da627SRichard Henderson # define ELF_CLASS ELFCLASS32 51edee2579SRichard Henderson #else 52edee2579SRichard Henderson # define ELF_CLASS ELFCLASS64 53813da627SRichard Henderson #endif 54813da627SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 55813da627SRichard Henderson # define ELF_DATA ELFDATA2MSB 56813da627SRichard Henderson #else 57813da627SRichard Henderson # define ELF_DATA ELFDATA2LSB 58813da627SRichard Henderson #endif 59813da627SRichard Henderson 60c896fe29Sbellard #include "elf.h" 61508127e2SPaolo Bonzini #include "exec/log.h" 623468b59eSEmilio G. Cota #include "sysemu/sysemu.h" 63c896fe29Sbellard 64ce151109SPeter Maydell /* Forward declarations for functions declared in tcg-target.inc.c and 65ce151109SPeter Maydell used here. 
*/ 66e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s); 67f69d277eSRichard Henderson static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode); 68e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s); 696ac17786SRichard Henderson static bool patch_reloc(tcg_insn_unit *code_ptr, int type, 702ba7fae2SRichard Henderson intptr_t value, intptr_t addend); 71c896fe29Sbellard 72497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts. */ 73497a22ebSRichard Henderson typedef struct { 74497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 75497a22ebSRichard Henderson uint32_t id; 76497a22ebSRichard Henderson uint8_t version; 77497a22ebSRichard Henderson char augmentation[1]; 78497a22ebSRichard Henderson uint8_t code_align; 79497a22ebSRichard Henderson uint8_t data_align; 80497a22ebSRichard Henderson uint8_t return_column; 81497a22ebSRichard Henderson } DebugFrameCIE; 82497a22ebSRichard Henderson 83497a22ebSRichard Henderson typedef struct QEMU_PACKED { 84497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 85497a22ebSRichard Henderson uint32_t cie_offset; 86edee2579SRichard Henderson uintptr_t func_start; 87edee2579SRichard Henderson uintptr_t func_len; 88497a22ebSRichard Henderson } DebugFrameFDEHeader; 89497a22ebSRichard Henderson 902c90784aSRichard Henderson typedef struct QEMU_PACKED { 912c90784aSRichard Henderson DebugFrameCIE cie; 922c90784aSRichard Henderson DebugFrameFDEHeader fde; 932c90784aSRichard Henderson } DebugFrameHeader; 942c90784aSRichard Henderson 95813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 962c90784aSRichard Henderson const void *debug_frame, 972c90784aSRichard Henderson size_t debug_frame_size) 98813da627SRichard Henderson __attribute__((unused)); 99813da627SRichard Henderson 100ce151109SPeter Maydell /* Forward declarations for functions declared and used in 
tcg-target.inc.c. */ 101069ea736SRichard Henderson static const char *target_parse_constraint(TCGArgConstraint *ct, 102069ea736SRichard Henderson const char *ct_str, TCGType type); 1032a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1, 104a05b5b9bSRichard Henderson intptr_t arg2); 1052a534affSRichard Henderson static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg); 106c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type, 1072a534affSRichard Henderson TCGReg ret, tcg_target_long arg); 108c0ad3001SStefan Weil static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args, 109c0ad3001SStefan Weil const int *const_args); 110d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec 111d2fd745fSRichard Henderson static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl, 112d2fd745fSRichard Henderson unsigned vece, const TCGArg *args, 113d2fd745fSRichard Henderson const int *const_args); 114d2fd745fSRichard Henderson #else 115d2fd745fSRichard Henderson static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl, 116d2fd745fSRichard Henderson unsigned vece, const TCGArg *args, 117d2fd745fSRichard Henderson const int *const_args) 118d2fd745fSRichard Henderson { 119d2fd745fSRichard Henderson g_assert_not_reached(); 120d2fd745fSRichard Henderson } 121d2fd745fSRichard Henderson #endif 1222a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, 123a05b5b9bSRichard Henderson intptr_t arg2); 12459d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val, 12559d7c14eSRichard Henderson TCGReg base, intptr_t ofs); 126cf066674SRichard Henderson static void tcg_out_call(TCGContext *s, tcg_insn_unit *target); 127f6c6afc1SRichard Henderson static int tcg_target_const_match(tcg_target_long val, TCGType type, 128c0ad3001SStefan Weil const TCGArgConstraint *arg_ct); 129659ef5cbSRichard 
Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 130659ef5cbSRichard Henderson static bool tcg_out_ldst_finalize(TCGContext *s); 131659ef5cbSRichard Henderson #endif 132c896fe29Sbellard 133a505785cSEmilio G. Cota #define TCG_HIGHWATER 1024 134a505785cSEmilio G. Cota 135df2cce29SEmilio G. Cota static TCGContext **tcg_ctxs; 136df2cce29SEmilio G. Cota static unsigned int n_tcg_ctxs; 1371c2adb95SRichard Henderson TCGv_env cpu_env = 0; 138df2cce29SEmilio G. Cota 139be2cdc5eSEmilio G. Cota struct tcg_region_tree { 140be2cdc5eSEmilio G. Cota QemuMutex lock; 141be2cdc5eSEmilio G. Cota GTree *tree; 142be2cdc5eSEmilio G. Cota /* padding to avoid false sharing is computed at run-time */ 143be2cdc5eSEmilio G. Cota }; 144be2cdc5eSEmilio G. Cota 145e8feb96fSEmilio G. Cota /* 146e8feb96fSEmilio G. Cota * We divide code_gen_buffer into equally-sized "regions" that TCG threads 147e8feb96fSEmilio G. Cota * dynamically allocate from as demand dictates. Given appropriate region 148e8feb96fSEmilio G. Cota * sizing, this minimizes flushes even when some TCG threads generate a lot 149e8feb96fSEmilio G. Cota * more code than others. 150e8feb96fSEmilio G. Cota */ 151e8feb96fSEmilio G. Cota struct tcg_region_state { 152e8feb96fSEmilio G. Cota QemuMutex lock; 153e8feb96fSEmilio G. Cota 154e8feb96fSEmilio G. Cota /* fields set at init time */ 155e8feb96fSEmilio G. Cota void *start; 156e8feb96fSEmilio G. Cota void *start_aligned; 157e8feb96fSEmilio G. Cota void *end; 158e8feb96fSEmilio G. Cota size_t n; 159e8feb96fSEmilio G. Cota size_t size; /* size of one region */ 160e8feb96fSEmilio G. Cota size_t stride; /* .size + guard size */ 161e8feb96fSEmilio G. Cota 162e8feb96fSEmilio G. Cota /* fields protected by the lock */ 163e8feb96fSEmilio G. Cota size_t current; /* current region index */ 164e8feb96fSEmilio G. Cota size_t agg_size_full; /* aggregate size of full regions */ 165e8feb96fSEmilio G. Cota }; 166e8feb96fSEmilio G. Cota 167e8feb96fSEmilio G. 
Cota static struct tcg_region_state region; 168be2cdc5eSEmilio G. Cota /* 169be2cdc5eSEmilio G. Cota * This is an array of struct tcg_region_tree's, with padding. 170be2cdc5eSEmilio G. Cota * We use void * to simplify the computation of region_trees[i]; each 171be2cdc5eSEmilio G. Cota * struct is found every tree_size bytes. 172be2cdc5eSEmilio G. Cota */ 173be2cdc5eSEmilio G. Cota static void *region_trees; 174be2cdc5eSEmilio G. Cota static size_t tree_size; 175d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT]; 176b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 177c896fe29Sbellard 1781813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1794196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 180c896fe29Sbellard { 181c896fe29Sbellard *s->code_ptr++ = v; 182c896fe29Sbellard } 183c896fe29Sbellard 1844196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1854196dca6SPeter Maydell uint8_t v) 1865c53bb81SPeter Maydell { 1871813e175SRichard Henderson *p = v; 1885c53bb81SPeter Maydell } 1891813e175SRichard Henderson #endif 1905c53bb81SPeter Maydell 1911813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1924196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 193c896fe29Sbellard { 1941813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1951813e175SRichard Henderson *s->code_ptr++ = v; 1961813e175SRichard Henderson } else { 1971813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1984387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1991813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 2001813e175SRichard Henderson } 201c896fe29Sbellard } 202c896fe29Sbellard 2034196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 2044196dca6SPeter Maydell uint16_t v) 2055c53bb81SPeter Maydell { 
2061813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 2071813e175SRichard Henderson *p = v; 2081813e175SRichard Henderson } else { 2095c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2105c53bb81SPeter Maydell } 2111813e175SRichard Henderson } 2121813e175SRichard Henderson #endif 2135c53bb81SPeter Maydell 2141813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 2154196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 216c896fe29Sbellard { 2171813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2181813e175SRichard Henderson *s->code_ptr++ = v; 2191813e175SRichard Henderson } else { 2201813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2214387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2221813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 2231813e175SRichard Henderson } 224c896fe29Sbellard } 225c896fe29Sbellard 2264196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 2274196dca6SPeter Maydell uint32_t v) 2285c53bb81SPeter Maydell { 2291813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2301813e175SRichard Henderson *p = v; 2311813e175SRichard Henderson } else { 2325c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2335c53bb81SPeter Maydell } 2341813e175SRichard Henderson } 2351813e175SRichard Henderson #endif 2365c53bb81SPeter Maydell 2371813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 2384196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 239ac26eb69SRichard Henderson { 2401813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2411813e175SRichard Henderson *s->code_ptr++ = v; 2421813e175SRichard Henderson } else { 2431813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2444387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2451813e175SRichard Henderson s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE); 2461813e175SRichard 
Henderson } 247ac26eb69SRichard Henderson } 248ac26eb69SRichard Henderson 2494196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 2504196dca6SPeter Maydell uint64_t v) 2515c53bb81SPeter Maydell { 2521813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2531813e175SRichard Henderson *p = v; 2541813e175SRichard Henderson } else { 2555c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2565c53bb81SPeter Maydell } 2571813e175SRichard Henderson } 2581813e175SRichard Henderson #endif 2595c53bb81SPeter Maydell 260c896fe29Sbellard /* label relocation processing */ 261c896fe29Sbellard 2621813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 263bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 264c896fe29Sbellard { 265c896fe29Sbellard TCGRelocation *r; 266c896fe29Sbellard 267c896fe29Sbellard if (l->has_value) { 268623e265cSpbrook /* FIXME: This may break relocations on RISC targets that 269623e265cSpbrook modify instruction fields in place. The caller may not have 270623e265cSpbrook written the initial value. 
*/ 2716ac17786SRichard Henderson bool ok = patch_reloc(code_ptr, type, l->u.value, addend); 2726ac17786SRichard Henderson tcg_debug_assert(ok); 273c896fe29Sbellard } else { 274c896fe29Sbellard /* add a new relocation entry */ 275c896fe29Sbellard r = tcg_malloc(sizeof(TCGRelocation)); 276c896fe29Sbellard r->type = type; 277c896fe29Sbellard r->ptr = code_ptr; 278c896fe29Sbellard r->addend = addend; 279c896fe29Sbellard r->next = l->u.first_reloc; 280c896fe29Sbellard l->u.first_reloc = r; 281c896fe29Sbellard } 282c896fe29Sbellard } 283c896fe29Sbellard 284bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr) 285c896fe29Sbellard { 2862ba7fae2SRichard Henderson intptr_t value = (intptr_t)ptr; 2871813e175SRichard Henderson TCGRelocation *r; 288c896fe29Sbellard 289eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 2901813e175SRichard Henderson 2911813e175SRichard Henderson for (r = l->u.first_reloc; r != NULL; r = r->next) { 2926ac17786SRichard Henderson bool ok = patch_reloc(r->ptr, r->type, value, r->addend); 2936ac17786SRichard Henderson tcg_debug_assert(ok); 294c896fe29Sbellard } 2951813e175SRichard Henderson 296c896fe29Sbellard l->has_value = 1; 2971813e175SRichard Henderson l->u.value_ptr = ptr; 298c896fe29Sbellard } 299c896fe29Sbellard 30042a268c2SRichard Henderson TCGLabel *gen_new_label(void) 301c896fe29Sbellard { 302b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 30351e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 304c896fe29Sbellard 30551e3972cSRichard Henderson *l = (TCGLabel){ 30651e3972cSRichard Henderson .id = s->nb_labels++ 30751e3972cSRichard Henderson }; 30842a268c2SRichard Henderson 30942a268c2SRichard Henderson return l; 310c896fe29Sbellard } 311c896fe29Sbellard 3129f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which) 3139f754620SRichard Henderson { 3149f754620SRichard Henderson size_t off = tcg_current_code_size(s); 3159f754620SRichard Henderson s->tb_jmp_reset_offset[which] = off; 3169f754620SRichard Henderson /* Make sure that we didn't overflow the stored offset. */ 3179f754620SRichard Henderson assert(s->tb_jmp_reset_offset[which] == off); 3189f754620SRichard Henderson } 3199f754620SRichard Henderson 320ce151109SPeter Maydell #include "tcg-target.inc.c" 321c896fe29Sbellard 322be2cdc5eSEmilio G. Cota /* compare a pointer @ptr and a tb_tc @s */ 323be2cdc5eSEmilio G. Cota static int ptr_cmp_tb_tc(const void *ptr, const struct tb_tc *s) 324be2cdc5eSEmilio G. Cota { 325be2cdc5eSEmilio G. Cota if (ptr >= s->ptr + s->size) { 326be2cdc5eSEmilio G. Cota return 1; 327be2cdc5eSEmilio G. Cota } else if (ptr < s->ptr) { 328be2cdc5eSEmilio G. Cota return -1; 329be2cdc5eSEmilio G. Cota } 330be2cdc5eSEmilio G. Cota return 0; 331be2cdc5eSEmilio G. Cota } 332be2cdc5eSEmilio G. Cota 333be2cdc5eSEmilio G. Cota static gint tb_tc_cmp(gconstpointer ap, gconstpointer bp) 334be2cdc5eSEmilio G. Cota { 335be2cdc5eSEmilio G. Cota const struct tb_tc *a = ap; 336be2cdc5eSEmilio G. Cota const struct tb_tc *b = bp; 337be2cdc5eSEmilio G. Cota 338be2cdc5eSEmilio G. Cota /* 339be2cdc5eSEmilio G. Cota * When both sizes are set, we know this isn't a lookup. 340be2cdc5eSEmilio G. Cota * This is the most likely case: every TB must be inserted; lookups 341be2cdc5eSEmilio G. Cota * are a lot less frequent. 342be2cdc5eSEmilio G. Cota */ 343be2cdc5eSEmilio G. 
Cota if (likely(a->size && b->size)) { 344be2cdc5eSEmilio G. Cota if (a->ptr > b->ptr) { 345be2cdc5eSEmilio G. Cota return 1; 346be2cdc5eSEmilio G. Cota } else if (a->ptr < b->ptr) { 347be2cdc5eSEmilio G. Cota return -1; 348be2cdc5eSEmilio G. Cota } 349be2cdc5eSEmilio G. Cota /* a->ptr == b->ptr should happen only on deletions */ 350be2cdc5eSEmilio G. Cota g_assert(a->size == b->size); 351be2cdc5eSEmilio G. Cota return 0; 352be2cdc5eSEmilio G. Cota } 353be2cdc5eSEmilio G. Cota /* 354be2cdc5eSEmilio G. Cota * All lookups have either .size field set to 0. 355be2cdc5eSEmilio G. Cota * From the glib sources we see that @ap is always the lookup key. However 356be2cdc5eSEmilio G. Cota * the docs provide no guarantee, so we just mark this case as likely. 357be2cdc5eSEmilio G. Cota */ 358be2cdc5eSEmilio G. Cota if (likely(a->size == 0)) { 359be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(a->ptr, b); 360be2cdc5eSEmilio G. Cota } 361be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(b->ptr, a); 362be2cdc5eSEmilio G. Cota } 363be2cdc5eSEmilio G. Cota 364be2cdc5eSEmilio G. Cota static void tcg_region_trees_init(void) 365be2cdc5eSEmilio G. Cota { 366be2cdc5eSEmilio G. Cota size_t i; 367be2cdc5eSEmilio G. Cota 368be2cdc5eSEmilio G. Cota tree_size = ROUND_UP(sizeof(struct tcg_region_tree), qemu_dcache_linesize); 369be2cdc5eSEmilio G. Cota region_trees = qemu_memalign(qemu_dcache_linesize, region.n * tree_size); 370be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 371be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 372be2cdc5eSEmilio G. Cota 373be2cdc5eSEmilio G. Cota qemu_mutex_init(&rt->lock); 374be2cdc5eSEmilio G. Cota rt->tree = g_tree_new(tb_tc_cmp); 375be2cdc5eSEmilio G. Cota } 376be2cdc5eSEmilio G. Cota } 377be2cdc5eSEmilio G. Cota 378be2cdc5eSEmilio G. Cota static struct tcg_region_tree *tc_ptr_to_region_tree(void *p) 379be2cdc5eSEmilio G. Cota { 380be2cdc5eSEmilio G. Cota size_t region_idx; 381be2cdc5eSEmilio G. Cota 382be2cdc5eSEmilio G. 
Cota if (p < region.start_aligned) { 383be2cdc5eSEmilio G. Cota region_idx = 0; 384be2cdc5eSEmilio G. Cota } else { 385be2cdc5eSEmilio G. Cota ptrdiff_t offset = p - region.start_aligned; 386be2cdc5eSEmilio G. Cota 387be2cdc5eSEmilio G. Cota if (offset > region.stride * (region.n - 1)) { 388be2cdc5eSEmilio G. Cota region_idx = region.n - 1; 389be2cdc5eSEmilio G. Cota } else { 390be2cdc5eSEmilio G. Cota region_idx = offset / region.stride; 391be2cdc5eSEmilio G. Cota } 392be2cdc5eSEmilio G. Cota } 393be2cdc5eSEmilio G. Cota return region_trees + region_idx * tree_size; 394be2cdc5eSEmilio G. Cota } 395be2cdc5eSEmilio G. Cota 396be2cdc5eSEmilio G. Cota void tcg_tb_insert(TranslationBlock *tb) 397be2cdc5eSEmilio G. Cota { 398be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 399be2cdc5eSEmilio G. Cota 400be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 401be2cdc5eSEmilio G. Cota g_tree_insert(rt->tree, &tb->tc, tb); 402be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 403be2cdc5eSEmilio G. Cota } 404be2cdc5eSEmilio G. Cota 405be2cdc5eSEmilio G. Cota void tcg_tb_remove(TranslationBlock *tb) 406be2cdc5eSEmilio G. Cota { 407be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 408be2cdc5eSEmilio G. Cota 409be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 410be2cdc5eSEmilio G. Cota g_tree_remove(rt->tree, &tb->tc); 411be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 412be2cdc5eSEmilio G. Cota } 413be2cdc5eSEmilio G. Cota 414be2cdc5eSEmilio G. Cota /* 415be2cdc5eSEmilio G. Cota * Find the TB 'tb' such that 416be2cdc5eSEmilio G. Cota * tb->tc.ptr <= tc_ptr < tb->tc.ptr + tb->tc.size 417be2cdc5eSEmilio G. Cota * Return NULL if not found. 418be2cdc5eSEmilio G. Cota */ 419be2cdc5eSEmilio G. Cota TranslationBlock *tcg_tb_lookup(uintptr_t tc_ptr) 420be2cdc5eSEmilio G. Cota { 421be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree((void *)tc_ptr); 422be2cdc5eSEmilio G. 
Cota TranslationBlock *tb; 423be2cdc5eSEmilio G. Cota struct tb_tc s = { .ptr = (void *)tc_ptr }; 424be2cdc5eSEmilio G. Cota 425be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 426be2cdc5eSEmilio G. Cota tb = g_tree_lookup(rt->tree, &s); 427be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 428be2cdc5eSEmilio G. Cota return tb; 429be2cdc5eSEmilio G. Cota } 430be2cdc5eSEmilio G. Cota 431be2cdc5eSEmilio G. Cota static void tcg_region_tree_lock_all(void) 432be2cdc5eSEmilio G. Cota { 433be2cdc5eSEmilio G. Cota size_t i; 434be2cdc5eSEmilio G. Cota 435be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 436be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 437be2cdc5eSEmilio G. Cota 438be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 439be2cdc5eSEmilio G. Cota } 440be2cdc5eSEmilio G. Cota } 441be2cdc5eSEmilio G. Cota 442be2cdc5eSEmilio G. Cota static void tcg_region_tree_unlock_all(void) 443be2cdc5eSEmilio G. Cota { 444be2cdc5eSEmilio G. Cota size_t i; 445be2cdc5eSEmilio G. Cota 446be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 447be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 448be2cdc5eSEmilio G. Cota 449be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 450be2cdc5eSEmilio G. Cota } 451be2cdc5eSEmilio G. Cota } 452be2cdc5eSEmilio G. Cota 453be2cdc5eSEmilio G. Cota void tcg_tb_foreach(GTraverseFunc func, gpointer user_data) 454be2cdc5eSEmilio G. Cota { 455be2cdc5eSEmilio G. Cota size_t i; 456be2cdc5eSEmilio G. Cota 457be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 458be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 459be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 460be2cdc5eSEmilio G. Cota 461be2cdc5eSEmilio G. Cota g_tree_foreach(rt->tree, func, user_data); 462be2cdc5eSEmilio G. Cota } 463be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 464be2cdc5eSEmilio G. Cota } 465be2cdc5eSEmilio G. Cota 466be2cdc5eSEmilio G. 
Cota size_t tcg_nb_tbs(void) 467be2cdc5eSEmilio G. Cota { 468be2cdc5eSEmilio G. Cota size_t nb_tbs = 0; 469be2cdc5eSEmilio G. Cota size_t i; 470be2cdc5eSEmilio G. Cota 471be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 472be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 473be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 474be2cdc5eSEmilio G. Cota 475be2cdc5eSEmilio G. Cota nb_tbs += g_tree_nnodes(rt->tree); 476be2cdc5eSEmilio G. Cota } 477be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 478be2cdc5eSEmilio G. Cota return nb_tbs; 479be2cdc5eSEmilio G. Cota } 480be2cdc5eSEmilio G. Cota 481be2cdc5eSEmilio G. Cota static void tcg_region_tree_reset_all(void) 482be2cdc5eSEmilio G. Cota { 483be2cdc5eSEmilio G. Cota size_t i; 484be2cdc5eSEmilio G. Cota 485be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 486be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 487be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 488be2cdc5eSEmilio G. Cota 489be2cdc5eSEmilio G. Cota /* Increment the refcount first so that destroy acts as a reset */ 490be2cdc5eSEmilio G. Cota g_tree_ref(rt->tree); 491be2cdc5eSEmilio G. Cota g_tree_destroy(rt->tree); 492be2cdc5eSEmilio G. Cota } 493be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 494be2cdc5eSEmilio G. Cota } 495be2cdc5eSEmilio G. Cota 496e8feb96fSEmilio G. Cota static void tcg_region_bounds(size_t curr_region, void **pstart, void **pend) 497e8feb96fSEmilio G. Cota { 498e8feb96fSEmilio G. Cota void *start, *end; 499e8feb96fSEmilio G. Cota 500e8feb96fSEmilio G. Cota start = region.start_aligned + curr_region * region.stride; 501e8feb96fSEmilio G. Cota end = start + region.size; 502e8feb96fSEmilio G. Cota 503e8feb96fSEmilio G. Cota if (curr_region == 0) { 504e8feb96fSEmilio G. Cota start = region.start; 505e8feb96fSEmilio G. Cota } 506e8feb96fSEmilio G. Cota if (curr_region == region.n - 1) { 507e8feb96fSEmilio G. 
Cota end = region.end; 508e8feb96fSEmilio G. Cota } 509e8feb96fSEmilio G. Cota 510e8feb96fSEmilio G. Cota *pstart = start; 511e8feb96fSEmilio G. Cota *pend = end; 512e8feb96fSEmilio G. Cota } 513e8feb96fSEmilio G. Cota 514e8feb96fSEmilio G. Cota static void tcg_region_assign(TCGContext *s, size_t curr_region) 515e8feb96fSEmilio G. Cota { 516e8feb96fSEmilio G. Cota void *start, *end; 517e8feb96fSEmilio G. Cota 518e8feb96fSEmilio G. Cota tcg_region_bounds(curr_region, &start, &end); 519e8feb96fSEmilio G. Cota 520e8feb96fSEmilio G. Cota s->code_gen_buffer = start; 521e8feb96fSEmilio G. Cota s->code_gen_ptr = start; 522e8feb96fSEmilio G. Cota s->code_gen_buffer_size = end - start; 523e8feb96fSEmilio G. Cota s->code_gen_highwater = end - TCG_HIGHWATER; 524e8feb96fSEmilio G. Cota } 525e8feb96fSEmilio G. Cota 526e8feb96fSEmilio G. Cota static bool tcg_region_alloc__locked(TCGContext *s) 527e8feb96fSEmilio G. Cota { 528e8feb96fSEmilio G. Cota if (region.current == region.n) { 529e8feb96fSEmilio G. Cota return true; 530e8feb96fSEmilio G. Cota } 531e8feb96fSEmilio G. Cota tcg_region_assign(s, region.current); 532e8feb96fSEmilio G. Cota region.current++; 533e8feb96fSEmilio G. Cota return false; 534e8feb96fSEmilio G. Cota } 535e8feb96fSEmilio G. Cota 536e8feb96fSEmilio G. Cota /* 537e8feb96fSEmilio G. Cota * Request a new region once the one in use has filled up. 538e8feb96fSEmilio G. Cota * Returns true on error. 539e8feb96fSEmilio G. Cota */ 540e8feb96fSEmilio G. Cota static bool tcg_region_alloc(TCGContext *s) 541e8feb96fSEmilio G. Cota { 542e8feb96fSEmilio G. Cota bool err; 543e8feb96fSEmilio G. Cota /* read the region size now; alloc__locked will overwrite it on success */ 544e8feb96fSEmilio G. Cota size_t size_full = s->code_gen_buffer_size; 545e8feb96fSEmilio G. Cota 546e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 547e8feb96fSEmilio G. Cota err = tcg_region_alloc__locked(s); 548e8feb96fSEmilio G. Cota if (!err) { 549e8feb96fSEmilio G. 
Cota region.agg_size_full += size_full - TCG_HIGHWATER; 550e8feb96fSEmilio G. Cota } 551e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 552e8feb96fSEmilio G. Cota return err; 553e8feb96fSEmilio G. Cota } 554e8feb96fSEmilio G. Cota 555e8feb96fSEmilio G. Cota /* 556e8feb96fSEmilio G. Cota * Perform a context's first region allocation. 557e8feb96fSEmilio G. Cota * This function does _not_ increment region.agg_size_full. 558e8feb96fSEmilio G. Cota */ 559e8feb96fSEmilio G. Cota static inline bool tcg_region_initial_alloc__locked(TCGContext *s) 560e8feb96fSEmilio G. Cota { 561e8feb96fSEmilio G. Cota return tcg_region_alloc__locked(s); 562e8feb96fSEmilio G. Cota } 563e8feb96fSEmilio G. Cota 564e8feb96fSEmilio G. Cota /* Call from a safe-work context */ 565e8feb96fSEmilio G. Cota void tcg_region_reset_all(void) 566e8feb96fSEmilio G. Cota { 5673468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 568e8feb96fSEmilio G. Cota unsigned int i; 569e8feb96fSEmilio G. Cota 570e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 571e8feb96fSEmilio G. Cota region.current = 0; 572e8feb96fSEmilio G. Cota region.agg_size_full = 0; 573e8feb96fSEmilio G. Cota 5743468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 5753468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 5763468b59eSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(s); 577e8feb96fSEmilio G. Cota 578e8feb96fSEmilio G. Cota g_assert(!err); 579e8feb96fSEmilio G. Cota } 580e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 581be2cdc5eSEmilio G. Cota 582be2cdc5eSEmilio G. Cota tcg_region_tree_reset_all(); 583e8feb96fSEmilio G. Cota } 584e8feb96fSEmilio G. Cota 5853468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 5863468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5873468b59eSEmilio G. Cota { 5883468b59eSEmilio G. Cota return 1; 5893468b59eSEmilio G. Cota } 5903468b59eSEmilio G. Cota #else 5913468b59eSEmilio G. Cota /* 5923468b59eSEmilio G. 
Cota * It is likely that some vCPUs will translate more code than others, so we 5933468b59eSEmilio G. Cota * first try to set more regions than max_cpus, with those regions being of 5943468b59eSEmilio G. Cota * reasonable size. If that's not possible we make do by evenly dividing 5953468b59eSEmilio G. Cota * the code_gen_buffer among the vCPUs. 5963468b59eSEmilio G. Cota */ 5973468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5983468b59eSEmilio G. Cota { 5993468b59eSEmilio G. Cota size_t i; 6003468b59eSEmilio G. Cota 6013468b59eSEmilio G. Cota /* Use a single region if all we have is one vCPU thread */ 6023468b59eSEmilio G. Cota if (max_cpus == 1 || !qemu_tcg_mttcg_enabled()) { 6033468b59eSEmilio G. Cota return 1; 6043468b59eSEmilio G. Cota } 6053468b59eSEmilio G. Cota 6063468b59eSEmilio G. Cota /* Try to have more regions than max_cpus, with each region being >= 2 MB */ 6073468b59eSEmilio G. Cota for (i = 8; i > 0; i--) { 6083468b59eSEmilio G. Cota size_t regions_per_thread = i; 6093468b59eSEmilio G. Cota size_t region_size; 6103468b59eSEmilio G. Cota 6113468b59eSEmilio G. Cota region_size = tcg_init_ctx.code_gen_buffer_size; 6123468b59eSEmilio G. Cota region_size /= max_cpus * regions_per_thread; 6133468b59eSEmilio G. Cota 6143468b59eSEmilio G. Cota if (region_size >= 2 * 1024u * 1024) { 6153468b59eSEmilio G. Cota return max_cpus * regions_per_thread; 6163468b59eSEmilio G. Cota } 6173468b59eSEmilio G. Cota } 6183468b59eSEmilio G. Cota /* If we can't, then just allocate one region per vCPU thread */ 6193468b59eSEmilio G. Cota return max_cpus; 6203468b59eSEmilio G. Cota } 6213468b59eSEmilio G. Cota #endif 6223468b59eSEmilio G. Cota 623e8feb96fSEmilio G. Cota /* 624e8feb96fSEmilio G. Cota * Initializes region partitioning. 625e8feb96fSEmilio G. Cota * 626e8feb96fSEmilio G. Cota * Called at init time from the parent thread (i.e. the one calling 627e8feb96fSEmilio G. Cota * tcg_context_init), after the target's TCG globals have been set. 6283468b59eSEmilio G. 
Cota * 6293468b59eSEmilio G. Cota * Region partitioning works by splitting code_gen_buffer into separate regions, 6303468b59eSEmilio G. Cota * and then assigning regions to TCG threads so that the threads can translate 6313468b59eSEmilio G. Cota * code in parallel without synchronization. 6323468b59eSEmilio G. Cota * 6333468b59eSEmilio G. Cota * In softmmu the number of TCG threads is bounded by max_cpus, so we use at 6343468b59eSEmilio G. Cota * least max_cpus regions in MTTCG. In !MTTCG we use a single region. 6353468b59eSEmilio G. Cota * Note that the TCG options from the command-line (i.e. -accel accel=tcg,[...]) 6363468b59eSEmilio G. Cota * must have been parsed before calling this function, since it calls 6373468b59eSEmilio G. Cota * qemu_tcg_mttcg_enabled(). 6383468b59eSEmilio G. Cota * 6393468b59eSEmilio G. Cota * In user-mode we use a single region. Having multiple regions in user-mode 6403468b59eSEmilio G. Cota * is not supported, because the number of vCPU threads (recall that each thread 6413468b59eSEmilio G. Cota * spawned by the guest corresponds to a vCPU thread) is only bounded by the 6423468b59eSEmilio G. Cota * OS, and usually this number is huge (tens of thousands is not uncommon). 6433468b59eSEmilio G. Cota * Thus, given this large bound on the number of vCPU threads and the fact 6443468b59eSEmilio G. Cota * that code_gen_buffer is allocated at compile-time, we cannot guarantee 6453468b59eSEmilio G. Cota * that the availability of at least one region per vCPU thread. 6463468b59eSEmilio G. Cota * 6473468b59eSEmilio G. Cota * However, this user-mode limitation is unlikely to be a significant problem 6483468b59eSEmilio G. Cota * in practice. Multi-threaded guests share most if not all of their translated 6493468b59eSEmilio G. Cota * code, which makes parallel code generation less appealing than in softmmu. 650e8feb96fSEmilio G. Cota */ 651e8feb96fSEmilio G. Cota void tcg_region_init(void) 652e8feb96fSEmilio G. Cota { 653e8feb96fSEmilio G. 
Cota void *buf = tcg_init_ctx.code_gen_buffer; 654e8feb96fSEmilio G. Cota void *aligned; 655e8feb96fSEmilio G. Cota size_t size = tcg_init_ctx.code_gen_buffer_size; 656e8feb96fSEmilio G. Cota size_t page_size = qemu_real_host_page_size; 657e8feb96fSEmilio G. Cota size_t region_size; 658e8feb96fSEmilio G. Cota size_t n_regions; 659e8feb96fSEmilio G. Cota size_t i; 660e8feb96fSEmilio G. Cota 6613468b59eSEmilio G. Cota n_regions = tcg_n_regions(); 662e8feb96fSEmilio G. Cota 663e8feb96fSEmilio G. Cota /* The first region will be 'aligned - buf' bytes larger than the others */ 664e8feb96fSEmilio G. Cota aligned = QEMU_ALIGN_PTR_UP(buf, page_size); 665e8feb96fSEmilio G. Cota g_assert(aligned < tcg_init_ctx.code_gen_buffer + size); 666e8feb96fSEmilio G. Cota /* 667e8feb96fSEmilio G. Cota * Make region_size a multiple of page_size, using aligned as the start. 668e8feb96fSEmilio G. Cota * As a result of this we might end up with a few extra pages at the end of 669e8feb96fSEmilio G. Cota * the buffer; we will assign those to the last region. 670e8feb96fSEmilio G. Cota */ 671e8feb96fSEmilio G. Cota region_size = (size - (aligned - buf)) / n_regions; 672e8feb96fSEmilio G. Cota region_size = QEMU_ALIGN_DOWN(region_size, page_size); 673e8feb96fSEmilio G. Cota 674e8feb96fSEmilio G. Cota /* A region must have at least 2 pages; one code, one guard */ 675e8feb96fSEmilio G. Cota g_assert(region_size >= 2 * page_size); 676e8feb96fSEmilio G. Cota 677e8feb96fSEmilio G. Cota /* init the region struct */ 678e8feb96fSEmilio G. Cota qemu_mutex_init(®ion.lock); 679e8feb96fSEmilio G. Cota region.n = n_regions; 680e8feb96fSEmilio G. Cota region.size = region_size - page_size; 681e8feb96fSEmilio G. Cota region.stride = region_size; 682e8feb96fSEmilio G. Cota region.start = buf; 683e8feb96fSEmilio G. Cota region.start_aligned = aligned; 684e8feb96fSEmilio G. Cota /* page-align the end, since its last page will be a guard page */ 685e8feb96fSEmilio G. 
Cota region.end = QEMU_ALIGN_PTR_DOWN(buf + size, page_size); 686e8feb96fSEmilio G. Cota /* account for that last guard page */ 687e8feb96fSEmilio G. Cota region.end -= page_size; 688e8feb96fSEmilio G. Cota 689e8feb96fSEmilio G. Cota /* set guard pages */ 690e8feb96fSEmilio G. Cota for (i = 0; i < region.n; i++) { 691e8feb96fSEmilio G. Cota void *start, *end; 692e8feb96fSEmilio G. Cota int rc; 693e8feb96fSEmilio G. Cota 694e8feb96fSEmilio G. Cota tcg_region_bounds(i, &start, &end); 695e8feb96fSEmilio G. Cota rc = qemu_mprotect_none(end, page_size); 696e8feb96fSEmilio G. Cota g_assert(!rc); 697e8feb96fSEmilio G. Cota } 698e8feb96fSEmilio G. Cota 699be2cdc5eSEmilio G. Cota tcg_region_trees_init(); 700be2cdc5eSEmilio G. Cota 7013468b59eSEmilio G. Cota /* In user-mode we support only one ctx, so do the initial allocation now */ 7023468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 703e8feb96fSEmilio G. Cota { 704e8feb96fSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(tcg_ctx); 705e8feb96fSEmilio G. Cota 706e8feb96fSEmilio G. Cota g_assert(!err); 707e8feb96fSEmilio G. Cota } 7083468b59eSEmilio G. Cota #endif 709e8feb96fSEmilio G. Cota } 710e8feb96fSEmilio G. Cota 711e8feb96fSEmilio G. Cota /* 7123468b59eSEmilio G. Cota * All TCG threads except the parent (i.e. the one that called tcg_context_init 7133468b59eSEmilio G. Cota * and registered the target's TCG globals) must register with this function 7143468b59eSEmilio G. Cota * before initiating translation. 7153468b59eSEmilio G. Cota * 7163468b59eSEmilio G. Cota * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation 7173468b59eSEmilio G. Cota * of tcg_region_init() for the reasoning behind this. 7183468b59eSEmilio G. Cota * 7193468b59eSEmilio G. Cota * In softmmu each caller registers its context in tcg_ctxs[]. Note that in 7203468b59eSEmilio G. Cota * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context 7213468b59eSEmilio G. 
Cota * is not used anymore for translation once this function is called. 7223468b59eSEmilio G. Cota * 7233468b59eSEmilio G. Cota * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates 7243468b59eSEmilio G. Cota * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode. 7253468b59eSEmilio G. Cota */ 7263468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 7273468b59eSEmilio G. Cota void tcg_register_thread(void) 7283468b59eSEmilio G. Cota { 7293468b59eSEmilio G. Cota tcg_ctx = &tcg_init_ctx; 7303468b59eSEmilio G. Cota } 7313468b59eSEmilio G. Cota #else 7323468b59eSEmilio G. Cota void tcg_register_thread(void) 7333468b59eSEmilio G. Cota { 7343468b59eSEmilio G. Cota TCGContext *s = g_malloc(sizeof(*s)); 7353468b59eSEmilio G. Cota unsigned int i, n; 7363468b59eSEmilio G. Cota bool err; 7373468b59eSEmilio G. Cota 7383468b59eSEmilio G. Cota *s = tcg_init_ctx; 7393468b59eSEmilio G. Cota 7403468b59eSEmilio G. Cota /* Relink mem_base. */ 7413468b59eSEmilio G. Cota for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) { 7423468b59eSEmilio G. Cota if (tcg_init_ctx.temps[i].mem_base) { 7433468b59eSEmilio G. Cota ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps; 7443468b59eSEmilio G. Cota tcg_debug_assert(b >= 0 && b < n); 7453468b59eSEmilio G. Cota s->temps[i].mem_base = &s->temps[b]; 7463468b59eSEmilio G. Cota } 7473468b59eSEmilio G. Cota } 7483468b59eSEmilio G. Cota 7493468b59eSEmilio G. Cota /* Claim an entry in tcg_ctxs */ 7503468b59eSEmilio G. Cota n = atomic_fetch_inc(&n_tcg_ctxs); 7513468b59eSEmilio G. Cota g_assert(n < max_cpus); 7523468b59eSEmilio G. Cota atomic_set(&tcg_ctxs[n], s); 7533468b59eSEmilio G. Cota 7543468b59eSEmilio G. Cota tcg_ctx = s; 7553468b59eSEmilio G. Cota qemu_mutex_lock(®ion.lock); 7563468b59eSEmilio G. Cota err = tcg_region_initial_alloc__locked(tcg_ctx); 7573468b59eSEmilio G. Cota g_assert(!err); 7583468b59eSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 7593468b59eSEmilio G. 
Cota } 7603468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */ 7613468b59eSEmilio G. Cota 7623468b59eSEmilio G. Cota /* 763e8feb96fSEmilio G. Cota * Returns the size (in bytes) of all translated code (i.e. from all regions) 764e8feb96fSEmilio G. Cota * currently in the cache. 765e8feb96fSEmilio G. Cota * See also: tcg_code_capacity() 766e8feb96fSEmilio G. Cota * Do not confuse with tcg_current_code_size(); that one applies to a single 767e8feb96fSEmilio G. Cota * TCG context. 768e8feb96fSEmilio G. Cota */ 769e8feb96fSEmilio G. Cota size_t tcg_code_size(void) 770e8feb96fSEmilio G. Cota { 7713468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 772e8feb96fSEmilio G. Cota unsigned int i; 773e8feb96fSEmilio G. Cota size_t total; 774e8feb96fSEmilio G. Cota 775e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 776e8feb96fSEmilio G. Cota total = region.agg_size_full; 7773468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 7783468b59eSEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 779e8feb96fSEmilio G. Cota size_t size; 780e8feb96fSEmilio G. Cota 781e8feb96fSEmilio G. Cota size = atomic_read(&s->code_gen_ptr) - s->code_gen_buffer; 782e8feb96fSEmilio G. Cota g_assert(size <= s->code_gen_buffer_size); 783e8feb96fSEmilio G. Cota total += size; 784e8feb96fSEmilio G. Cota } 785e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 786e8feb96fSEmilio G. Cota return total; 787e8feb96fSEmilio G. Cota } 788e8feb96fSEmilio G. Cota 789e8feb96fSEmilio G. Cota /* 790e8feb96fSEmilio G. Cota * Returns the code capacity (in bytes) of the entire cache, i.e. including all 791e8feb96fSEmilio G. Cota * regions. 792e8feb96fSEmilio G. Cota * See also: tcg_code_size() 793e8feb96fSEmilio G. Cota */ 794e8feb96fSEmilio G. Cota size_t tcg_code_capacity(void) 795e8feb96fSEmilio G. Cota { 796e8feb96fSEmilio G. Cota size_t guard_size, capacity; 797e8feb96fSEmilio G. Cota 798e8feb96fSEmilio G. 
Cota /* no need for synchronization; these variables are set at init time */ 799e8feb96fSEmilio G. Cota guard_size = region.stride - region.size; 800e8feb96fSEmilio G. Cota capacity = region.end + guard_size - region.start; 801e8feb96fSEmilio G. Cota capacity -= region.n * (guard_size + TCG_HIGHWATER); 802e8feb96fSEmilio G. Cota return capacity; 803e8feb96fSEmilio G. Cota } 804e8feb96fSEmilio G. Cota 805128ed227SEmilio G. Cota size_t tcg_tb_phys_invalidate_count(void) 806128ed227SEmilio G. Cota { 807128ed227SEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 808128ed227SEmilio G. Cota unsigned int i; 809128ed227SEmilio G. Cota size_t total = 0; 810128ed227SEmilio G. Cota 811128ed227SEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 812128ed227SEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 813128ed227SEmilio G. Cota 814128ed227SEmilio G. Cota total += atomic_read(&s->tb_phys_invalidate_count); 815128ed227SEmilio G. Cota } 816128ed227SEmilio G. Cota return total; 817128ed227SEmilio G. Cota } 818128ed227SEmilio G. 
Cota 819c896fe29Sbellard /* pool based memory allocation */ 820c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 821c896fe29Sbellard { 822c896fe29Sbellard TCGPool *p; 823c896fe29Sbellard int pool_size; 824c896fe29Sbellard 825c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 826c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 8277267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 828c896fe29Sbellard p->size = size; 8294055299eSKirill Batuzov p->next = s->pool_first_large; 8304055299eSKirill Batuzov s->pool_first_large = p; 8314055299eSKirill Batuzov return p->data; 832c896fe29Sbellard } else { 833c896fe29Sbellard p = s->pool_current; 834c896fe29Sbellard if (!p) { 835c896fe29Sbellard p = s->pool_first; 836c896fe29Sbellard if (!p) 837c896fe29Sbellard goto new_pool; 838c896fe29Sbellard } else { 839c896fe29Sbellard if (!p->next) { 840c896fe29Sbellard new_pool: 841c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 8427267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 843c896fe29Sbellard p->size = pool_size; 844c896fe29Sbellard p->next = NULL; 845c896fe29Sbellard if (s->pool_current) 846c896fe29Sbellard s->pool_current->next = p; 847c896fe29Sbellard else 848c896fe29Sbellard s->pool_first = p; 849c896fe29Sbellard } else { 850c896fe29Sbellard p = p->next; 851c896fe29Sbellard } 852c896fe29Sbellard } 853c896fe29Sbellard } 854c896fe29Sbellard s->pool_current = p; 855c896fe29Sbellard s->pool_cur = p->data + size; 856c896fe29Sbellard s->pool_end = p->data + p->size; 857c896fe29Sbellard return p->data; 858c896fe29Sbellard } 859c896fe29Sbellard 860c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 861c896fe29Sbellard { 8624055299eSKirill Batuzov TCGPool *p, *t; 8634055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 8644055299eSKirill Batuzov t = p->next; 8654055299eSKirill Batuzov g_free(p); 8664055299eSKirill Batuzov } 8674055299eSKirill Batuzov s->pool_first_large = NULL; 868c896fe29Sbellard 
s->pool_cur = s->pool_end = NULL; 869c896fe29Sbellard s->pool_current = NULL; 870c896fe29Sbellard } 871c896fe29Sbellard 872100b5e01SRichard Henderson typedef struct TCGHelperInfo { 873100b5e01SRichard Henderson void *func; 874100b5e01SRichard Henderson const char *name; 875afb49896SRichard Henderson unsigned flags; 876afb49896SRichard Henderson unsigned sizemask; 877100b5e01SRichard Henderson } TCGHelperInfo; 878100b5e01SRichard Henderson 8792ef6175aSRichard Henderson #include "exec/helper-proto.h" 8802ef6175aSRichard Henderson 881100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 8822ef6175aSRichard Henderson #include "exec/helper-tcg.h" 883100b5e01SRichard Henderson }; 884619205fdSEmilio G. Cota static GHashTable *helper_table; 885100b5e01SRichard Henderson 88691478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 887f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 8881c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 8891c2adb95SRichard Henderson TCGReg reg, const char *name); 89091478cefSRichard Henderson 891c896fe29Sbellard void tcg_context_init(TCGContext *s) 892c896fe29Sbellard { 893100b5e01SRichard Henderson int op, total_args, n, i; 894c896fe29Sbellard TCGOpDef *def; 895c896fe29Sbellard TCGArgConstraint *args_ct; 896c896fe29Sbellard int *sorted_args; 8971c2adb95SRichard Henderson TCGTemp *ts; 898c896fe29Sbellard 899c896fe29Sbellard memset(s, 0, sizeof(*s)); 900c896fe29Sbellard s->nb_globals = 0; 901c896fe29Sbellard 902c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 903c896fe29Sbellard space */ 904c896fe29Sbellard total_args = 0; 905c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 906c896fe29Sbellard def = &tcg_op_defs[op]; 907c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 908c896fe29Sbellard total_args += n; 909c896fe29Sbellard } 910c896fe29Sbellard 9117267c094SAnthony Liguori 
args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args); 9127267c094SAnthony Liguori sorted_args = g_malloc(sizeof(int) * total_args); 913c896fe29Sbellard 914c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 915c896fe29Sbellard def = &tcg_op_defs[op]; 916c896fe29Sbellard def->args_ct = args_ct; 917c896fe29Sbellard def->sorted_args = sorted_args; 918c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 919c896fe29Sbellard sorted_args += n; 920c896fe29Sbellard args_ct += n; 921c896fe29Sbellard } 922c896fe29Sbellard 9235cd8f621SRichard Henderson /* Register helpers. */ 92484fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 925619205fdSEmilio G. Cota helper_table = g_hash_table_new(NULL, NULL); 92684fd9dd3SRichard Henderson 927100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 92884fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 92972866e82SRichard Henderson (gpointer)&all_helpers[i]); 930100b5e01SRichard Henderson } 9315cd8f621SRichard Henderson 932c896fe29Sbellard tcg_target_init(s); 933f69d277eSRichard Henderson process_op_defs(s); 93491478cefSRichard Henderson 93591478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 93691478cefSRichard Henderson the start of tcg_target_reg_alloc_order. 
*/ 93791478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 93891478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 93991478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 94091478cefSRichard Henderson break; 94191478cefSRichard Henderson } 94291478cefSRichard Henderson } 94391478cefSRichard Henderson for (i = 0; i < n; ++i) { 94491478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 94591478cefSRichard Henderson } 94691478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 94791478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 94891478cefSRichard Henderson } 949b1311c4aSEmilio G. Cota 950b1311c4aSEmilio G. Cota tcg_ctx = s; 9513468b59eSEmilio G. Cota /* 9523468b59eSEmilio G. Cota * In user-mode we simply share the init context among threads, since we 9533468b59eSEmilio G. Cota * use a single region. See the documentation tcg_region_init() for the 9543468b59eSEmilio G. Cota * reasoning behind this. 9553468b59eSEmilio G. Cota * In softmmu we will have at most max_cpus TCG threads. 9563468b59eSEmilio G. Cota */ 9573468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 958df2cce29SEmilio G. Cota tcg_ctxs = &tcg_ctx; 959df2cce29SEmilio G. Cota n_tcg_ctxs = 1; 9603468b59eSEmilio G. Cota #else 9613468b59eSEmilio G. Cota tcg_ctxs = g_new(TCGContext *, max_cpus); 9623468b59eSEmilio G. Cota #endif 9631c2adb95SRichard Henderson 9641c2adb95SRichard Henderson tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0)); 9651c2adb95SRichard Henderson ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env"); 9661c2adb95SRichard Henderson cpu_env = temp_tcgv_ptr(ts); 9679002ec79SRichard Henderson } 968b03cce8eSbellard 9696e3b2bfdSEmilio G. Cota /* 9706e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 9716e3b2bfdSEmilio G. 
Cota * sure that TBs and code are on different cache lines. 9726e3b2bfdSEmilio G. Cota */ 9736e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 9746e3b2bfdSEmilio G. Cota { 9756e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 9766e3b2bfdSEmilio G. Cota TranslationBlock *tb; 9776e3b2bfdSEmilio G. Cota void *next; 9786e3b2bfdSEmilio G. Cota 979e8feb96fSEmilio G. Cota retry: 9806e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 9816e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 9826e3b2bfdSEmilio G. Cota 9836e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 984e8feb96fSEmilio G. Cota if (tcg_region_alloc(s)) { 9856e3b2bfdSEmilio G. Cota return NULL; 9866e3b2bfdSEmilio G. Cota } 987e8feb96fSEmilio G. Cota goto retry; 988e8feb96fSEmilio G. Cota } 989e8feb96fSEmilio G. Cota atomic_set(&s->code_gen_ptr, next); 99057a26946SRichard Henderson s->data_gen_ptr = NULL; 9916e3b2bfdSEmilio G. Cota return tb; 9926e3b2bfdSEmilio G. Cota } 9936e3b2bfdSEmilio G. Cota 9949002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 9959002ec79SRichard Henderson { 9968163b749SRichard Henderson size_t prologue_size, total_size; 9978163b749SRichard Henderson void *buf0, *buf1; 9988163b749SRichard Henderson 9998163b749SRichard Henderson /* Put the prologue at the beginning of code_gen_buffer. */ 10008163b749SRichard Henderson buf0 = s->code_gen_buffer; 10015b38ee31SRichard Henderson total_size = s->code_gen_buffer_size; 10028163b749SRichard Henderson s->code_ptr = buf0; 10038163b749SRichard Henderson s->code_buf = buf0; 10045b38ee31SRichard Henderson s->data_gen_ptr = NULL; 10058163b749SRichard Henderson s->code_gen_prologue = buf0; 10068163b749SRichard Henderson 10075b38ee31SRichard Henderson /* Compute a high-water mark, at which we voluntarily flush the buffer 10085b38ee31SRichard Henderson and start over. 
The size here is arbitrary, significantly larger 10095b38ee31SRichard Henderson than we expect the code generation for any one opcode to require. */ 10105b38ee31SRichard Henderson s->code_gen_highwater = s->code_gen_buffer + (total_size - TCG_HIGHWATER); 10115b38ee31SRichard Henderson 10125b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 10135b38ee31SRichard Henderson s->pool_labels = NULL; 10145b38ee31SRichard Henderson #endif 10155b38ee31SRichard Henderson 10168163b749SRichard Henderson /* Generate the prologue. */ 1017b03cce8eSbellard tcg_target_qemu_prologue(s); 10185b38ee31SRichard Henderson 10195b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 10205b38ee31SRichard Henderson /* Allow the prologue to put e.g. guest_base into a pool entry. */ 10215b38ee31SRichard Henderson { 10225b38ee31SRichard Henderson bool ok = tcg_out_pool_finalize(s); 10235b38ee31SRichard Henderson tcg_debug_assert(ok); 10245b38ee31SRichard Henderson } 10255b38ee31SRichard Henderson #endif 10265b38ee31SRichard Henderson 10278163b749SRichard Henderson buf1 = s->code_ptr; 10288163b749SRichard Henderson flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1); 10298163b749SRichard Henderson 10308163b749SRichard Henderson /* Deduct the prologue from the buffer. 
*/ 10318163b749SRichard Henderson prologue_size = tcg_current_code_size(s); 10328163b749SRichard Henderson s->code_gen_ptr = buf1; 10338163b749SRichard Henderson s->code_gen_buffer = buf1; 10348163b749SRichard Henderson s->code_buf = buf1; 10355b38ee31SRichard Henderson total_size -= prologue_size; 10368163b749SRichard Henderson s->code_gen_buffer_size = total_size; 10378163b749SRichard Henderson 10388163b749SRichard Henderson tcg_register_jit(s->code_gen_buffer, total_size); 1039d6b64b2bSRichard Henderson 1040d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 1041d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 10421ee73216SRichard Henderson qemu_log_lock(); 10438163b749SRichard Henderson qemu_log("PROLOGUE: [size=%zu]\n", prologue_size); 10445b38ee31SRichard Henderson if (s->data_gen_ptr) { 10455b38ee31SRichard Henderson size_t code_size = s->data_gen_ptr - buf0; 10465b38ee31SRichard Henderson size_t data_size = prologue_size - code_size; 10475b38ee31SRichard Henderson size_t i; 10485b38ee31SRichard Henderson 10495b38ee31SRichard Henderson log_disas(buf0, code_size); 10505b38ee31SRichard Henderson 10515b38ee31SRichard Henderson for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) { 10525b38ee31SRichard Henderson if (sizeof(tcg_target_ulong) == 8) { 10535b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .quad 0x%016" PRIx64 "\n", 10545b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 10555b38ee31SRichard Henderson *(uint64_t *)(s->data_gen_ptr + i)); 10565b38ee31SRichard Henderson } else { 10575b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .long 0x%08x\n", 10585b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 10595b38ee31SRichard Henderson *(uint32_t *)(s->data_gen_ptr + i)); 10605b38ee31SRichard Henderson } 10615b38ee31SRichard Henderson } 10625b38ee31SRichard Henderson } else { 10638163b749SRichard Henderson log_disas(buf0, prologue_size); 10645b38ee31SRichard Henderson } 1065d6b64b2bSRichard Henderson 
qemu_log("\n"); 1066d6b64b2bSRichard Henderson qemu_log_flush(); 10671ee73216SRichard Henderson qemu_log_unlock(); 1068d6b64b2bSRichard Henderson } 1069d6b64b2bSRichard Henderson #endif 1070cedbcb01SEmilio G. Cota 1071cedbcb01SEmilio G. Cota /* Assert that goto_ptr is implemented completely. */ 1072cedbcb01SEmilio G. Cota if (TCG_TARGET_HAS_goto_ptr) { 1073cedbcb01SEmilio G. Cota tcg_debug_assert(s->code_gen_epilogue != NULL); 1074cedbcb01SEmilio G. Cota } 1075c896fe29Sbellard } 1076c896fe29Sbellard 1077c896fe29Sbellard void tcg_func_start(TCGContext *s) 1078c896fe29Sbellard { 1079c896fe29Sbellard tcg_pool_reset(s); 1080c896fe29Sbellard s->nb_temps = s->nb_globals; 10810ec9eabcSRichard Henderson 10820ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. */ 10830ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 10840ec9eabcSRichard Henderson 1085abebf925SRichard Henderson s->nb_ops = 0; 1086c896fe29Sbellard s->nb_labels = 0; 1087c896fe29Sbellard s->current_frame_offset = s->frame_start; 1088c896fe29Sbellard 10890a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 10900a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 10910a209d4bSRichard Henderson #endif 10920a209d4bSRichard Henderson 109315fa08f8SRichard Henderson QTAILQ_INIT(&s->ops); 109415fa08f8SRichard Henderson QTAILQ_INIT(&s->free_ops); 1095c896fe29Sbellard } 1096c896fe29Sbellard 10977ca4b752SRichard Henderson static inline TCGTemp *tcg_temp_alloc(TCGContext *s) 10987ca4b752SRichard Henderson { 10997ca4b752SRichard Henderson int n = s->nb_temps++; 11007ca4b752SRichard Henderson tcg_debug_assert(n < TCG_MAX_TEMPS); 11017ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 11027ca4b752SRichard Henderson } 11037ca4b752SRichard Henderson 11047ca4b752SRichard Henderson static inline TCGTemp *tcg_global_alloc(TCGContext *s) 11057ca4b752SRichard Henderson { 1106fa477d25SRichard Henderson TCGTemp *ts; 1107fa477d25SRichard Henderson 
11087ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 11097ca4b752SRichard Henderson s->nb_globals++; 1110fa477d25SRichard Henderson ts = tcg_temp_alloc(s); 1111fa477d25SRichard Henderson ts->temp_global = 1; 1112fa477d25SRichard Henderson 1113fa477d25SRichard Henderson return ts; 1114c896fe29Sbellard } 1115c896fe29Sbellard 1116085272b3SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 1117b6638662SRichard Henderson TCGReg reg, const char *name) 1118c896fe29Sbellard { 1119c896fe29Sbellard TCGTemp *ts; 1120c896fe29Sbellard 1121b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 1122c896fe29Sbellard tcg_abort(); 1123b3a62939SRichard Henderson } 11247ca4b752SRichard Henderson 11257ca4b752SRichard Henderson ts = tcg_global_alloc(s); 1126c896fe29Sbellard ts->base_type = type; 1127c896fe29Sbellard ts->type = type; 1128c896fe29Sbellard ts->fixed_reg = 1; 1129c896fe29Sbellard ts->reg = reg; 1130c896fe29Sbellard ts->name = name; 1131c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 11327ca4b752SRichard Henderson 1133085272b3SRichard Henderson return ts; 1134a7812ae4Spbrook } 1135a7812ae4Spbrook 1136b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 1137a7812ae4Spbrook { 1138b3a62939SRichard Henderson s->frame_start = start; 1139b3a62939SRichard Henderson s->frame_end = start + size; 1140085272b3SRichard Henderson s->frame_temp 1141085272b3SRichard Henderson = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 1142b3a62939SRichard Henderson } 1143a7812ae4Spbrook 1144085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 1145e1ccc054SRichard Henderson intptr_t offset, const char *name) 1146c896fe29Sbellard { 1147b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 1148dc41aa7dSRichard Henderson TCGTemp *base_ts = tcgv_ptr_temp(base); 11497ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 1150b3915dbbSRichard Henderson int indirect_reg = 0, bigendian = 0; 11517ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 11527ca4b752SRichard Henderson bigendian = 1; 11537ca4b752SRichard Henderson #endif 1154c896fe29Sbellard 1155b3915dbbSRichard Henderson if (!base_ts->fixed_reg) { 11565a18407fSRichard Henderson /* We do not support double-indirect registers. */ 11575a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 1158b3915dbbSRichard Henderson base_ts->indirect_base = 1; 11595a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 11605a18407fSRichard Henderson ? 2 : 1); 11615a18407fSRichard Henderson indirect_reg = 1; 1162b3915dbbSRichard Henderson } 1163b3915dbbSRichard Henderson 11647ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 11657ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 1166c896fe29Sbellard char buf[64]; 11677ca4b752SRichard Henderson 11687ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 1169c896fe29Sbellard ts->type = TCG_TYPE_I32; 1170b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 1171c896fe29Sbellard ts->mem_allocated = 1; 1172b3a62939SRichard Henderson ts->mem_base = base_ts; 11737ca4b752SRichard Henderson ts->mem_offset = offset + bigendian * 4; 1174c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 1175c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 1176c896fe29Sbellard ts->name = strdup(buf); 1177c896fe29Sbellard 11787ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 11797ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 11807ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 1181b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 11827ca4b752SRichard Henderson ts2->mem_allocated = 1; 11837ca4b752SRichard Henderson 
ts2->mem_base = base_ts; 11847ca4b752SRichard Henderson ts2->mem_offset = offset + (1 - bigendian) * 4; 1185c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 1186c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 1187120c1084SRichard Henderson ts2->name = strdup(buf); 11887ca4b752SRichard Henderson } else { 1189c896fe29Sbellard ts->base_type = type; 1190c896fe29Sbellard ts->type = type; 1191b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 1192c896fe29Sbellard ts->mem_allocated = 1; 1193b3a62939SRichard Henderson ts->mem_base = base_ts; 1194c896fe29Sbellard ts->mem_offset = offset; 1195c896fe29Sbellard ts->name = name; 1196c896fe29Sbellard } 1197085272b3SRichard Henderson return ts; 1198c896fe29Sbellard } 1199c896fe29Sbellard 12005bfa8034SRichard Henderson TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local) 1201c896fe29Sbellard { 1202b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 1203c896fe29Sbellard TCGTemp *ts; 1204641d5fbeSbellard int idx, k; 1205c896fe29Sbellard 12060ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 12070ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 12080ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 12090ec9eabcSRichard Henderson /* There is already an available temp with the right type. 
*/ 12100ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 12110ec9eabcSRichard Henderson 1212e8996ee0Sbellard ts = &s->temps[idx]; 1213e8996ee0Sbellard ts->temp_allocated = 1; 12147ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 12157ca4b752SRichard Henderson tcg_debug_assert(ts->temp_local == temp_local); 1216e8996ee0Sbellard } else { 12177ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 12187ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 12197ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 12207ca4b752SRichard Henderson 1221c896fe29Sbellard ts->base_type = type; 1222c896fe29Sbellard ts->type = TCG_TYPE_I32; 1223e8996ee0Sbellard ts->temp_allocated = 1; 1224641d5fbeSbellard ts->temp_local = temp_local; 12257ca4b752SRichard Henderson 12267ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 12277ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 12287ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 12297ca4b752SRichard Henderson ts2->temp_allocated = 1; 12307ca4b752SRichard Henderson ts2->temp_local = temp_local; 12317ca4b752SRichard Henderson } else { 1232c896fe29Sbellard ts->base_type = type; 1233c896fe29Sbellard ts->type = type; 1234e8996ee0Sbellard ts->temp_allocated = 1; 1235641d5fbeSbellard ts->temp_local = temp_local; 1236c896fe29Sbellard } 1237e8996ee0Sbellard } 123827bfd83cSPeter Maydell 123927bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 124027bfd83cSPeter Maydell s->temps_in_use++; 124127bfd83cSPeter Maydell #endif 1242085272b3SRichard Henderson return ts; 1243c896fe29Sbellard } 1244c896fe29Sbellard 1245d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type) 1246d2fd745fSRichard Henderson { 1247d2fd745fSRichard Henderson TCGTemp *t; 1248d2fd745fSRichard Henderson 1249d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG 1250d2fd745fSRichard Henderson switch (type) { 1251d2fd745fSRichard Henderson case TCG_TYPE_V64: 1252d2fd745fSRichard Henderson 
assert(TCG_TARGET_HAS_v64); 1253d2fd745fSRichard Henderson break; 1254d2fd745fSRichard Henderson case TCG_TYPE_V128: 1255d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v128); 1256d2fd745fSRichard Henderson break; 1257d2fd745fSRichard Henderson case TCG_TYPE_V256: 1258d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v256); 1259d2fd745fSRichard Henderson break; 1260d2fd745fSRichard Henderson default: 1261d2fd745fSRichard Henderson g_assert_not_reached(); 1262d2fd745fSRichard Henderson } 1263d2fd745fSRichard Henderson #endif 1264d2fd745fSRichard Henderson 1265d2fd745fSRichard Henderson t = tcg_temp_new_internal(type, 0); 1266d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1267d2fd745fSRichard Henderson } 1268d2fd745fSRichard Henderson 1269d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp. */ 1270d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match) 1271d2fd745fSRichard Henderson { 1272d2fd745fSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 1273d2fd745fSRichard Henderson 1274d2fd745fSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 1275d2fd745fSRichard Henderson 1276d2fd745fSRichard Henderson t = tcg_temp_new_internal(t->base_type, 0); 1277d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1278d2fd745fSRichard Henderson } 1279d2fd745fSRichard Henderson 12805bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts) 1281c896fe29Sbellard { 1282b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 1283085272b3SRichard Henderson int k, idx; 1284c896fe29Sbellard 128527bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 128627bfd83cSPeter Maydell s->temps_in_use--; 128727bfd83cSPeter Maydell if (s->temps_in_use < 0) { 128827bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 128927bfd83cSPeter Maydell } 129027bfd83cSPeter Maydell #endif 129127bfd83cSPeter Maydell 1292085272b3SRichard Henderson tcg_debug_assert(ts->temp_global == 0); 1293eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 1294e8996ee0Sbellard ts->temp_allocated = 0; 12950ec9eabcSRichard Henderson 1296085272b3SRichard Henderson idx = temp_idx(ts); 129718d13fa2SAlexander Graf k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0); 12980ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 1299e8996ee0Sbellard } 1300e8996ee0Sbellard 1301a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 1302a7812ae4Spbrook { 1303a7812ae4Spbrook TCGv_i32 t0; 1304a7812ae4Spbrook t0 = tcg_temp_new_i32(); 1305e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 1306e8996ee0Sbellard return t0; 1307c896fe29Sbellard } 1308c896fe29Sbellard 1309a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 1310c896fe29Sbellard { 1311a7812ae4Spbrook TCGv_i64 t0; 1312a7812ae4Spbrook t0 = tcg_temp_new_i64(); 1313e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 1314e8996ee0Sbellard return t0; 1315c896fe29Sbellard } 1316c896fe29Sbellard 1317a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 1318bdffd4a9Saurel32 { 1319a7812ae4Spbrook TCGv_i32 t0; 1320a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 1321bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 1322bdffd4a9Saurel32 return t0; 1323bdffd4a9Saurel32 } 1324bdffd4a9Saurel32 1325a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 1326bdffd4a9Saurel32 { 1327a7812ae4Spbrook TCGv_i64 t0; 1328a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 1329bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 1330bdffd4a9Saurel32 return t0; 
#if defined(CONFIG_DEBUG_TCG)
/* Reset the debug counter of temporaries currently in use. */
void tcg_clear_temp_count(void)
{
    TCGContext *ctx = tcg_ctx;

    ctx->temps_in_use = 0;
}

/*
 * Return 1 if the in-use counter is non-zero, 0 otherwise.
 * A non-zero counter is cleared before returning, so the next call does
 * not immediately report the same imbalance again.
 */
int tcg_check_temp_count(void)
{
    TCGContext *ctx = tcg_ctx;

    if (!ctx->temps_in_use) {
        return 0;
    }

    ctx->temps_in_use = 0;
    return 1;
}
#endif
*/ 1356be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 1357be0f34b5SRichard Henderson { 1358d2fd745fSRichard Henderson const bool have_vec 1359d2fd745fSRichard Henderson = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256; 1360d2fd745fSRichard Henderson 1361be0f34b5SRichard Henderson switch (op) { 1362be0f34b5SRichard Henderson case INDEX_op_discard: 1363be0f34b5SRichard Henderson case INDEX_op_set_label: 1364be0f34b5SRichard Henderson case INDEX_op_call: 1365be0f34b5SRichard Henderson case INDEX_op_br: 1366be0f34b5SRichard Henderson case INDEX_op_mb: 1367be0f34b5SRichard Henderson case INDEX_op_insn_start: 1368be0f34b5SRichard Henderson case INDEX_op_exit_tb: 1369be0f34b5SRichard Henderson case INDEX_op_goto_tb: 1370be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 1371be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 1372be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 1373be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 1374be0f34b5SRichard Henderson return true; 1375be0f34b5SRichard Henderson 1376be0f34b5SRichard Henderson case INDEX_op_goto_ptr: 1377be0f34b5SRichard Henderson return TCG_TARGET_HAS_goto_ptr; 1378be0f34b5SRichard Henderson 1379be0f34b5SRichard Henderson case INDEX_op_mov_i32: 1380be0f34b5SRichard Henderson case INDEX_op_movi_i32: 1381be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 1382be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 1383be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 1384be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 1385be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 1386be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 1387be0f34b5SRichard Henderson case INDEX_op_ld_i32: 1388be0f34b5SRichard Henderson case INDEX_op_st8_i32: 1389be0f34b5SRichard Henderson case INDEX_op_st16_i32: 1390be0f34b5SRichard Henderson case INDEX_op_st_i32: 1391be0f34b5SRichard Henderson case INDEX_op_add_i32: 1392be0f34b5SRichard Henderson case INDEX_op_sub_i32: 1393be0f34b5SRichard 
Henderson case INDEX_op_mul_i32: 1394be0f34b5SRichard Henderson case INDEX_op_and_i32: 1395be0f34b5SRichard Henderson case INDEX_op_or_i32: 1396be0f34b5SRichard Henderson case INDEX_op_xor_i32: 1397be0f34b5SRichard Henderson case INDEX_op_shl_i32: 1398be0f34b5SRichard Henderson case INDEX_op_shr_i32: 1399be0f34b5SRichard Henderson case INDEX_op_sar_i32: 1400be0f34b5SRichard Henderson return true; 1401be0f34b5SRichard Henderson 1402be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 1403be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 1404be0f34b5SRichard Henderson case INDEX_op_div_i32: 1405be0f34b5SRichard Henderson case INDEX_op_divu_i32: 1406be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 1407be0f34b5SRichard Henderson case INDEX_op_rem_i32: 1408be0f34b5SRichard Henderson case INDEX_op_remu_i32: 1409be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 1410be0f34b5SRichard Henderson case INDEX_op_div2_i32: 1411be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 1412be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 1413be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 1414be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 1415be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 1416be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 1417be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 1418be0f34b5SRichard Henderson case INDEX_op_extract_i32: 1419be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 1420be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 1421be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 1422be0f34b5SRichard Henderson case INDEX_op_add2_i32: 1423be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 1424be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 1425be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 1426be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 1427be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 1428be0f34b5SRichard 
Henderson case INDEX_op_muls2_i32: 1429be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 1430be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 1431be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 1432be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 1433be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 1434be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 1435be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 1436be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 1437be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 1438be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 1439be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 1440be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 1441be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 1442be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 1443be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 1444be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 1445be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 1446be0f34b5SRichard Henderson case INDEX_op_not_i32: 1447be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 1448be0f34b5SRichard Henderson case INDEX_op_neg_i32: 1449be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 1450be0f34b5SRichard Henderson case INDEX_op_andc_i32: 1451be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 1452be0f34b5SRichard Henderson case INDEX_op_orc_i32: 1453be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 1454be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 1455be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 1456be0f34b5SRichard Henderson case INDEX_op_nand_i32: 1457be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 1458be0f34b5SRichard Henderson case INDEX_op_nor_i32: 1459be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 1460be0f34b5SRichard Henderson case INDEX_op_clz_i32: 1461be0f34b5SRichard Henderson return 
TCG_TARGET_HAS_clz_i32; 1462be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 1463be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 1464be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 1465be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 1466be0f34b5SRichard Henderson 1467be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 1468be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 1469be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 1470be0f34b5SRichard Henderson 1471be0f34b5SRichard Henderson case INDEX_op_mov_i64: 1472be0f34b5SRichard Henderson case INDEX_op_movi_i64: 1473be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 1474be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 1475be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 1476be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 1477be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 1478be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 1479be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 1480be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 1481be0f34b5SRichard Henderson case INDEX_op_ld_i64: 1482be0f34b5SRichard Henderson case INDEX_op_st8_i64: 1483be0f34b5SRichard Henderson case INDEX_op_st16_i64: 1484be0f34b5SRichard Henderson case INDEX_op_st32_i64: 1485be0f34b5SRichard Henderson case INDEX_op_st_i64: 1486be0f34b5SRichard Henderson case INDEX_op_add_i64: 1487be0f34b5SRichard Henderson case INDEX_op_sub_i64: 1488be0f34b5SRichard Henderson case INDEX_op_mul_i64: 1489be0f34b5SRichard Henderson case INDEX_op_and_i64: 1490be0f34b5SRichard Henderson case INDEX_op_or_i64: 1491be0f34b5SRichard Henderson case INDEX_op_xor_i64: 1492be0f34b5SRichard Henderson case INDEX_op_shl_i64: 1493be0f34b5SRichard Henderson case INDEX_op_shr_i64: 1494be0f34b5SRichard Henderson case INDEX_op_sar_i64: 1495be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 1496be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 1497be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 
1498be0f34b5SRichard Henderson 1499be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 1500be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 1501be0f34b5SRichard Henderson case INDEX_op_div_i64: 1502be0f34b5SRichard Henderson case INDEX_op_divu_i64: 1503be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 1504be0f34b5SRichard Henderson case INDEX_op_rem_i64: 1505be0f34b5SRichard Henderson case INDEX_op_remu_i64: 1506be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 1507be0f34b5SRichard Henderson case INDEX_op_div2_i64: 1508be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 1509be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 1510be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 1511be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 1512be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 1513be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 1514be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 1515be0f34b5SRichard Henderson case INDEX_op_extract_i64: 1516be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 1517be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 1518be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 1519be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 1520be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 1521be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 1522be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 1523be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 1524be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 1525be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 1526be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i64; 1527be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 1528be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 1529be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 1530be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 1531be0f34b5SRichard Henderson case 
INDEX_op_ext16u_i64: 1532be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 1533be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 1534be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 1535be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 1536be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 1537be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 1538be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 1539be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 1540be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 1541be0f34b5SRichard Henderson case INDEX_op_not_i64: 1542be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 1543be0f34b5SRichard Henderson case INDEX_op_neg_i64: 1544be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 1545be0f34b5SRichard Henderson case INDEX_op_andc_i64: 1546be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 1547be0f34b5SRichard Henderson case INDEX_op_orc_i64: 1548be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 1549be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 1550be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 1551be0f34b5SRichard Henderson case INDEX_op_nand_i64: 1552be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 1553be0f34b5SRichard Henderson case INDEX_op_nor_i64: 1554be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 1555be0f34b5SRichard Henderson case INDEX_op_clz_i64: 1556be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 1557be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 1558be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 1559be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 1560be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 1561be0f34b5SRichard Henderson case INDEX_op_add2_i64: 1562be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 1563be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 1564be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 
1565be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 1566be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 1567be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 1568be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 1569be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 1570be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 1571be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 1572be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 1573be0f34b5SRichard Henderson 1574d2fd745fSRichard Henderson case INDEX_op_mov_vec: 1575d2fd745fSRichard Henderson case INDEX_op_dup_vec: 1576d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 1577d2fd745fSRichard Henderson case INDEX_op_ld_vec: 1578d2fd745fSRichard Henderson case INDEX_op_st_vec: 1579d2fd745fSRichard Henderson case INDEX_op_add_vec: 1580d2fd745fSRichard Henderson case INDEX_op_sub_vec: 1581d2fd745fSRichard Henderson case INDEX_op_and_vec: 1582d2fd745fSRichard Henderson case INDEX_op_or_vec: 1583d2fd745fSRichard Henderson case INDEX_op_xor_vec: 1584212be173SRichard Henderson case INDEX_op_cmp_vec: 1585d2fd745fSRichard Henderson return have_vec; 1586d2fd745fSRichard Henderson case INDEX_op_dup2_vec: 1587d2fd745fSRichard Henderson return have_vec && TCG_TARGET_REG_BITS == 32; 1588d2fd745fSRichard Henderson case INDEX_op_not_vec: 1589d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_not_vec; 1590d2fd745fSRichard Henderson case INDEX_op_neg_vec: 1591d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_neg_vec; 1592d2fd745fSRichard Henderson case INDEX_op_andc_vec: 1593d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_andc_vec; 1594d2fd745fSRichard Henderson case INDEX_op_orc_vec: 1595d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_orc_vec; 15963774030aSRichard Henderson case INDEX_op_mul_vec: 15973774030aSRichard Henderson return have_vec && TCG_TARGET_HAS_mul_vec; 1598d0ec9796SRichard Henderson case INDEX_op_shli_vec: 
1599d0ec9796SRichard Henderson case INDEX_op_shri_vec: 1600d0ec9796SRichard Henderson case INDEX_op_sari_vec: 1601d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shi_vec; 1602d0ec9796SRichard Henderson case INDEX_op_shls_vec: 1603d0ec9796SRichard Henderson case INDEX_op_shrs_vec: 1604d0ec9796SRichard Henderson case INDEX_op_sars_vec: 1605d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shs_vec; 1606d0ec9796SRichard Henderson case INDEX_op_shlv_vec: 1607d0ec9796SRichard Henderson case INDEX_op_shrv_vec: 1608d0ec9796SRichard Henderson case INDEX_op_sarv_vec: 1609d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shv_vec; 1610d2fd745fSRichard Henderson 1611db432672SRichard Henderson default: 1612db432672SRichard Henderson tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS); 1613db432672SRichard Henderson return true; 1614be0f34b5SRichard Henderson } 1615be0f34b5SRichard Henderson } 1616be0f34b5SRichard Henderson 161739cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 161839cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 161939cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 1620ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args) 1621c896fe29Sbellard { 162275e8b9b7SRichard Henderson int i, real_args, nb_rets, pi; 1623bbb8a1b4SRichard Henderson unsigned sizemask, flags; 1624afb49896SRichard Henderson TCGHelperInfo *info; 162575e8b9b7SRichard Henderson TCGOp *op; 1626afb49896SRichard Henderson 1627619205fdSEmilio G. 
Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 1628bbb8a1b4SRichard Henderson flags = info->flags; 1629bbb8a1b4SRichard Henderson sizemask = info->sizemask; 16302bece2c8SRichard Henderson 163134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 163234b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 163334b1a49cSRichard Henderson /* We have 64-bit values in one register, but need to pass as two 163434b1a49cSRichard Henderson separate parameters. Split them. */ 163534b1a49cSRichard Henderson int orig_sizemask = sizemask; 163634b1a49cSRichard Henderson int orig_nargs = nargs; 163734b1a49cSRichard Henderson TCGv_i64 retl, reth; 1638ae8b75dcSRichard Henderson TCGTemp *split_args[MAX_OPC_PARAM]; 163934b1a49cSRichard Henderson 1640f764718dSRichard Henderson retl = NULL; 1641f764718dSRichard Henderson reth = NULL; 164234b1a49cSRichard Henderson if (sizemask != 0) { 164334b1a49cSRichard Henderson for (i = real_args = 0; i < nargs; ++i) { 164434b1a49cSRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 164534b1a49cSRichard Henderson if (is_64bit) { 1646085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 164734b1a49cSRichard Henderson TCGv_i32 h = tcg_temp_new_i32(); 164834b1a49cSRichard Henderson TCGv_i32 l = tcg_temp_new_i32(); 164934b1a49cSRichard Henderson tcg_gen_extr_i64_i32(l, h, orig); 1650ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(h); 1651ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(l); 165234b1a49cSRichard Henderson } else { 165334b1a49cSRichard Henderson split_args[real_args++] = args[i]; 165434b1a49cSRichard Henderson } 165534b1a49cSRichard Henderson } 165634b1a49cSRichard Henderson nargs = real_args; 165734b1a49cSRichard Henderson args = split_args; 165834b1a49cSRichard Henderson sizemask = 0; 165934b1a49cSRichard Henderson } 166034b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 16612bece2c8SRichard 
Henderson for (i = 0; i < nargs; ++i) { 16622bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 16632bece2c8SRichard Henderson int is_signed = sizemask & (2 << (i+1)*2); 16642bece2c8SRichard Henderson if (!is_64bit) { 16652bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 1666085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 16672bece2c8SRichard Henderson if (is_signed) { 16682bece2c8SRichard Henderson tcg_gen_ext32s_i64(temp, orig); 16692bece2c8SRichard Henderson } else { 16702bece2c8SRichard Henderson tcg_gen_ext32u_i64(temp, orig); 16712bece2c8SRichard Henderson } 1672ae8b75dcSRichard Henderson args[i] = tcgv_i64_temp(temp); 16732bece2c8SRichard Henderson } 16742bece2c8SRichard Henderson } 16752bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 16762bece2c8SRichard Henderson 167715fa08f8SRichard Henderson op = tcg_emit_op(INDEX_op_call); 167875e8b9b7SRichard Henderson 167975e8b9b7SRichard Henderson pi = 0; 1680ae8b75dcSRichard Henderson if (ret != NULL) { 168134b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 168234b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 168334b1a49cSRichard Henderson if (orig_sizemask & 1) { 168434b1a49cSRichard Henderson /* The 32-bit ABI is going to return the 64-bit value in 168534b1a49cSRichard Henderson the %o0/%o1 register pair. Prepare for this by using 168634b1a49cSRichard Henderson two return temporaries, and reassemble below. 
*/ 168734b1a49cSRichard Henderson retl = tcg_temp_new_i64(); 168834b1a49cSRichard Henderson reth = tcg_temp_new_i64(); 1689ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(reth); 1690ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(retl); 169134b1a49cSRichard Henderson nb_rets = 2; 169234b1a49cSRichard Henderson } else { 1693ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 169434b1a49cSRichard Henderson nb_rets = 1; 169534b1a49cSRichard Henderson } 169634b1a49cSRichard Henderson #else 169734b1a49cSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) { 169802eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 1699ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1700ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1701a7812ae4Spbrook #else 1702ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1703ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1704a7812ae4Spbrook #endif 1705a7812ae4Spbrook nb_rets = 2; 170634b1a49cSRichard Henderson } else { 1707ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1708a7812ae4Spbrook nb_rets = 1; 1709a7812ae4Spbrook } 171034b1a49cSRichard Henderson #endif 1711a7812ae4Spbrook } else { 1712a7812ae4Spbrook nb_rets = 0; 1713a7812ae4Spbrook } 1714cd9090aaSRichard Henderson TCGOP_CALLO(op) = nb_rets; 171575e8b9b7SRichard Henderson 1716a7812ae4Spbrook real_args = 0; 1717a7812ae4Spbrook for (i = 0; i < nargs; i++) { 17182bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 1719bbb8a1b4SRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 172039cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS 172139cf05d3Sbellard /* some targets want aligned 64 bit args */ 1722ebd486d5Smalc if (real_args & 1) { 172375e8b9b7SRichard Henderson op->args[pi++] = TCG_CALL_DUMMY_ARG; 1724ebd486d5Smalc real_args++; 172539cf05d3Sbellard } 172639cf05d3Sbellard #endif 17273f90f252SRichard Henderson /* If stack grows up, then we will be placing 
successive 17283f90f252SRichard Henderson arguments at lower addresses, which means we need to 17293f90f252SRichard Henderson reverse the order compared to how we would normally 17303f90f252SRichard Henderson treat either big or little-endian. For those arguments 17313f90f252SRichard Henderson that will wind up in registers, this still works for 17323f90f252SRichard Henderson HPPA (the only current STACK_GROWSUP target) since the 17333f90f252SRichard Henderson argument registers are *also* allocated in decreasing 17343f90f252SRichard Henderson order. If another such target is added, this logic may 17353f90f252SRichard Henderson have to get more complicated to differentiate between 17363f90f252SRichard Henderson stack arguments and register arguments. */ 173702eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP) 1738ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1739ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1740c896fe29Sbellard #else 1741ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1742ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1743c896fe29Sbellard #endif 1744a7812ae4Spbrook real_args += 2; 17452bece2c8SRichard Henderson continue; 17462bece2c8SRichard Henderson } 17472bece2c8SRichard Henderson 1748ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1749a7812ae4Spbrook real_args++; 1750c896fe29Sbellard } 175175e8b9b7SRichard Henderson op->args[pi++] = (uintptr_t)func; 175275e8b9b7SRichard Henderson op->args[pi++] = flags; 1753cd9090aaSRichard Henderson TCGOP_CALLI(op) = real_args; 1754a7812ae4Spbrook 175575e8b9b7SRichard Henderson /* Make sure the fields didn't overflow. 
*/ 1756cd9090aaSRichard Henderson tcg_debug_assert(TCGOP_CALLI(op) == real_args); 175775e8b9b7SRichard Henderson tcg_debug_assert(pi <= ARRAY_SIZE(op->args)); 17582bece2c8SRichard Henderson 175934b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 176034b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 176134b1a49cSRichard Henderson /* Free all of the parts we allocated above. */ 176234b1a49cSRichard Henderson for (i = real_args = 0; i < orig_nargs; ++i) { 176334b1a49cSRichard Henderson int is_64bit = orig_sizemask & (1 << (i+1)*2); 176434b1a49cSRichard Henderson if (is_64bit) { 1765085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 1766085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 176734b1a49cSRichard Henderson } else { 176834b1a49cSRichard Henderson real_args++; 176934b1a49cSRichard Henderson } 177034b1a49cSRichard Henderson } 177134b1a49cSRichard Henderson if (orig_sizemask & 1) { 177234b1a49cSRichard Henderson /* The 32-bit ABI returned two 32-bit pieces. Re-assemble them. 177334b1a49cSRichard Henderson Note that describing these as TCGv_i64 eliminates an unnecessary 177434b1a49cSRichard Henderson zero-extension that tcg_gen_concat_i32_i64 would create. 
*/ 1775085272b3SRichard Henderson tcg_gen_concat32_i64(temp_tcgv_i64(ret), retl, reth); 177634b1a49cSRichard Henderson tcg_temp_free_i64(retl); 177734b1a49cSRichard Henderson tcg_temp_free_i64(reth); 177834b1a49cSRichard Henderson } 177934b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 17802bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 17812bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 17822bece2c8SRichard Henderson if (!is_64bit) { 1783085272b3SRichard Henderson tcg_temp_free_internal(args[i]); 17842bece2c8SRichard Henderson } 17852bece2c8SRichard Henderson } 17862bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1787a7812ae4Spbrook } 1788c896fe29Sbellard 17898fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1790c896fe29Sbellard { 1791ac3b8891SRichard Henderson int i, n; 1792c896fe29Sbellard TCGTemp *ts; 1793ac3b8891SRichard Henderson 1794ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 1795c896fe29Sbellard ts = &s->temps[i]; 1796ac3b8891SRichard Henderson ts->val_type = (ts->fixed_reg ? TEMP_VAL_REG : TEMP_VAL_MEM); 1797c896fe29Sbellard } 1798ac3b8891SRichard Henderson for (n = s->nb_temps; i < n; i++) { 1799e8996ee0Sbellard ts = &s->temps[i]; 1800ac3b8891SRichard Henderson ts->val_type = (ts->temp_local ? 
TEMP_VAL_MEM : TEMP_VAL_DEAD); 1801e8996ee0Sbellard ts->mem_allocated = 0; 1802e8996ee0Sbellard ts->fixed_reg = 0; 1803e8996ee0Sbellard } 1804f8b2f202SRichard Henderson 1805f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1806c896fe29Sbellard } 1807c896fe29Sbellard 1808f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1809f8b2f202SRichard Henderson TCGTemp *ts) 1810c896fe29Sbellard { 18111807f4c4SRichard Henderson int idx = temp_idx(ts); 1812ac56dd48Spbrook 1813fa477d25SRichard Henderson if (ts->temp_global) { 1814ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1815f8b2f202SRichard Henderson } else if (ts->temp_local) { 1816641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1817f8b2f202SRichard Henderson } else { 1818ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1819c896fe29Sbellard } 1820c896fe29Sbellard return buf; 1821c896fe29Sbellard } 1822c896fe29Sbellard 182343439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf, 182443439139SRichard Henderson int buf_size, TCGArg arg) 1825f8b2f202SRichard Henderson { 182643439139SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg)); 1827f8b2f202SRichard Henderson } 1828f8b2f202SRichard Henderson 18296e085f72SRichard Henderson /* Find helper name. */ 18306e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val) 1831e8996ee0Sbellard { 18326e085f72SRichard Henderson const char *ret = NULL; 1833619205fdSEmilio G. Cota if (helper_table) { 1834619205fdSEmilio G. 
Cota TCGHelperInfo *info = g_hash_table_lookup(helper_table, (gpointer)val); 183572866e82SRichard Henderson if (info) { 183672866e82SRichard Henderson ret = info->name; 183772866e82SRichard Henderson } 1838e8996ee0Sbellard } 18396e085f72SRichard Henderson return ret; 18404dc81f28Sbellard } 18414dc81f28Sbellard 1842f48f3edeSblueswir1 static const char * const cond_name[] = 1843f48f3edeSblueswir1 { 18440aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 18450aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1846f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1847f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1848f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1849f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1850f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1851f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1852f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1853f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1854f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1855f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1856f48f3edeSblueswir1 }; 1857f48f3edeSblueswir1 1858f713d6adSRichard Henderson static const char * const ldst_name[] = 1859f713d6adSRichard Henderson { 1860f713d6adSRichard Henderson [MO_UB] = "ub", 1861f713d6adSRichard Henderson [MO_SB] = "sb", 1862f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1863f713d6adSRichard Henderson [MO_LESW] = "lesw", 1864f713d6adSRichard Henderson [MO_LEUL] = "leul", 1865f713d6adSRichard Henderson [MO_LESL] = "lesl", 1866f713d6adSRichard Henderson [MO_LEQ] = "leq", 1867f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1868f713d6adSRichard Henderson [MO_BESW] = "besw", 1869f713d6adSRichard Henderson [MO_BEUL] = "beul", 1870f713d6adSRichard Henderson [MO_BESL] = "besl", 1871f713d6adSRichard Henderson [MO_BEQ] = "beq", 1872f713d6adSRichard Henderson }; 1873f713d6adSRichard Henderson 18741f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 18751f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY 18761f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = 
"un+", 18771f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 18781f00b27fSSergey Sorokin #else 18791f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 18801f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 18811f00b27fSSergey Sorokin #endif 18821f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 18831f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 18841f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 18851f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 18861f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 18871f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 18881f00b27fSSergey Sorokin }; 18891f00b27fSSergey Sorokin 1890b016486eSRichard Henderson static inline bool tcg_regset_single(TCGRegSet d) 1891b016486eSRichard Henderson { 1892b016486eSRichard Henderson return (d & (d - 1)) == 0; 1893b016486eSRichard Henderson } 1894b016486eSRichard Henderson 1895b016486eSRichard Henderson static inline TCGReg tcg_regset_first(TCGRegSet d) 1896b016486eSRichard Henderson { 1897b016486eSRichard Henderson if (TCG_TARGET_NB_REGS <= 32) { 1898b016486eSRichard Henderson return ctz32(d); 1899b016486eSRichard Henderson } else { 1900b016486eSRichard Henderson return ctz64(d); 1901b016486eSRichard Henderson } 1902b016486eSRichard Henderson } 1903b016486eSRichard Henderson 19041894f69aSRichard Henderson static void tcg_dump_ops(TCGContext *s, bool have_prefs) 1905c896fe29Sbellard { 1906c896fe29Sbellard char buf[128]; 1907c45cb8bbSRichard Henderson TCGOp *op; 1908c896fe29Sbellard 190915fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 1910c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1911c45cb8bbSRichard Henderson const TCGOpDef *def; 1912c45cb8bbSRichard Henderson TCGOpcode c; 1913bdfb460eSRichard Henderson int col = 0; 1914c45cb8bbSRichard Henderson 1915c45cb8bbSRichard Henderson c = op->opc; 1916c896fe29Sbellard def = &tcg_op_defs[c]; 1917c45cb8bbSRichard Henderson 
1918765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 1919b016486eSRichard Henderson nb_oargs = 0; 192015fa08f8SRichard Henderson col += qemu_log("\n ----"); 19219aef40edSRichard Henderson 19229aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 19239aef40edSRichard Henderson target_ulong a; 19247e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 1925efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 19267e4597d7Sbellard #else 1927efee3746SRichard Henderson a = op->args[i]; 19287e4597d7Sbellard #endif 1929bdfb460eSRichard Henderson col += qemu_log(" " TARGET_FMT_lx, a); 1930eeacee4dSBlue Swirl } 19317e4597d7Sbellard } else if (c == INDEX_op_call) { 1932c896fe29Sbellard /* variable number of arguments */ 1933cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 1934cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 1935c896fe29Sbellard nb_cargs = def->nb_cargs; 1936b03cce8eSbellard 1937cf066674SRichard Henderson /* function name, flags, out args */ 1938bdfb460eSRichard Henderson col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name, 1939efee3746SRichard Henderson tcg_find_helper(s, op->args[nb_oargs + nb_iargs]), 1940efee3746SRichard Henderson op->args[nb_oargs + nb_iargs + 1], nb_oargs); 1941b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 194243439139SRichard Henderson col += qemu_log(",%s", tcg_get_arg_str(s, buf, sizeof(buf), 1943efee3746SRichard Henderson op->args[i])); 1944b03cce8eSbellard } 1945cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1946efee3746SRichard Henderson TCGArg arg = op->args[nb_oargs + i]; 1947cf066674SRichard Henderson const char *t = "<dummy>"; 1948cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 194943439139SRichard Henderson t = tcg_get_arg_str(s, buf, sizeof(buf), arg); 1950b03cce8eSbellard } 1951bdfb460eSRichard Henderson col += qemu_log(",%s", t); 1952e8996ee0Sbellard } 1953b03cce8eSbellard } else { 1954bdfb460eSRichard 
Henderson col += qemu_log(" %s ", def->name); 1955c45cb8bbSRichard Henderson 1956c896fe29Sbellard nb_oargs = def->nb_oargs; 1957c896fe29Sbellard nb_iargs = def->nb_iargs; 1958c896fe29Sbellard nb_cargs = def->nb_cargs; 1959c896fe29Sbellard 1960d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 1961d2fd745fSRichard Henderson col += qemu_log("v%d,e%d,", 64 << TCGOP_VECL(op), 1962d2fd745fSRichard Henderson 8 << TCGOP_VECE(op)); 1963d2fd745fSRichard Henderson } 1964d2fd745fSRichard Henderson 1965c896fe29Sbellard k = 0; 1966c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1967eeacee4dSBlue Swirl if (k != 0) { 1968bdfb460eSRichard Henderson col += qemu_log(","); 1969eeacee4dSBlue Swirl } 197043439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1971efee3746SRichard Henderson op->args[k++])); 1972c896fe29Sbellard } 1973c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1974eeacee4dSBlue Swirl if (k != 0) { 1975bdfb460eSRichard Henderson col += qemu_log(","); 1976eeacee4dSBlue Swirl } 197743439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1978efee3746SRichard Henderson op->args[k++])); 1979c896fe29Sbellard } 1980be210acbSRichard Henderson switch (c) { 1981be210acbSRichard Henderson case INDEX_op_brcond_i32: 1982ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1983ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1984be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1985be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1986ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1987be210acbSRichard Henderson case INDEX_op_setcond_i64: 1988ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1989212be173SRichard Henderson case INDEX_op_cmp_vec: 1990efee3746SRichard Henderson if (op->args[k] < ARRAY_SIZE(cond_name) 1991efee3746SRichard Henderson && cond_name[op->args[k]]) { 1992efee3746SRichard Henderson col += qemu_log(",%s", cond_name[op->args[k++]]); 1993eeacee4dSBlue Swirl } else 
{ 1994efee3746SRichard Henderson col += qemu_log(",$0x%" TCG_PRIlx, op->args[k++]); 1995eeacee4dSBlue Swirl } 1996f48f3edeSblueswir1 i = 1; 1997be210acbSRichard Henderson break; 1998f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1999f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 2000f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 2001f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 200259227d5dSRichard Henderson { 2003efee3746SRichard Henderson TCGMemOpIdx oi = op->args[k++]; 200459227d5dSRichard Henderson TCGMemOp op = get_memop(oi); 200559227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 200659227d5dSRichard Henderson 200759c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 2008bdfb460eSRichard Henderson col += qemu_log(",$0x%x,%u", op, ix); 200959c4b7e8SRichard Henderson } else { 20101f00b27fSSergey Sorokin const char *s_al, *s_op; 20111f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 201259c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 2013bdfb460eSRichard Henderson col += qemu_log(",%s%s,%u", s_al, s_op, ix); 2014f713d6adSRichard Henderson } 2015f713d6adSRichard Henderson i = 1; 201659227d5dSRichard Henderson } 2017f713d6adSRichard Henderson break; 2018be210acbSRichard Henderson default: 2019f48f3edeSblueswir1 i = 0; 2020be210acbSRichard Henderson break; 2021be210acbSRichard Henderson } 202251e3972cSRichard Henderson switch (c) { 202351e3972cSRichard Henderson case INDEX_op_set_label: 202451e3972cSRichard Henderson case INDEX_op_br: 202551e3972cSRichard Henderson case INDEX_op_brcond_i32: 202651e3972cSRichard Henderson case INDEX_op_brcond_i64: 202751e3972cSRichard Henderson case INDEX_op_brcond2_i32: 2028efee3746SRichard Henderson col += qemu_log("%s$L%d", k ? 
"," : "", 2029efee3746SRichard Henderson arg_label(op->args[k])->id); 203051e3972cSRichard Henderson i++, k++; 203151e3972cSRichard Henderson break; 203251e3972cSRichard Henderson default: 203351e3972cSRichard Henderson break; 2034eeacee4dSBlue Swirl } 203551e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 2036efee3746SRichard Henderson col += qemu_log("%s$0x%" TCG_PRIlx, k ? "," : "", op->args[k]); 2037bdfb460eSRichard Henderson } 2038bdfb460eSRichard Henderson } 2039bdfb460eSRichard Henderson 20401894f69aSRichard Henderson if (have_prefs || op->life) { 20411894f69aSRichard Henderson for (; col < 40; ++col) { 2042bdfb460eSRichard Henderson putc(' ', qemu_logfile); 2043bdfb460eSRichard Henderson } 20441894f69aSRichard Henderson } 20451894f69aSRichard Henderson 20461894f69aSRichard Henderson if (op->life) { 20471894f69aSRichard Henderson unsigned life = op->life; 2048bdfb460eSRichard Henderson 2049bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 2050bdfb460eSRichard Henderson qemu_log(" sync:"); 2051bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 2052bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 2053bdfb460eSRichard Henderson qemu_log(" %d", i); 2054bdfb460eSRichard Henderson } 2055bdfb460eSRichard Henderson } 2056bdfb460eSRichard Henderson } 2057bdfb460eSRichard Henderson life /= DEAD_ARG; 2058bdfb460eSRichard Henderson if (life) { 2059bdfb460eSRichard Henderson qemu_log(" dead:"); 2060bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 2061bdfb460eSRichard Henderson if (life & 1) { 2062bdfb460eSRichard Henderson qemu_log(" %d", i); 2063bdfb460eSRichard Henderson } 2064bdfb460eSRichard Henderson } 2065c896fe29Sbellard } 2066b03cce8eSbellard } 20671894f69aSRichard Henderson 20681894f69aSRichard Henderson if (have_prefs) { 20691894f69aSRichard Henderson for (i = 0; i < nb_oargs; ++i) { 20701894f69aSRichard Henderson TCGRegSet set = op->output_pref[i]; 20711894f69aSRichard Henderson 20721894f69aSRichard Henderson if (i == 0) 
{ 20731894f69aSRichard Henderson qemu_log(" pref="); 20741894f69aSRichard Henderson } else { 20751894f69aSRichard Henderson qemu_log(","); 20761894f69aSRichard Henderson } 20771894f69aSRichard Henderson if (set == 0) { 20781894f69aSRichard Henderson qemu_log("none"); 20791894f69aSRichard Henderson } else if (set == MAKE_64BIT_MASK(0, TCG_TARGET_NB_REGS)) { 20801894f69aSRichard Henderson qemu_log("all"); 20811894f69aSRichard Henderson #ifdef CONFIG_DEBUG_TCG 20821894f69aSRichard Henderson } else if (tcg_regset_single(set)) { 20831894f69aSRichard Henderson TCGReg reg = tcg_regset_first(set); 20841894f69aSRichard Henderson qemu_log("%s", tcg_target_reg_names[reg]); 20851894f69aSRichard Henderson #endif 20861894f69aSRichard Henderson } else if (TCG_TARGET_NB_REGS <= 32) { 20871894f69aSRichard Henderson qemu_log("%#x", (uint32_t)set); 20881894f69aSRichard Henderson } else { 20891894f69aSRichard Henderson qemu_log("%#" PRIx64, (uint64_t)set); 20901894f69aSRichard Henderson } 20911894f69aSRichard Henderson } 20921894f69aSRichard Henderson } 20931894f69aSRichard Henderson 2094eeacee4dSBlue Swirl qemu_log("\n"); 2095c896fe29Sbellard } 2096c896fe29Sbellard } 2097c896fe29Sbellard 2098c896fe29Sbellard /* we give more priority to constraints with less registers */ 2099c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 2100c896fe29Sbellard { 2101c896fe29Sbellard const TCGArgConstraint *arg_ct; 2102c896fe29Sbellard 2103c896fe29Sbellard int i, n; 2104c896fe29Sbellard arg_ct = &def->args_ct[k]; 2105c896fe29Sbellard if (arg_ct->ct & TCG_CT_ALIAS) { 2106c896fe29Sbellard /* an alias is equivalent to a single register */ 2107c896fe29Sbellard n = 1; 2108c896fe29Sbellard } else { 2109c896fe29Sbellard if (!(arg_ct->ct & TCG_CT_REG)) 2110c896fe29Sbellard return 0; 2111c896fe29Sbellard n = 0; 2112c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2113c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, i)) 2114c896fe29Sbellard n++; 
2115c896fe29Sbellard } 2116c896fe29Sbellard } 2117c896fe29Sbellard return TCG_TARGET_NB_REGS - n + 1; 2118c896fe29Sbellard } 2119c896fe29Sbellard 2120c896fe29Sbellard /* sort from highest priority to lowest */ 2121c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 2122c896fe29Sbellard { 2123c896fe29Sbellard int i, j, p1, p2, tmp; 2124c896fe29Sbellard 2125c896fe29Sbellard for(i = 0; i < n; i++) 2126c896fe29Sbellard def->sorted_args[start + i] = start + i; 2127c896fe29Sbellard if (n <= 1) 2128c896fe29Sbellard return; 2129c896fe29Sbellard for(i = 0; i < n - 1; i++) { 2130c896fe29Sbellard for(j = i + 1; j < n; j++) { 2131c896fe29Sbellard p1 = get_constraint_priority(def, def->sorted_args[start + i]); 2132c896fe29Sbellard p2 = get_constraint_priority(def, def->sorted_args[start + j]); 2133c896fe29Sbellard if (p1 < p2) { 2134c896fe29Sbellard tmp = def->sorted_args[start + i]; 2135c896fe29Sbellard def->sorted_args[start + i] = def->sorted_args[start + j]; 2136c896fe29Sbellard def->sorted_args[start + j] = tmp; 2137c896fe29Sbellard } 2138c896fe29Sbellard } 2139c896fe29Sbellard } 2140c896fe29Sbellard } 2141c896fe29Sbellard 2142f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 2143c896fe29Sbellard { 2144a9751609SRichard Henderson TCGOpcode op; 2145c896fe29Sbellard 2146f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 2147f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 2148f69d277eSRichard Henderson const TCGTargetOpDef *tdefs; 2149069ea736SRichard Henderson TCGType type; 2150069ea736SRichard Henderson int i, nb_args; 2151f69d277eSRichard Henderson 2152f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 2153f69d277eSRichard Henderson continue; 2154f69d277eSRichard Henderson } 2155f69d277eSRichard Henderson 2156c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 2157f69d277eSRichard Henderson if (nb_args == 0) { 2158f69d277eSRichard Henderson continue; 2159f69d277eSRichard Henderson } 
2160f69d277eSRichard Henderson 2161f69d277eSRichard Henderson tdefs = tcg_target_op_def(op); 2162f69d277eSRichard Henderson /* Missing TCGTargetOpDef entry. */ 2163f69d277eSRichard Henderson tcg_debug_assert(tdefs != NULL); 2164f69d277eSRichard Henderson 2165069ea736SRichard Henderson type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32); 2166c896fe29Sbellard for (i = 0; i < nb_args; i++) { 2167f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 2168f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 2169eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 2170f69d277eSRichard Henderson 2171ccb1bb66SRichard Henderson def->args_ct[i].u.regs = 0; 2172c896fe29Sbellard def->args_ct[i].ct = 0; 217317280ff4SRichard Henderson while (*ct_str != '\0') { 217417280ff4SRichard Henderson switch(*ct_str) { 217517280ff4SRichard Henderson case '0' ... '9': 217617280ff4SRichard Henderson { 217717280ff4SRichard Henderson int oarg = *ct_str - '0'; 217817280ff4SRichard Henderson tcg_debug_assert(ct_str == tdefs->args_ct_str[i]); 2179eabb7b91SAurelien Jarno tcg_debug_assert(oarg < def->nb_oargs); 2180eabb7b91SAurelien Jarno tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG); 218117280ff4SRichard Henderson /* TCG_CT_ALIAS is for the output arguments. 218217280ff4SRichard Henderson The input is tagged with TCG_CT_IALIAS. 
*/ 2183c896fe29Sbellard def->args_ct[i] = def->args_ct[oarg]; 218417280ff4SRichard Henderson def->args_ct[oarg].ct |= TCG_CT_ALIAS; 21855ff9d6a4Sbellard def->args_ct[oarg].alias_index = i; 2186c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_IALIAS; 21875ff9d6a4Sbellard def->args_ct[i].alias_index = oarg; 218817280ff4SRichard Henderson } 218917280ff4SRichard Henderson ct_str++; 2190c896fe29Sbellard break; 219182790a87SRichard Henderson case '&': 219282790a87SRichard Henderson def->args_ct[i].ct |= TCG_CT_NEWREG; 219382790a87SRichard Henderson ct_str++; 219482790a87SRichard Henderson break; 2195c896fe29Sbellard case 'i': 2196c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 2197c896fe29Sbellard ct_str++; 2198c896fe29Sbellard break; 2199c896fe29Sbellard default: 2200069ea736SRichard Henderson ct_str = target_parse_constraint(&def->args_ct[i], 2201069ea736SRichard Henderson ct_str, type); 2202f69d277eSRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 2203069ea736SRichard Henderson tcg_debug_assert(ct_str != NULL); 2204c896fe29Sbellard } 2205c896fe29Sbellard } 2206c896fe29Sbellard } 2207c896fe29Sbellard 2208c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? 
*/ 2209eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 2210c68aaa18SStefan Weil 2211c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 2212c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 2213c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 2214c896fe29Sbellard } 2215c896fe29Sbellard } 2216c896fe29Sbellard 22170c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 22180c627cdcSRichard Henderson { 2219d88a117eSRichard Henderson TCGLabel *label; 2220d88a117eSRichard Henderson 2221d88a117eSRichard Henderson switch (op->opc) { 2222d88a117eSRichard Henderson case INDEX_op_br: 2223d88a117eSRichard Henderson label = arg_label(op->args[0]); 2224d88a117eSRichard Henderson label->refs--; 2225d88a117eSRichard Henderson break; 2226d88a117eSRichard Henderson case INDEX_op_brcond_i32: 2227d88a117eSRichard Henderson case INDEX_op_brcond_i64: 2228d88a117eSRichard Henderson label = arg_label(op->args[3]); 2229d88a117eSRichard Henderson label->refs--; 2230d88a117eSRichard Henderson break; 2231d88a117eSRichard Henderson case INDEX_op_brcond2_i32: 2232d88a117eSRichard Henderson label = arg_label(op->args[5]); 2233d88a117eSRichard Henderson label->refs--; 2234d88a117eSRichard Henderson break; 2235d88a117eSRichard Henderson default: 2236d88a117eSRichard Henderson break; 2237d88a117eSRichard Henderson } 2238d88a117eSRichard Henderson 223915fa08f8SRichard Henderson QTAILQ_REMOVE(&s->ops, op, link); 224015fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&s->free_ops, op, link); 2241abebf925SRichard Henderson s->nb_ops--; 22420c627cdcSRichard Henderson 22430c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 2244c3fac113SEmilio G. 
Cota atomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1); 22450c627cdcSRichard Henderson #endif 22460c627cdcSRichard Henderson } 22470c627cdcSRichard Henderson 224815fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc) 224915fa08f8SRichard Henderson { 225015fa08f8SRichard Henderson TCGContext *s = tcg_ctx; 225115fa08f8SRichard Henderson TCGOp *op; 225215fa08f8SRichard Henderson 225315fa08f8SRichard Henderson if (likely(QTAILQ_EMPTY(&s->free_ops))) { 225415fa08f8SRichard Henderson op = tcg_malloc(sizeof(TCGOp)); 225515fa08f8SRichard Henderson } else { 225615fa08f8SRichard Henderson op = QTAILQ_FIRST(&s->free_ops); 225715fa08f8SRichard Henderson QTAILQ_REMOVE(&s->free_ops, op, link); 225815fa08f8SRichard Henderson } 225915fa08f8SRichard Henderson memset(op, 0, offsetof(TCGOp, link)); 226015fa08f8SRichard Henderson op->opc = opc; 2261abebf925SRichard Henderson s->nb_ops++; 226215fa08f8SRichard Henderson 226315fa08f8SRichard Henderson return op; 226415fa08f8SRichard Henderson } 226515fa08f8SRichard Henderson 226615fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc) 226715fa08f8SRichard Henderson { 226815fa08f8SRichard Henderson TCGOp *op = tcg_op_alloc(opc); 226915fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link); 227015fa08f8SRichard Henderson return op; 227115fa08f8SRichard Henderson } 227215fa08f8SRichard Henderson 2273ac1043f6SEmilio G. Cota TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 22745a18407fSRichard Henderson { 227515fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 227615fa08f8SRichard Henderson QTAILQ_INSERT_BEFORE(old_op, new_op, link); 22775a18407fSRichard Henderson return new_op; 22785a18407fSRichard Henderson } 22795a18407fSRichard Henderson 2280ac1043f6SEmilio G. 
Cota TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, TCGOpcode opc) 22815a18407fSRichard Henderson { 228215fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 228315fa08f8SRichard Henderson QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link); 22845a18407fSRichard Henderson return new_op; 22855a18407fSRichard Henderson } 22865a18407fSRichard Henderson 2287b4fc67c7SRichard Henderson /* Reachable analysis : remove unreachable code. */ 2288b4fc67c7SRichard Henderson static void reachable_code_pass(TCGContext *s) 2289b4fc67c7SRichard Henderson { 2290b4fc67c7SRichard Henderson TCGOp *op, *op_next; 2291b4fc67c7SRichard Henderson bool dead = false; 2292b4fc67c7SRichard Henderson 2293b4fc67c7SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 2294b4fc67c7SRichard Henderson bool remove = dead; 2295b4fc67c7SRichard Henderson TCGLabel *label; 2296b4fc67c7SRichard Henderson int call_flags; 2297b4fc67c7SRichard Henderson 2298b4fc67c7SRichard Henderson switch (op->opc) { 2299b4fc67c7SRichard Henderson case INDEX_op_set_label: 2300b4fc67c7SRichard Henderson label = arg_label(op->args[0]); 2301b4fc67c7SRichard Henderson if (label->refs == 0) { 2302b4fc67c7SRichard Henderson /* 2303b4fc67c7SRichard Henderson * While there is an occasional backward branch, virtually 2304b4fc67c7SRichard Henderson * all branches generated by the translators are forward. 2305b4fc67c7SRichard Henderson * Which means that generally we will have already removed 2306b4fc67c7SRichard Henderson * all references to the label that will be, and there is 2307b4fc67c7SRichard Henderson * little to be gained by iterating. 2308b4fc67c7SRichard Henderson */ 2309b4fc67c7SRichard Henderson remove = true; 2310b4fc67c7SRichard Henderson } else { 2311b4fc67c7SRichard Henderson /* Once we see a label, insns become live again. 
*/ 2312b4fc67c7SRichard Henderson dead = false; 2313b4fc67c7SRichard Henderson remove = false; 2314b4fc67c7SRichard Henderson 2315b4fc67c7SRichard Henderson /* 2316b4fc67c7SRichard Henderson * Optimization can fold conditional branches to unconditional. 2317b4fc67c7SRichard Henderson * If we find a label with one reference which is preceded by 2318b4fc67c7SRichard Henderson * an unconditional branch to it, remove both. This needed to 2319b4fc67c7SRichard Henderson * wait until the dead code in between them was removed. 2320b4fc67c7SRichard Henderson */ 2321b4fc67c7SRichard Henderson if (label->refs == 1) { 2322b4fc67c7SRichard Henderson TCGOp *op_prev = QTAILQ_PREV(op, TCGOpHead, link); 2323b4fc67c7SRichard Henderson if (op_prev->opc == INDEX_op_br && 2324b4fc67c7SRichard Henderson label == arg_label(op_prev->args[0])) { 2325b4fc67c7SRichard Henderson tcg_op_remove(s, op_prev); 2326b4fc67c7SRichard Henderson remove = true; 2327b4fc67c7SRichard Henderson } 2328b4fc67c7SRichard Henderson } 2329b4fc67c7SRichard Henderson } 2330b4fc67c7SRichard Henderson break; 2331b4fc67c7SRichard Henderson 2332b4fc67c7SRichard Henderson case INDEX_op_br: 2333b4fc67c7SRichard Henderson case INDEX_op_exit_tb: 2334b4fc67c7SRichard Henderson case INDEX_op_goto_ptr: 2335b4fc67c7SRichard Henderson /* Unconditional branches; everything following is dead. */ 2336b4fc67c7SRichard Henderson dead = true; 2337b4fc67c7SRichard Henderson break; 2338b4fc67c7SRichard Henderson 2339b4fc67c7SRichard Henderson case INDEX_op_call: 2340b4fc67c7SRichard Henderson /* Notice noreturn helper calls, raising exceptions. 
*/ 2341b4fc67c7SRichard Henderson call_flags = op->args[TCGOP_CALLO(op) + TCGOP_CALLI(op) + 1]; 2342b4fc67c7SRichard Henderson if (call_flags & TCG_CALL_NO_RETURN) { 2343b4fc67c7SRichard Henderson dead = true; 2344b4fc67c7SRichard Henderson } 2345b4fc67c7SRichard Henderson break; 2346b4fc67c7SRichard Henderson 2347b4fc67c7SRichard Henderson case INDEX_op_insn_start: 2348b4fc67c7SRichard Henderson /* Never remove -- we need to keep these for unwind. */ 2349b4fc67c7SRichard Henderson remove = false; 2350b4fc67c7SRichard Henderson break; 2351b4fc67c7SRichard Henderson 2352b4fc67c7SRichard Henderson default: 2353b4fc67c7SRichard Henderson break; 2354b4fc67c7SRichard Henderson } 2355b4fc67c7SRichard Henderson 2356b4fc67c7SRichard Henderson if (remove) { 2357b4fc67c7SRichard Henderson tcg_op_remove(s, op); 2358b4fc67c7SRichard Henderson } 2359b4fc67c7SRichard Henderson } 2360b4fc67c7SRichard Henderson } 2361b4fc67c7SRichard Henderson 2362c70fbf0aSRichard Henderson #define TS_DEAD 1 2363c70fbf0aSRichard Henderson #define TS_MEM 2 2364c70fbf0aSRichard Henderson 23655a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 23665a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 23675a18407fSRichard Henderson 23689c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 23699c43b68dSAurelien Jarno should be in memory. 
*/ 2370b83eabeaSRichard Henderson static void tcg_la_func_end(TCGContext *s) 2371c896fe29Sbellard { 2372b83eabeaSRichard Henderson int ng = s->nb_globals; 2373b83eabeaSRichard Henderson int nt = s->nb_temps; 2374b83eabeaSRichard Henderson int i; 2375b83eabeaSRichard Henderson 2376b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2377b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2378b83eabeaSRichard Henderson } 2379b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2380b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD; 2381b83eabeaSRichard Henderson } 2382c896fe29Sbellard } 2383c896fe29Sbellard 23849c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 23859c43b68dSAurelien Jarno and local temps should be in memory. */ 2386b83eabeaSRichard Henderson static void tcg_la_bb_end(TCGContext *s) 2387641d5fbeSbellard { 2388b83eabeaSRichard Henderson int ng = s->nb_globals; 2389b83eabeaSRichard Henderson int nt = s->nb_temps; 2390b83eabeaSRichard Henderson int i; 2391641d5fbeSbellard 2392b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2393b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2394c70fbf0aSRichard Henderson } 2395b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2396b83eabeaSRichard Henderson s->temps[i].state = (s->temps[i].temp_local 2397b83eabeaSRichard Henderson ? TS_DEAD | TS_MEM 2398b83eabeaSRichard Henderson : TS_DEAD); 2399641d5fbeSbellard } 2400641d5fbeSbellard } 2401641d5fbeSbellard 2402a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 2403c896fe29Sbellard given input arguments is dead. Instructions updating dead 2404c896fe29Sbellard temporaries are removed. 
*/ 2405b83eabeaSRichard Henderson static void liveness_pass_1(TCGContext *s) 2406c896fe29Sbellard { 2407c70fbf0aSRichard Henderson int nb_globals = s->nb_globals; 240815fa08f8SRichard Henderson TCGOp *op, *op_prev; 2409c896fe29Sbellard 2410b83eabeaSRichard Henderson tcg_la_func_end(s); 2411c896fe29Sbellard 241215fa08f8SRichard Henderson QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, TCGOpHead, link, op_prev) { 2413c45cb8bbSRichard Henderson int i, nb_iargs, nb_oargs; 2414c45cb8bbSRichard Henderson TCGOpcode opc_new, opc_new2; 2415c45cb8bbSRichard Henderson bool have_opc_new2; 2416a1b3c48dSRichard Henderson TCGLifeData arg_life = 0; 2417b83eabeaSRichard Henderson TCGTemp *arg_ts; 2418c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 2419c45cb8bbSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 2420c45cb8bbSRichard Henderson 2421c45cb8bbSRichard Henderson switch (opc) { 2422c896fe29Sbellard case INDEX_op_call: 2423c6e113f5Sbellard { 2424c6e113f5Sbellard int call_flags; 2425c6e113f5Sbellard 2426cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2427cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 2428efee3746SRichard Henderson call_flags = op->args[nb_oargs + nb_iargs + 1]; 2429c6e113f5Sbellard 2430c45cb8bbSRichard Henderson /* pure functions can be removed if their result is unused */ 243178505279SAurelien Jarno if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) { 2432c6e113f5Sbellard for (i = 0; i < nb_oargs; i++) { 2433b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2434b83eabeaSRichard Henderson if (arg_ts->state != TS_DEAD) { 2435c6e113f5Sbellard goto do_not_remove_call; 2436c6e113f5Sbellard } 24379c43b68dSAurelien Jarno } 2438c45cb8bbSRichard Henderson goto do_remove; 2439*152c35aaSRichard Henderson } 2440c6e113f5Sbellard do_not_remove_call: 2441c896fe29Sbellard 2442c896fe29Sbellard /* output args are dead */ 2443c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2444b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 
2445b83eabeaSRichard Henderson if (arg_ts->state & TS_DEAD) { 2446a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 24476b64b624SAurelien Jarno } 2448b83eabeaSRichard Henderson if (arg_ts->state & TS_MEM) { 2449a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 24509c43b68dSAurelien Jarno } 2451b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 2452c896fe29Sbellard } 2453c896fe29Sbellard 245478505279SAurelien Jarno if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS | 245578505279SAurelien Jarno TCG_CALL_NO_READ_GLOBALS))) { 24569c43b68dSAurelien Jarno /* globals should go back to memory */ 2457b83eabeaSRichard Henderson for (i = 0; i < nb_globals; i++) { 2458b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2459b83eabeaSRichard Henderson } 2460c70fbf0aSRichard Henderson } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) { 2461c70fbf0aSRichard Henderson /* globals should be synced to memory */ 2462c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 2463b83eabeaSRichard Henderson s->temps[i].state |= TS_MEM; 2464c70fbf0aSRichard Henderson } 2465b9c18f56Saurel32 } 2466c896fe29Sbellard 2467c19f47bfSAurelien Jarno /* record arguments that die in this helper */ 2468866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2469b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2470b83eabeaSRichard Henderson if (arg_ts && arg_ts->state & TS_DEAD) { 2471a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2472c896fe29Sbellard } 2473c896fe29Sbellard } 247467cc32ebSVeres Lajos /* input arguments are live for preceding opcodes */ 2475c70fbf0aSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2476b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2477b83eabeaSRichard Henderson if (arg_ts) { 2478b83eabeaSRichard Henderson arg_ts->state &= ~TS_DEAD; 2479c70fbf0aSRichard Henderson } 2480c19f47bfSAurelien Jarno } 2481c6e113f5Sbellard } 2482c896fe29Sbellard break; 2483765b842aSRichard Henderson case 
INDEX_op_insn_start: 2484c896fe29Sbellard break; 24855ff9d6a4Sbellard case INDEX_op_discard: 24865ff9d6a4Sbellard /* mark the temporary as dead */ 2487b83eabeaSRichard Henderson arg_temp(op->args[0])->state = TS_DEAD; 24885ff9d6a4Sbellard break; 24891305c451SRichard Henderson 24901305c451SRichard Henderson case INDEX_op_add2_i32: 2491c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i32; 2492f1fae40cSRichard Henderson goto do_addsub2; 24931305c451SRichard Henderson case INDEX_op_sub2_i32: 2494c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i32; 2495f1fae40cSRichard Henderson goto do_addsub2; 2496f1fae40cSRichard Henderson case INDEX_op_add2_i64: 2497c45cb8bbSRichard Henderson opc_new = INDEX_op_add_i64; 2498f1fae40cSRichard Henderson goto do_addsub2; 2499f1fae40cSRichard Henderson case INDEX_op_sub2_i64: 2500c45cb8bbSRichard Henderson opc_new = INDEX_op_sub_i64; 2501f1fae40cSRichard Henderson do_addsub2: 25021305c451SRichard Henderson nb_iargs = 4; 25031305c451SRichard Henderson nb_oargs = 2; 25041305c451SRichard Henderson /* Test if the high part of the operation is dead, but not 25051305c451SRichard Henderson the low part. The result can be optimized to a simple 25061305c451SRichard Henderson add or sub. This happens often for x86_64 guest when the 25071305c451SRichard Henderson cpu mode is set to 32 bit. */ 2508b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2509b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 25101305c451SRichard Henderson goto do_remove; 25111305c451SRichard Henderson } 2512c45cb8bbSRichard Henderson /* Replace the opcode and adjust the args in place, 2513c45cb8bbSRichard Henderson leaving 3 unused args at the end. */ 2514c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2515efee3746SRichard Henderson op->args[1] = op->args[2]; 2516efee3746SRichard Henderson op->args[2] = op->args[4]; 25171305c451SRichard Henderson /* Fall through and mark the single-word operation live. 
*/ 25181305c451SRichard Henderson nb_iargs = 2; 25191305c451SRichard Henderson nb_oargs = 1; 25201305c451SRichard Henderson } 25211305c451SRichard Henderson goto do_not_remove; 25221305c451SRichard Henderson 25231414968aSRichard Henderson case INDEX_op_mulu2_i32: 2524c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2525c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i32; 2526c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i32; 252703271524SRichard Henderson goto do_mul2; 2528f1fae40cSRichard Henderson case INDEX_op_muls2_i32: 2529c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i32; 2530c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i32; 2531c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i32; 2532f1fae40cSRichard Henderson goto do_mul2; 2533f1fae40cSRichard Henderson case INDEX_op_mulu2_i64: 2534c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2535c45cb8bbSRichard Henderson opc_new2 = INDEX_op_muluh_i64; 2536c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_muluh_i64; 253703271524SRichard Henderson goto do_mul2; 2538f1fae40cSRichard Henderson case INDEX_op_muls2_i64: 2539c45cb8bbSRichard Henderson opc_new = INDEX_op_mul_i64; 2540c45cb8bbSRichard Henderson opc_new2 = INDEX_op_mulsh_i64; 2541c45cb8bbSRichard Henderson have_opc_new2 = TCG_TARGET_HAS_mulsh_i64; 254203271524SRichard Henderson goto do_mul2; 2543f1fae40cSRichard Henderson do_mul2: 25441414968aSRichard Henderson nb_iargs = 2; 25451414968aSRichard Henderson nb_oargs = 2; 2546b83eabeaSRichard Henderson if (arg_temp(op->args[1])->state == TS_DEAD) { 2547b83eabeaSRichard Henderson if (arg_temp(op->args[0])->state == TS_DEAD) { 254803271524SRichard Henderson /* Both parts of the operation are dead. */ 25491414968aSRichard Henderson goto do_remove; 25501414968aSRichard Henderson } 255103271524SRichard Henderson /* The high part of the operation is dead; generate the low. 
*/ 2552c45cb8bbSRichard Henderson op->opc = opc = opc_new; 2553efee3746SRichard Henderson op->args[1] = op->args[2]; 2554efee3746SRichard Henderson op->args[2] = op->args[3]; 2555b83eabeaSRichard Henderson } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) { 255603271524SRichard Henderson /* The low part of the operation is dead; generate the high. */ 2557c45cb8bbSRichard Henderson op->opc = opc = opc_new2; 2558efee3746SRichard Henderson op->args[0] = op->args[1]; 2559efee3746SRichard Henderson op->args[1] = op->args[2]; 2560efee3746SRichard Henderson op->args[2] = op->args[3]; 256103271524SRichard Henderson } else { 256203271524SRichard Henderson goto do_not_remove; 256303271524SRichard Henderson } 256403271524SRichard Henderson /* Mark the single-word operation live. */ 25651414968aSRichard Henderson nb_oargs = 1; 25661414968aSRichard Henderson goto do_not_remove; 25671414968aSRichard Henderson 2568c896fe29Sbellard default: 25691305c451SRichard Henderson /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */ 2570c896fe29Sbellard nb_iargs = def->nb_iargs; 2571c896fe29Sbellard nb_oargs = def->nb_oargs; 2572c896fe29Sbellard 2573c896fe29Sbellard /* Test if the operation can be removed because all 25745ff9d6a4Sbellard its outputs are dead. 
We assume that nb_oargs == 0 25755ff9d6a4Sbellard implies side effects */ 25765ff9d6a4Sbellard if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) { 2577c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2578b83eabeaSRichard Henderson if (arg_temp(op->args[i])->state != TS_DEAD) { 2579c896fe29Sbellard goto do_not_remove; 2580c896fe29Sbellard } 25819c43b68dSAurelien Jarno } 2582*152c35aaSRichard Henderson goto do_remove; 2583*152c35aaSRichard Henderson } 2584*152c35aaSRichard Henderson goto do_not_remove; 2585*152c35aaSRichard Henderson 25861305c451SRichard Henderson do_remove: 25870c627cdcSRichard Henderson tcg_op_remove(s, op); 2588*152c35aaSRichard Henderson break; 2589*152c35aaSRichard Henderson 2590c896fe29Sbellard do_not_remove: 2591c896fe29Sbellard /* output args are dead */ 2592c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 2593b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2594b83eabeaSRichard Henderson if (arg_ts->state & TS_DEAD) { 2595a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 25966b64b624SAurelien Jarno } 2597b83eabeaSRichard Henderson if (arg_ts->state & TS_MEM) { 2598a1b3c48dSRichard Henderson arg_life |= SYNC_ARG << i; 25999c43b68dSAurelien Jarno } 2600b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 2601c896fe29Sbellard } 2602c896fe29Sbellard 2603c896fe29Sbellard /* if end of basic block, update */ 2604c896fe29Sbellard if (def->flags & TCG_OPF_BB_END) { 2605b83eabeaSRichard Henderson tcg_la_bb_end(s); 26063d5c5f87SAurelien Jarno } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 26073d5c5f87SAurelien Jarno /* globals should be synced to memory */ 2608c70fbf0aSRichard Henderson for (i = 0; i < nb_globals; i++) { 2609b83eabeaSRichard Henderson s->temps[i].state |= TS_MEM; 2610c70fbf0aSRichard Henderson } 2611c896fe29Sbellard } 2612c896fe29Sbellard 2613c19f47bfSAurelien Jarno /* record arguments that die in this opcode */ 2614866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 2615b83eabeaSRichard 
Henderson arg_ts = arg_temp(op->args[i]); 2616b83eabeaSRichard Henderson if (arg_ts->state & TS_DEAD) { 2617a1b3c48dSRichard Henderson arg_life |= DEAD_ARG << i; 2618c896fe29Sbellard } 2619c19f47bfSAurelien Jarno } 262067cc32ebSVeres Lajos /* input arguments are live for preceding opcodes */ 2621c19f47bfSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 2622b83eabeaSRichard Henderson arg_temp(op->args[i])->state &= ~TS_DEAD; 2623c896fe29Sbellard } 2624c896fe29Sbellard break; 2625c896fe29Sbellard } 2626bee158cbSRichard Henderson op->life = arg_life; 262769e3706dSRichard Henderson op->output_pref[0] = 0; 262869e3706dSRichard Henderson op->output_pref[1] = 0; 2629c896fe29Sbellard } 26301ff0a2c5SEvgeny Voevodin } 2631c896fe29Sbellard 26325a18407fSRichard Henderson /* Liveness analysis: Convert indirect regs to direct temporaries. */ 2633b83eabeaSRichard Henderson static bool liveness_pass_2(TCGContext *s) 26345a18407fSRichard Henderson { 26355a18407fSRichard Henderson int nb_globals = s->nb_globals; 263615fa08f8SRichard Henderson int nb_temps, i; 26375a18407fSRichard Henderson bool changes = false; 263815fa08f8SRichard Henderson TCGOp *op, *op_next; 26395a18407fSRichard Henderson 26405a18407fSRichard Henderson /* Create a temporary for each indirect global. */ 26415a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 26425a18407fSRichard Henderson TCGTemp *its = &s->temps[i]; 26435a18407fSRichard Henderson if (its->indirect_reg) { 26445a18407fSRichard Henderson TCGTemp *dts = tcg_temp_alloc(s); 26455a18407fSRichard Henderson dts->type = its->type; 26465a18407fSRichard Henderson dts->base_type = its->base_type; 2647b83eabeaSRichard Henderson its->state_ptr = dts; 2648b83eabeaSRichard Henderson } else { 2649b83eabeaSRichard Henderson its->state_ptr = NULL; 26505a18407fSRichard Henderson } 2651b83eabeaSRichard Henderson /* All globals begin dead. 
*/ 2652b83eabeaSRichard Henderson its->state = TS_DEAD; 26535a18407fSRichard Henderson } 2654b83eabeaSRichard Henderson for (nb_temps = s->nb_temps; i < nb_temps; ++i) { 2655b83eabeaSRichard Henderson TCGTemp *its = &s->temps[i]; 2656b83eabeaSRichard Henderson its->state_ptr = NULL; 2657b83eabeaSRichard Henderson its->state = TS_DEAD; 2658b83eabeaSRichard Henderson } 26595a18407fSRichard Henderson 266015fa08f8SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 26615a18407fSRichard Henderson TCGOpcode opc = op->opc; 26625a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 26635a18407fSRichard Henderson TCGLifeData arg_life = op->life; 26645a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 2665b83eabeaSRichard Henderson TCGTemp *arg_ts, *dir_ts; 26665a18407fSRichard Henderson 26675a18407fSRichard Henderson if (opc == INDEX_op_call) { 2668cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2669cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 2670efee3746SRichard Henderson call_flags = op->args[nb_oargs + nb_iargs + 1]; 26715a18407fSRichard Henderson } else { 26725a18407fSRichard Henderson nb_iargs = def->nb_iargs; 26735a18407fSRichard Henderson nb_oargs = def->nb_oargs; 26745a18407fSRichard Henderson 26755a18407fSRichard Henderson /* Set flags similar to how calls require. */ 26765a18407fSRichard Henderson if (def->flags & TCG_OPF_BB_END) { 26775a18407fSRichard Henderson /* Like writing globals: save_globals */ 26785a18407fSRichard Henderson call_flags = 0; 26795a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 26805a18407fSRichard Henderson /* Like reading globals: sync_globals */ 26815a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 26825a18407fSRichard Henderson } else { 26835a18407fSRichard Henderson /* No effect on globals. 
*/ 26845a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 26855a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 26865a18407fSRichard Henderson } 26875a18407fSRichard Henderson } 26885a18407fSRichard Henderson 26895a18407fSRichard Henderson /* Make sure that input arguments are available. */ 26905a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2691b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2692b83eabeaSRichard Henderson if (arg_ts) { 2693b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2694b83eabeaSRichard Henderson if (dir_ts && arg_ts->state == TS_DEAD) { 2695b83eabeaSRichard Henderson TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32 26965a18407fSRichard Henderson ? INDEX_op_ld_i32 26975a18407fSRichard Henderson : INDEX_op_ld_i64); 2698ac1043f6SEmilio G. Cota TCGOp *lop = tcg_op_insert_before(s, op, lopc); 26995a18407fSRichard Henderson 2700b83eabeaSRichard Henderson lop->args[0] = temp_arg(dir_ts); 2701b83eabeaSRichard Henderson lop->args[1] = temp_arg(arg_ts->mem_base); 2702b83eabeaSRichard Henderson lop->args[2] = arg_ts->mem_offset; 27035a18407fSRichard Henderson 27045a18407fSRichard Henderson /* Loaded, but synced with memory. */ 2705b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 27065a18407fSRichard Henderson } 27075a18407fSRichard Henderson } 27085a18407fSRichard Henderson } 27095a18407fSRichard Henderson 27105a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 27115a18407fSRichard Henderson No action is required except keeping temp_state up to date 27125a18407fSRichard Henderson so that we reload when needed. 
*/ 27135a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2714b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2715b83eabeaSRichard Henderson if (arg_ts) { 2716b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2717b83eabeaSRichard Henderson if (dir_ts) { 2718b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 27195a18407fSRichard Henderson changes = true; 27205a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2721b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 27225a18407fSRichard Henderson } 27235a18407fSRichard Henderson } 27245a18407fSRichard Henderson } 27255a18407fSRichard Henderson } 27265a18407fSRichard Henderson 27275a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 27285a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 27295a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 27305a18407fSRichard Henderson /* Nothing to do */ 27315a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 27325a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 27335a18407fSRichard Henderson /* Liveness should see that globals are synced back, 27345a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. */ 2735b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2736b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2737b83eabeaSRichard Henderson || arg_ts->state != 0); 27385a18407fSRichard Henderson } 27395a18407fSRichard Henderson } else { 27405a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 27415a18407fSRichard Henderson /* Liveness should see that globals are saved back, 27425a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. 
*/ 2743b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2744b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2745b83eabeaSRichard Henderson || arg_ts->state == TS_DEAD); 27465a18407fSRichard Henderson } 27475a18407fSRichard Henderson } 27485a18407fSRichard Henderson 27495a18407fSRichard Henderson /* Outputs become available. */ 27505a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 2751b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2752b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2753b83eabeaSRichard Henderson if (!dir_ts) { 27545a18407fSRichard Henderson continue; 27555a18407fSRichard Henderson } 2756b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 27575a18407fSRichard Henderson changes = true; 27585a18407fSRichard Henderson 27595a18407fSRichard Henderson /* The output is now live and modified. */ 2760b83eabeaSRichard Henderson arg_ts->state = 0; 27615a18407fSRichard Henderson 27625a18407fSRichard Henderson /* Sync outputs upon their last write. */ 27635a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 2764b83eabeaSRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 27655a18407fSRichard Henderson ? INDEX_op_st_i32 27665a18407fSRichard Henderson : INDEX_op_st_i64); 2767ac1043f6SEmilio G. Cota TCGOp *sop = tcg_op_insert_after(s, op, sopc); 27685a18407fSRichard Henderson 2769b83eabeaSRichard Henderson sop->args[0] = temp_arg(dir_ts); 2770b83eabeaSRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 2771b83eabeaSRichard Henderson sop->args[2] = arg_ts->mem_offset; 27725a18407fSRichard Henderson 2773b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 27745a18407fSRichard Henderson } 27755a18407fSRichard Henderson /* Drop outputs that are dead. 
*/ 27765a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2777b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 27785a18407fSRichard Henderson } 27795a18407fSRichard Henderson } 27805a18407fSRichard Henderson } 27815a18407fSRichard Henderson 27825a18407fSRichard Henderson return changes; 27835a18407fSRichard Henderson } 27845a18407fSRichard Henderson 27858d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2786c896fe29Sbellard static void dump_regs(TCGContext *s) 2787c896fe29Sbellard { 2788c896fe29Sbellard TCGTemp *ts; 2789c896fe29Sbellard int i; 2790c896fe29Sbellard char buf[64]; 2791c896fe29Sbellard 2792c896fe29Sbellard for(i = 0; i < s->nb_temps; i++) { 2793c896fe29Sbellard ts = &s->temps[i]; 279443439139SRichard Henderson printf(" %10s: ", tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2795c896fe29Sbellard switch(ts->val_type) { 2796c896fe29Sbellard case TEMP_VAL_REG: 2797c896fe29Sbellard printf("%s", tcg_target_reg_names[ts->reg]); 2798c896fe29Sbellard break; 2799c896fe29Sbellard case TEMP_VAL_MEM: 2800b3a62939SRichard Henderson printf("%d(%s)", (int)ts->mem_offset, 2801b3a62939SRichard Henderson tcg_target_reg_names[ts->mem_base->reg]); 2802c896fe29Sbellard break; 2803c896fe29Sbellard case TEMP_VAL_CONST: 2804c896fe29Sbellard printf("$0x%" TCG_PRIlx, ts->val); 2805c896fe29Sbellard break; 2806c896fe29Sbellard case TEMP_VAL_DEAD: 2807c896fe29Sbellard printf("D"); 2808c896fe29Sbellard break; 2809c896fe29Sbellard default: 2810c896fe29Sbellard printf("???"); 2811c896fe29Sbellard break; 2812c896fe29Sbellard } 2813c896fe29Sbellard printf("\n"); 2814c896fe29Sbellard } 2815c896fe29Sbellard 2816c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2817f8b2f202SRichard Henderson if (s->reg_to_temp[i] != NULL) { 2818c896fe29Sbellard printf("%s: %s\n", 2819c896fe29Sbellard tcg_target_reg_names[i], 2820f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i])); 2821c896fe29Sbellard } 2822c896fe29Sbellard } 2823c896fe29Sbellard } 
2824c896fe29Sbellard 2825c896fe29Sbellard static void check_regs(TCGContext *s) 2826c896fe29Sbellard { 2827869938aeSRichard Henderson int reg; 2828b6638662SRichard Henderson int k; 2829c896fe29Sbellard TCGTemp *ts; 2830c896fe29Sbellard char buf[64]; 2831c896fe29Sbellard 2832c896fe29Sbellard for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) { 2833f8b2f202SRichard Henderson ts = s->reg_to_temp[reg]; 2834f8b2f202SRichard Henderson if (ts != NULL) { 2835f8b2f202SRichard Henderson if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) { 2836c896fe29Sbellard printf("Inconsistency for register %s:\n", 2837c896fe29Sbellard tcg_target_reg_names[reg]); 2838b03cce8eSbellard goto fail; 2839c896fe29Sbellard } 2840c896fe29Sbellard } 2841c896fe29Sbellard } 2842c896fe29Sbellard for (k = 0; k < s->nb_temps; k++) { 2843c896fe29Sbellard ts = &s->temps[k]; 2844f8b2f202SRichard Henderson if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg 2845f8b2f202SRichard Henderson && s->reg_to_temp[ts->reg] != ts) { 2846c896fe29Sbellard printf("Inconsistency for temp %s:\n", 2847f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2848b03cce8eSbellard fail: 2849c896fe29Sbellard printf("reg state:\n"); 2850c896fe29Sbellard dump_regs(s); 2851c896fe29Sbellard tcg_abort(); 2852c896fe29Sbellard } 2853c896fe29Sbellard } 2854c896fe29Sbellard } 2855c896fe29Sbellard #endif 2856c896fe29Sbellard 28572272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts) 2858c896fe29Sbellard { 28599b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64) 28609b9c37c3SRichard Henderson /* Sparc64 stack is accessed with offset of 2047 */ 2861b591dc59SBlue Swirl s->current_frame_offset = (s->current_frame_offset + 2862b591dc59SBlue Swirl (tcg_target_long)sizeof(tcg_target_long) - 1) & 2863b591dc59SBlue Swirl ~(sizeof(tcg_target_long) - 1); 2864f44c9960SBlue Swirl #endif 2865b591dc59SBlue Swirl if (s->current_frame_offset + 
(tcg_target_long)sizeof(tcg_target_long) > 2866b591dc59SBlue Swirl s->frame_end) { 28675ff9d6a4Sbellard tcg_abort(); 2868b591dc59SBlue Swirl } 2869c896fe29Sbellard ts->mem_offset = s->current_frame_offset; 2870b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 2871c896fe29Sbellard ts->mem_allocated = 1; 2872e2c6d1b4SRichard Henderson s->current_frame_offset += sizeof(tcg_target_long); 2873c896fe29Sbellard } 2874c896fe29Sbellard 2875b722452aSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet, TCGRegSet); 2876b3915dbbSRichard Henderson 287759d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 287859d7c14eSRichard Henderson mark it free; otherwise mark it dead. */ 287959d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 2880c896fe29Sbellard { 288159d7c14eSRichard Henderson if (ts->fixed_reg) { 288259d7c14eSRichard Henderson return; 288359d7c14eSRichard Henderson } 288459d7c14eSRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 288559d7c14eSRichard Henderson s->reg_to_temp[ts->reg] = NULL; 288659d7c14eSRichard Henderson } 288759d7c14eSRichard Henderson ts->val_type = (free_or_dead < 0 288859d7c14eSRichard Henderson || ts->temp_local 2889fa477d25SRichard Henderson || ts->temp_global 289059d7c14eSRichard Henderson ? TEMP_VAL_MEM : TEMP_VAL_DEAD); 289159d7c14eSRichard Henderson } 2892c896fe29Sbellard 289359d7c14eSRichard Henderson /* Mark a temporary as dead. */ 289459d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 289559d7c14eSRichard Henderson { 289659d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 289759d7c14eSRichard Henderson } 289859d7c14eSRichard Henderson 289959d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 290059d7c14eSRichard Henderson registers needs to be allocated to store a constant. 
If 'free_or_dead' 290159d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 290259d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. */ 290398b4e186SRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs, 290498b4e186SRichard Henderson TCGRegSet preferred_regs, int free_or_dead) 290559d7c14eSRichard Henderson { 290659d7c14eSRichard Henderson if (ts->fixed_reg) { 290759d7c14eSRichard Henderson return; 290859d7c14eSRichard Henderson } 290959d7c14eSRichard Henderson if (!ts->mem_coherent) { 29107f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 29112272e4a7SRichard Henderson temp_allocate_frame(s, ts); 291259d7c14eSRichard Henderson } 291359d7c14eSRichard Henderson switch (ts->val_type) { 291459d7c14eSRichard Henderson case TEMP_VAL_CONST: 291559d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 291659d7c14eSRichard Henderson require it later in a register, so attempt to store the 291759d7c14eSRichard Henderson constant to memory directly. 
*/ 291859d7c14eSRichard Henderson if (free_or_dead 291959d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 292059d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 292159d7c14eSRichard Henderson break; 292259d7c14eSRichard Henderson } 292359d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 292498b4e186SRichard Henderson allocated_regs, preferred_regs); 292559d7c14eSRichard Henderson /* fallthrough */ 292659d7c14eSRichard Henderson 292759d7c14eSRichard Henderson case TEMP_VAL_REG: 292859d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 292959d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 293059d7c14eSRichard Henderson break; 293159d7c14eSRichard Henderson 293259d7c14eSRichard Henderson case TEMP_VAL_MEM: 293359d7c14eSRichard Henderson break; 293459d7c14eSRichard Henderson 293559d7c14eSRichard Henderson case TEMP_VAL_DEAD: 293659d7c14eSRichard Henderson default: 293759d7c14eSRichard Henderson tcg_abort(); 2938c896fe29Sbellard } 29397f6ceedfSAurelien Jarno ts->mem_coherent = 1; 29407f6ceedfSAurelien Jarno } 294159d7c14eSRichard Henderson if (free_or_dead) { 294259d7c14eSRichard Henderson temp_free_or_dead(s, ts, free_or_dead); 294359d7c14eSRichard Henderson } 294459d7c14eSRichard Henderson } 29457f6ceedfSAurelien Jarno 29467f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 2947b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 29487f6ceedfSAurelien Jarno { 2949f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 2950f8b2f202SRichard Henderson if (ts != NULL) { 295198b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, -1); 2952c896fe29Sbellard } 2953c896fe29Sbellard } 2954c896fe29Sbellard 2955b016486eSRichard Henderson /** 2956b016486eSRichard Henderson * tcg_reg_alloc: 2957b016486eSRichard Henderson * @required_regs: Set of registers in which we must allocate. 
2958b016486eSRichard Henderson * @allocated_regs: Set of registers which must be avoided. 2959b016486eSRichard Henderson * @preferred_regs: Set of registers we should prefer. 2960b016486eSRichard Henderson * @rev: True if we search the registers in "indirect" order. 2961b016486eSRichard Henderson * 2962b016486eSRichard Henderson * The allocated register must be in @required_regs & ~@allocated_regs, 2963b016486eSRichard Henderson * but if we can put it in @preferred_regs we may save a move later. 2964b016486eSRichard Henderson */ 2965b016486eSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet required_regs, 2966b016486eSRichard Henderson TCGRegSet allocated_regs, 2967b016486eSRichard Henderson TCGRegSet preferred_regs, bool rev) 2968c896fe29Sbellard { 2969b016486eSRichard Henderson int i, j, f, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 2970b016486eSRichard Henderson TCGRegSet reg_ct[2]; 297191478cefSRichard Henderson const int *order; 2972c896fe29Sbellard 2973b016486eSRichard Henderson reg_ct[1] = required_regs & ~allocated_regs; 2974b016486eSRichard Henderson tcg_debug_assert(reg_ct[1] != 0); 2975b016486eSRichard Henderson reg_ct[0] = reg_ct[1] & preferred_regs; 2976b016486eSRichard Henderson 2977b016486eSRichard Henderson /* Skip the preferred_regs option if it cannot be satisfied, 2978b016486eSRichard Henderson or if the preference made no difference. */ 2979b016486eSRichard Henderson f = reg_ct[0] == 0 || reg_ct[0] == reg_ct[1]; 2980b016486eSRichard Henderson 298191478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 2982c896fe29Sbellard 2983b016486eSRichard Henderson /* Try free registers, preferences first. */ 2984b016486eSRichard Henderson for (j = f; j < 2; j++) { 2985b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 2986b016486eSRichard Henderson 2987b016486eSRichard Henderson if (tcg_regset_single(set)) { 2988b016486eSRichard Henderson /* One register in the set. 
*/ 2989b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 2990b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL) { 2991c896fe29Sbellard return reg; 2992c896fe29Sbellard } 2993b016486eSRichard Henderson } else { 299491478cefSRichard Henderson for (i = 0; i < n; i++) { 2995b016486eSRichard Henderson TCGReg reg = order[i]; 2996b016486eSRichard Henderson if (s->reg_to_temp[reg] == NULL && 2997b016486eSRichard Henderson tcg_regset_test_reg(set, reg)) { 2998b016486eSRichard Henderson return reg; 2999b016486eSRichard Henderson } 3000b016486eSRichard Henderson } 3001b016486eSRichard Henderson } 3002b016486eSRichard Henderson } 3003b016486eSRichard Henderson 3004b016486eSRichard Henderson /* We must spill something. */ 3005b016486eSRichard Henderson for (j = f; j < 2; j++) { 3006b016486eSRichard Henderson TCGRegSet set = reg_ct[j]; 3007b016486eSRichard Henderson 3008b016486eSRichard Henderson if (tcg_regset_single(set)) { 3009b016486eSRichard Henderson /* One register in the set. */ 3010b016486eSRichard Henderson TCGReg reg = tcg_regset_first(set); 3011b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3012c896fe29Sbellard return reg; 3013b016486eSRichard Henderson } else { 3014b016486eSRichard Henderson for (i = 0; i < n; i++) { 3015b016486eSRichard Henderson TCGReg reg = order[i]; 3016b016486eSRichard Henderson if (tcg_regset_test_reg(set, reg)) { 3017b016486eSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 3018b016486eSRichard Henderson return reg; 3019b016486eSRichard Henderson } 3020b016486eSRichard Henderson } 3021c896fe29Sbellard } 3022c896fe29Sbellard } 3023c896fe29Sbellard 3024c896fe29Sbellard tcg_abort(); 3025c896fe29Sbellard } 3026c896fe29Sbellard 302740ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 302840ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. 
*/ 302940ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 3030b722452aSRichard Henderson TCGRegSet allocated_regs, TCGRegSet preferred_regs) 303140ae5c62SRichard Henderson { 303240ae5c62SRichard Henderson TCGReg reg; 303340ae5c62SRichard Henderson 303440ae5c62SRichard Henderson switch (ts->val_type) { 303540ae5c62SRichard Henderson case TEMP_VAL_REG: 303640ae5c62SRichard Henderson return; 303740ae5c62SRichard Henderson case TEMP_VAL_CONST: 3038b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3039b722452aSRichard Henderson preferred_regs, ts->indirect_base); 304040ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 304140ae5c62SRichard Henderson ts->mem_coherent = 0; 304240ae5c62SRichard Henderson break; 304340ae5c62SRichard Henderson case TEMP_VAL_MEM: 3044b016486eSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, 3045b722452aSRichard Henderson preferred_regs, ts->indirect_base); 304640ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 304740ae5c62SRichard Henderson ts->mem_coherent = 1; 304840ae5c62SRichard Henderson break; 304940ae5c62SRichard Henderson case TEMP_VAL_DEAD: 305040ae5c62SRichard Henderson default: 305140ae5c62SRichard Henderson tcg_abort(); 305240ae5c62SRichard Henderson } 305340ae5c62SRichard Henderson ts->reg = reg; 305440ae5c62SRichard Henderson ts->val_type = TEMP_VAL_REG; 305540ae5c62SRichard Henderson s->reg_to_temp[reg] = ts; 305640ae5c62SRichard Henderson } 305740ae5c62SRichard Henderson 305859d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 3059e8996ee0Sbellard temporary registers needs to be allocated to store a constant. 
*/ 306059d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 30611ad80729SAurelien Jarno { 30622c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 3063eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. */ 3064f8bf00f1SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg); 30651ad80729SAurelien Jarno } 30661ad80729SAurelien Jarno 30679814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 3068641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 3069641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 3070641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 3071641d5fbeSbellard { 3072ac3b8891SRichard Henderson int i, n; 3073641d5fbeSbellard 3074ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 3075b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 3076641d5fbeSbellard } 3077e5097dc8Sbellard } 3078e5097dc8Sbellard 30793d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 30803d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 30813d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. 
*/ 30823d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 30833d5c5f87SAurelien Jarno { 3084ac3b8891SRichard Henderson int i, n; 30853d5c5f87SAurelien Jarno 3086ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 308712b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 308812b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 308912b9b11aSRichard Henderson || ts->fixed_reg 309012b9b11aSRichard Henderson || ts->mem_coherent); 30913d5c5f87SAurelien Jarno } 30923d5c5f87SAurelien Jarno } 30933d5c5f87SAurelien Jarno 3094e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 3095e8996ee0Sbellard all globals are stored at their canonical location. */ 3096e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 3097e5097dc8Sbellard { 3098e5097dc8Sbellard int i; 3099e5097dc8Sbellard 3100c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 3101b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 3102641d5fbeSbellard if (ts->temp_local) { 3103b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 3104641d5fbeSbellard } else { 31052c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 3106eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 3107eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 3108c896fe29Sbellard } 3109641d5fbeSbellard } 3110e8996ee0Sbellard 3111e8996ee0Sbellard save_globals(s, allocated_regs); 3112c896fe29Sbellard } 3113c896fe29Sbellard 31140fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 3115ba87719cSRichard Henderson tcg_target_ulong val, TCGLifeData arg_life, 3116ba87719cSRichard Henderson TCGRegSet preferred_regs) 3117e8996ee0Sbellard { 3118e8996ee0Sbellard if (ots->fixed_reg) { 311959d7c14eSRichard Henderson /* For fixed registers, we do not do any constant propagation. 
*/ 3120e8996ee0Sbellard tcg_out_movi(s, ots->type, ots->reg, val); 312159d7c14eSRichard Henderson return; 312259d7c14eSRichard Henderson } 312359d7c14eSRichard Henderson 312459d7c14eSRichard Henderson /* The movi is not explicitly generated here. */ 3125f8b2f202SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 3126f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 3127f8b2f202SRichard Henderson } 3128e8996ee0Sbellard ots->val_type = TEMP_VAL_CONST; 3129e8996ee0Sbellard ots->val = val; 313059d7c14eSRichard Henderson ots->mem_coherent = 0; 3131ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 3132ba87719cSRichard Henderson temp_sync(s, ots, s->reserved_regs, preferred_regs, IS_DEAD_ARG(0)); 313359d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 3134f8bf00f1SRichard Henderson temp_dead(s, ots); 31354c4e1ab2SAurelien Jarno } 3136e8996ee0Sbellard } 3137e8996ee0Sbellard 3138dd186292SRichard Henderson static void tcg_reg_alloc_movi(TCGContext *s, const TCGOp *op) 31390fe4fca4SPaolo Bonzini { 314043439139SRichard Henderson TCGTemp *ots = arg_temp(op->args[0]); 3141dd186292SRichard Henderson tcg_target_ulong val = op->args[1]; 31420fe4fca4SPaolo Bonzini 314369e3706dSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, op->life, op->output_pref[0]); 31440fe4fca4SPaolo Bonzini } 31450fe4fca4SPaolo Bonzini 3146dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op) 3147c896fe29Sbellard { 3148dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 314969e3706dSRichard Henderson TCGRegSet allocated_regs, preferred_regs; 3150c896fe29Sbellard TCGTemp *ts, *ots; 3151450445d5SRichard Henderson TCGType otype, itype; 3152c896fe29Sbellard 3153d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 315469e3706dSRichard Henderson preferred_regs = op->output_pref[0]; 315543439139SRichard Henderson ots = arg_temp(op->args[0]); 315643439139SRichard Henderson ts = arg_temp(op->args[1]); 3157450445d5SRichard Henderson 
3158450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. */ 3159450445d5SRichard Henderson otype = ots->type; 3160450445d5SRichard Henderson itype = ts->type; 3161c896fe29Sbellard 31620fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 31630fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 31640fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 31650fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 31660fe4fca4SPaolo Bonzini temp_dead(s, ts); 31670fe4fca4SPaolo Bonzini } 316869e3706dSRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, arg_life, preferred_regs); 31690fe4fca4SPaolo Bonzini return; 31700fe4fca4SPaolo Bonzini } 31710fe4fca4SPaolo Bonzini 31720fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 31730fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 31740fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 31750fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 31760fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 317769e3706dSRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], 317869e3706dSRichard Henderson allocated_regs, preferred_regs); 3179c29c1d7eSAurelien Jarno } 3180c29c1d7eSAurelien Jarno 31810fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 3182c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(0) && !ots->fixed_reg) { 3183c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 3184c29c1d7eSAurelien Jarno liveness analysis disabled). 
*/ 3185eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 3186c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 31872272e4a7SRichard Henderson temp_allocate_frame(s, ots); 3188c29c1d7eSAurelien Jarno } 3189b3a62939SRichard Henderson tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset); 3190c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 3191f8bf00f1SRichard Henderson temp_dead(s, ts); 3192c29c1d7eSAurelien Jarno } 3193f8bf00f1SRichard Henderson temp_dead(s, ots); 3194e8996ee0Sbellard } else { 3195c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) { 3196c29c1d7eSAurelien Jarno /* the mov can be suppressed */ 3197c29c1d7eSAurelien Jarno if (ots->val_type == TEMP_VAL_REG) { 3198f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 3199c896fe29Sbellard } 3200c29c1d7eSAurelien Jarno ots->reg = ts->reg; 3201f8bf00f1SRichard Henderson temp_dead(s, ts); 3202c29c1d7eSAurelien Jarno } else { 3203c29c1d7eSAurelien Jarno if (ots->val_type != TEMP_VAL_REG) { 3204c29c1d7eSAurelien Jarno /* When allocating a new register, make sure to not spill the 3205c29c1d7eSAurelien Jarno input one. 
*/ 3206c29c1d7eSAurelien Jarno tcg_regset_set_reg(allocated_regs, ts->reg); 3207450445d5SRichard Henderson ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 320869e3706dSRichard Henderson allocated_regs, preferred_regs, 3209b016486eSRichard Henderson ots->indirect_base); 3210c29c1d7eSAurelien Jarno } 3211450445d5SRichard Henderson tcg_out_mov(s, otype, ots->reg, ts->reg); 3212c29c1d7eSAurelien Jarno } 3213c896fe29Sbellard ots->val_type = TEMP_VAL_REG; 3214c896fe29Sbellard ots->mem_coherent = 0; 3215f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = ots; 3216ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 321798b4e186SRichard Henderson temp_sync(s, ots, allocated_regs, 0, 0); 3218c29c1d7eSAurelien Jarno } 3219ec7a869dSAurelien Jarno } 3220c896fe29Sbellard } 3221c896fe29Sbellard 3222dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op) 3223c896fe29Sbellard { 3224dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3225dd186292SRichard Henderson const TCGOpDef * const def = &tcg_op_defs[op->opc]; 322682790a87SRichard Henderson TCGRegSet i_allocated_regs; 322782790a87SRichard Henderson TCGRegSet o_allocated_regs; 3228b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 3229b6638662SRichard Henderson TCGReg reg; 3230c896fe29Sbellard TCGArg arg; 3231c896fe29Sbellard const TCGArgConstraint *arg_ct; 3232c896fe29Sbellard TCGTemp *ts; 3233c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 3234c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 3235c896fe29Sbellard 3236c896fe29Sbellard nb_oargs = def->nb_oargs; 3237c896fe29Sbellard nb_iargs = def->nb_iargs; 3238c896fe29Sbellard 3239c896fe29Sbellard /* copy constants */ 3240c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 3241dd186292SRichard Henderson op->args + nb_oargs + nb_iargs, 3242c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 3243c896fe29Sbellard 3244d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 3245d21369f5SRichard Henderson 
o_allocated_regs = s->reserved_regs; 324682790a87SRichard Henderson 3247c896fe29Sbellard /* satisfy input constraints */ 3248c896fe29Sbellard for (k = 0; k < nb_iargs; k++) { 3249d62816f2SRichard Henderson TCGRegSet i_preferred_regs, o_preferred_regs; 3250d62816f2SRichard Henderson 3251c896fe29Sbellard i = def->sorted_args[nb_oargs + k]; 3252dd186292SRichard Henderson arg = op->args[i]; 3253c896fe29Sbellard arg_ct = &def->args_ct[i]; 325443439139SRichard Henderson ts = arg_temp(arg); 325540ae5c62SRichard Henderson 325640ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 325740ae5c62SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct)) { 3258c896fe29Sbellard /* constant is OK for instruction */ 3259c896fe29Sbellard const_args[i] = 1; 3260c896fe29Sbellard new_args[i] = ts->val; 3261d62816f2SRichard Henderson continue; 3262c896fe29Sbellard } 326340ae5c62SRichard Henderson 3264d62816f2SRichard Henderson i_preferred_regs = o_preferred_regs = 0; 32655ff9d6a4Sbellard if (arg_ct->ct & TCG_CT_IALIAS) { 3266d62816f2SRichard Henderson o_preferred_regs = op->output_pref[arg_ct->alias_index]; 32675ff9d6a4Sbellard if (ts->fixed_reg) { 32685ff9d6a4Sbellard /* if fixed register, we must allocate a new register 32695ff9d6a4Sbellard if the alias is not the same register */ 3270d62816f2SRichard Henderson if (arg != op->args[arg_ct->alias_index]) { 32715ff9d6a4Sbellard goto allocate_in_reg; 3272d62816f2SRichard Henderson } 32735ff9d6a4Sbellard } else { 3274c896fe29Sbellard /* if the input is aliased to an output and if it is 3275c896fe29Sbellard not dead after the instruction, we must allocate 3276c896fe29Sbellard a new register and move it */ 3277866cb6cbSAurelien Jarno if (!IS_DEAD_ARG(i)) { 3278c896fe29Sbellard goto allocate_in_reg; 3279c896fe29Sbellard } 3280d62816f2SRichard Henderson 32817e1df267SAurelien Jarno /* check if the current register has already been allocated 32827e1df267SAurelien Jarno for another input aliased to an output */ 
3283d62816f2SRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 32847e1df267SAurelien Jarno int k2, i2; 3285d62816f2SRichard Henderson reg = ts->reg; 32867e1df267SAurelien Jarno for (k2 = 0 ; k2 < k ; k2++) { 32877e1df267SAurelien Jarno i2 = def->sorted_args[nb_oargs + k2]; 32887e1df267SAurelien Jarno if ((def->args_ct[i2].ct & TCG_CT_IALIAS) && 3289d62816f2SRichard Henderson reg == new_args[i2]) { 32907e1df267SAurelien Jarno goto allocate_in_reg; 32917e1df267SAurelien Jarno } 32927e1df267SAurelien Jarno } 32935ff9d6a4Sbellard } 3294d62816f2SRichard Henderson i_preferred_regs = o_preferred_regs; 3295866cb6cbSAurelien Jarno } 3296d62816f2SRichard Henderson } 3297d62816f2SRichard Henderson 3298d62816f2SRichard Henderson temp_load(s, ts, arg_ct->u.regs, i_allocated_regs, i_preferred_regs); 3299c896fe29Sbellard reg = ts->reg; 3300d62816f2SRichard Henderson 3301c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3302c896fe29Sbellard /* nothing to do : the constraint is satisfied */ 3303c896fe29Sbellard } else { 3304c896fe29Sbellard allocate_in_reg: 3305c896fe29Sbellard /* allocate a new register matching the constraint 3306c896fe29Sbellard and move the temporary register into it */ 3307d62816f2SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 3308d62816f2SRichard Henderson i_allocated_regs, 0); 330982790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs, 3310d62816f2SRichard Henderson o_preferred_regs, ts->indirect_base); 33113b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3312c896fe29Sbellard } 3313c896fe29Sbellard new_args[i] = reg; 3314c896fe29Sbellard const_args[i] = 0; 331582790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 3316c896fe29Sbellard } 3317c896fe29Sbellard 3318c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3319866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 3320866cb6cbSAurelien Jarno if 
(IS_DEAD_ARG(i)) { 332143439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3322c896fe29Sbellard } 3323c896fe29Sbellard } 3324c896fe29Sbellard 3325a52ad07eSAurelien Jarno if (def->flags & TCG_OPF_BB_END) { 332682790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 3327a52ad07eSAurelien Jarno } else { 3328c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 3329b03cce8eSbellard /* XXX: permit generic clobber register list ? */ 3330c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3331c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 333282790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 3333c896fe29Sbellard } 3334c896fe29Sbellard } 33353d5c5f87SAurelien Jarno } 33363d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 33373d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 33383d5c5f87SAurelien Jarno an exception. */ 333982790a87SRichard Henderson sync_globals(s, i_allocated_regs); 3340c896fe29Sbellard } 3341c896fe29Sbellard 3342c896fe29Sbellard /* satisfy the output constraints */ 3343c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 3344c896fe29Sbellard i = def->sorted_args[k]; 3345dd186292SRichard Henderson arg = op->args[i]; 3346c896fe29Sbellard arg_ct = &def->args_ct[i]; 334743439139SRichard Henderson ts = arg_temp(arg); 334817280ff4SRichard Henderson if ((arg_ct->ct & TCG_CT_ALIAS) 334917280ff4SRichard Henderson && !const_args[arg_ct->alias_index]) { 33505ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 335182790a87SRichard Henderson } else if (arg_ct->ct & TCG_CT_NEWREG) { 335282790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, 335382790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 335469e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3355c896fe29Sbellard } else { 3356c896fe29Sbellard /* if fixed register, we try to use it */ 3357c896fe29Sbellard reg = ts->reg; 
3358c896fe29Sbellard if (ts->fixed_reg && 3359c896fe29Sbellard tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3360c896fe29Sbellard goto oarg_end; 3361c896fe29Sbellard } 336282790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs, 336369e3706dSRichard Henderson op->output_pref[k], ts->indirect_base); 3364c896fe29Sbellard } 336582790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 3366c896fe29Sbellard /* if a fixed register is used, then a move will be done afterwards */ 3367c896fe29Sbellard if (!ts->fixed_reg) { 3368639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3369f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3370639368ddSAurelien Jarno } 3371c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3372c896fe29Sbellard ts->reg = reg; 3373c896fe29Sbellard /* temp value is modified, so the value kept in memory is 3374c896fe29Sbellard potentially not the same */ 3375c896fe29Sbellard ts->mem_coherent = 0; 3376f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3377c896fe29Sbellard } 3378c896fe29Sbellard oarg_end: 3379c896fe29Sbellard new_args[i] = reg; 3380c896fe29Sbellard } 3381e8996ee0Sbellard } 3382c896fe29Sbellard 3383c896fe29Sbellard /* emit instruction */ 3384d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 3385d2fd745fSRichard Henderson tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op), 3386d2fd745fSRichard Henderson new_args, const_args); 3387d2fd745fSRichard Henderson } else { 3388dd186292SRichard Henderson tcg_out_op(s, op->opc, new_args, const_args); 3389d2fd745fSRichard Henderson } 3390c896fe29Sbellard 3391c896fe29Sbellard /* move the outputs in the correct register if needed */ 3392c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 339343439139SRichard Henderson ts = arg_temp(op->args[i]); 3394c896fe29Sbellard reg = new_args[i]; 3395c896fe29Sbellard if (ts->fixed_reg && ts->reg != reg) { 33963b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3397c896fe29Sbellard } 
3398ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 339998b4e186SRichard Henderson temp_sync(s, ts, o_allocated_regs, 0, IS_DEAD_ARG(i)); 340059d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3401f8bf00f1SRichard Henderson temp_dead(s, ts); 3402ec7a869dSAurelien Jarno } 3403c896fe29Sbellard } 3404c896fe29Sbellard } 3405c896fe29Sbellard 3406b03cce8eSbellard #ifdef TCG_TARGET_STACK_GROWSUP 3407b03cce8eSbellard #define STACK_DIR(x) (-(x)) 3408b03cce8eSbellard #else 3409b03cce8eSbellard #define STACK_DIR(x) (x) 3410b03cce8eSbellard #endif 3411b03cce8eSbellard 3412dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op) 3413c896fe29Sbellard { 3414cd9090aaSRichard Henderson const int nb_oargs = TCGOP_CALLO(op); 3415cd9090aaSRichard Henderson const int nb_iargs = TCGOP_CALLI(op); 3416dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3417b6638662SRichard Henderson int flags, nb_regs, i; 3418b6638662SRichard Henderson TCGReg reg; 3419cf066674SRichard Henderson TCGArg arg; 3420c896fe29Sbellard TCGTemp *ts; 3421d3452f1fSRichard Henderson intptr_t stack_offset; 3422d3452f1fSRichard Henderson size_t call_stack_size; 3423cf066674SRichard Henderson tcg_insn_unit *func_addr; 3424cf066674SRichard Henderson int allocate_args; 3425c896fe29Sbellard TCGRegSet allocated_regs; 3426c896fe29Sbellard 3427dd186292SRichard Henderson func_addr = (tcg_insn_unit *)(intptr_t)op->args[nb_oargs + nb_iargs]; 3428dd186292SRichard Henderson flags = op->args[nb_oargs + nb_iargs + 1]; 3429c896fe29Sbellard 34306e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 3431c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 3432c45cb8bbSRichard Henderson nb_regs = nb_iargs; 3433cf066674SRichard Henderson } 3434c896fe29Sbellard 3435c896fe29Sbellard /* assign stack slots first */ 3436c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 3437c896fe29Sbellard call_stack_size = (call_stack_size + 
TCG_TARGET_STACK_ALIGN - 1) & 3438c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 3439b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 3440b03cce8eSbellard if (allocate_args) { 3441345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 3442345649c0SBlue Swirl preallocate call stack */ 3443345649c0SBlue Swirl tcg_abort(); 3444b03cce8eSbellard } 344539cf05d3Sbellard 344639cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 3447c45cb8bbSRichard Henderson for (i = nb_regs; i < nb_iargs; i++) { 3448dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 344939cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP 345039cf05d3Sbellard stack_offset -= sizeof(tcg_target_long); 345139cf05d3Sbellard #endif 345239cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 345343439139SRichard Henderson ts = arg_temp(arg); 345440ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 3455b722452aSRichard Henderson s->reserved_regs, 0); 3456e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 345739cf05d3Sbellard } 345839cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP 345939cf05d3Sbellard stack_offset += sizeof(tcg_target_long); 346039cf05d3Sbellard #endif 3461c896fe29Sbellard } 3462c896fe29Sbellard 3463c896fe29Sbellard /* assign input registers */ 3464d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 3465c896fe29Sbellard for (i = 0; i < nb_regs; i++) { 3466dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 346739cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 346843439139SRichard Henderson ts = arg_temp(arg); 3469c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 3470b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 347140ae5c62SRichard Henderson 3472c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 3473c896fe29Sbellard if (ts->reg != reg) { 34743b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3475c896fe29Sbellard } 
3476c896fe29Sbellard } else { 3477ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 347840ae5c62SRichard Henderson 347940ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 3480b722452aSRichard Henderson temp_load(s, ts, arg_set, allocated_regs, 0); 3481c896fe29Sbellard } 348240ae5c62SRichard Henderson 3483c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 3484c896fe29Sbellard } 348539cf05d3Sbellard } 3486c896fe29Sbellard 3487c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3488866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 3489866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 349043439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3491c896fe29Sbellard } 3492c896fe29Sbellard } 3493c896fe29Sbellard 3494c896fe29Sbellard /* clobber call registers */ 3495c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3496c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 3497b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 3498c896fe29Sbellard } 3499c896fe29Sbellard } 3500c896fe29Sbellard 350178505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 350278505279SAurelien Jarno they might be read. 
*/ 350378505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 350478505279SAurelien Jarno /* Nothing to do */ 350578505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 350678505279SAurelien Jarno sync_globals(s, allocated_regs); 350778505279SAurelien Jarno } else { 3508e8996ee0Sbellard save_globals(s, allocated_regs); 3509b9c18f56Saurel32 } 3510c896fe29Sbellard 3511cf066674SRichard Henderson tcg_out_call(s, func_addr); 3512c896fe29Sbellard 3513c896fe29Sbellard /* assign output registers and emit moves if needed */ 3514c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 3515dd186292SRichard Henderson arg = op->args[i]; 351643439139SRichard Henderson ts = arg_temp(arg); 3517c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 3518eabb7b91SAurelien Jarno tcg_debug_assert(s->reg_to_temp[reg] == NULL); 351934b1a49cSRichard Henderson 3520c896fe29Sbellard if (ts->fixed_reg) { 3521c896fe29Sbellard if (ts->reg != reg) { 35223b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3523c896fe29Sbellard } 3524c896fe29Sbellard } else { 3525639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3526f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3527639368ddSAurelien Jarno } 3528c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3529c896fe29Sbellard ts->reg = reg; 3530c896fe29Sbellard ts->mem_coherent = 0; 3531f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3532ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 353398b4e186SRichard Henderson temp_sync(s, ts, allocated_regs, 0, IS_DEAD_ARG(i)); 353459d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3535f8bf00f1SRichard Henderson temp_dead(s, ts); 3536c896fe29Sbellard } 3537c896fe29Sbellard } 35388c11ad25SAurelien Jarno } 3539c896fe29Sbellard } 3540c896fe29Sbellard 3541c896fe29Sbellard #ifdef CONFIG_PROFILER 3542c896fe29Sbellard 3543c3fac113SEmilio G. Cota /* avoid copy/paste errors */ 3544c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field) \ 3545c3fac113SEmilio G. 
Cota do { \ 3546c3fac113SEmilio G. Cota (to)->field += atomic_read(&((from)->field)); \ 3547c3fac113SEmilio G. Cota } while (0) 3548c896fe29Sbellard 3549c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field) \ 3550c3fac113SEmilio G. Cota do { \ 3551c3fac113SEmilio G. Cota typeof((from)->field) val__ = atomic_read(&((from)->field)); \ 3552c3fac113SEmilio G. Cota if (val__ > (to)->field) { \ 3553c3fac113SEmilio G. Cota (to)->field = val__; \ 3554c3fac113SEmilio G. Cota } \ 3555c3fac113SEmilio G. Cota } while (0) 3556c3fac113SEmilio G. Cota 3557c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */ 3558c3fac113SEmilio G. Cota static inline 3559c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table) 3560c896fe29Sbellard { 35613468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 3562c3fac113SEmilio G. Cota unsigned int i; 3563c3fac113SEmilio G. Cota 35643468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 35653468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 35663468b59eSEmilio G. Cota const TCGProfile *orig = &s->prof; 3567c3fac113SEmilio G. Cota 3568c3fac113SEmilio G. Cota if (counters) { 356972fd2efbSEmilio G. Cota PROF_ADD(prof, orig, cpu_exec_time); 3570c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count1); 3571c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count); 3572c3fac113SEmilio G. Cota PROF_ADD(prof, orig, op_count); 3573c3fac113SEmilio G. Cota PROF_MAX(prof, orig, op_count_max); 3574c3fac113SEmilio G. Cota PROF_ADD(prof, orig, temp_count); 3575c3fac113SEmilio G. Cota PROF_MAX(prof, orig, temp_count_max); 3576c3fac113SEmilio G. Cota PROF_ADD(prof, orig, del_op_count); 3577c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_in_len); 3578c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_out_len); 3579c3fac113SEmilio G. Cota PROF_ADD(prof, orig, search_out_len); 3580c3fac113SEmilio G. Cota PROF_ADD(prof, orig, interm_time); 3581c3fac113SEmilio G. 
Cota PROF_ADD(prof, orig, code_time); 3582c3fac113SEmilio G. Cota PROF_ADD(prof, orig, la_time); 3583c3fac113SEmilio G. Cota PROF_ADD(prof, orig, opt_time); 3584c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_count); 3585c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_time); 3586c3fac113SEmilio G. Cota } 3587c3fac113SEmilio G. Cota if (table) { 3588c896fe29Sbellard int i; 3589d70724ceSzhanghailiang 359015fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 3591c3fac113SEmilio G. Cota PROF_ADD(prof, orig, table_op_count[i]); 3592c3fac113SEmilio G. Cota } 3593c3fac113SEmilio G. Cota } 3594c3fac113SEmilio G. Cota } 3595c3fac113SEmilio G. Cota } 3596c3fac113SEmilio G. Cota 3597c3fac113SEmilio G. Cota #undef PROF_ADD 3598c3fac113SEmilio G. Cota #undef PROF_MAX 3599c3fac113SEmilio G. Cota 3600c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof) 3601c3fac113SEmilio G. Cota { 3602c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, true, false); 3603c3fac113SEmilio G. Cota } 3604c3fac113SEmilio G. Cota 3605c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof) 3606c3fac113SEmilio G. Cota { 3607c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, false, true); 3608c3fac113SEmilio G. Cota } 3609c3fac113SEmilio G. Cota 3610c3fac113SEmilio G. Cota void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3611c3fac113SEmilio G. Cota { 3612c3fac113SEmilio G. Cota TCGProfile prof = {}; 3613c3fac113SEmilio G. Cota int i; 3614c3fac113SEmilio G. Cota 3615c3fac113SEmilio G. Cota tcg_profile_snapshot_table(&prof); 3616c3fac113SEmilio G. Cota for (i = 0; i < NB_OPS; i++) { 3617246ae24dSMax Filippov cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, 3618c3fac113SEmilio G. Cota prof.table_op_count[i]); 3619c896fe29Sbellard } 3620c896fe29Sbellard } 362172fd2efbSEmilio G. Cota 362272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 362372fd2efbSEmilio G. Cota { 362472fd2efbSEmilio G. 
Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 362572fd2efbSEmilio G. Cota unsigned int i; 362672fd2efbSEmilio G. Cota int64_t ret = 0; 362772fd2efbSEmilio G. Cota 362872fd2efbSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 362972fd2efbSEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 363072fd2efbSEmilio G. Cota const TCGProfile *prof = &s->prof; 363172fd2efbSEmilio G. Cota 363272fd2efbSEmilio G. Cota ret += atomic_read(&prof->cpu_exec_time); 363372fd2efbSEmilio G. Cota } 363472fd2efbSEmilio G. Cota return ret; 363572fd2efbSEmilio G. Cota } 3636246ae24dSMax Filippov #else 3637246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3638246ae24dSMax Filippov { 3639246ae24dSMax Filippov cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3640246ae24dSMax Filippov } 364172fd2efbSEmilio G. Cota 364272fd2efbSEmilio G. Cota int64_t tcg_cpu_exec_time(void) 364372fd2efbSEmilio G. Cota { 364472fd2efbSEmilio G. Cota error_report("%s: TCG profiler not compiled", __func__); 364572fd2efbSEmilio G. Cota exit(EXIT_FAILURE); 364672fd2efbSEmilio G. Cota } 3647c896fe29Sbellard #endif 3648c896fe29Sbellard 3649c896fe29Sbellard 36505bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb) 3651c896fe29Sbellard { 3652c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER 3653c3fac113SEmilio G. Cota TCGProfile *prof = &s->prof; 3654c3fac113SEmilio G. Cota #endif 365515fa08f8SRichard Henderson int i, num_insns; 365615fa08f8SRichard Henderson TCGOp *op; 3657c896fe29Sbellard 365804fe6400SRichard Henderson #ifdef CONFIG_PROFILER 365904fe6400SRichard Henderson { 3660c1f543b7SEmilio G. Cota int n = 0; 366104fe6400SRichard Henderson 366215fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 366315fa08f8SRichard Henderson n++; 366415fa08f8SRichard Henderson } 3665c3fac113SEmilio G. Cota atomic_set(&prof->op_count, prof->op_count + n); 3666c3fac113SEmilio G. Cota if (n > prof->op_count_max) { 3667c3fac113SEmilio G. 
Cota atomic_set(&prof->op_count_max, n); 366804fe6400SRichard Henderson } 366904fe6400SRichard Henderson 367004fe6400SRichard Henderson n = s->nb_temps; 3671c3fac113SEmilio G. Cota atomic_set(&prof->temp_count, prof->temp_count + n); 3672c3fac113SEmilio G. Cota if (n > prof->temp_count_max) { 3673c3fac113SEmilio G. Cota atomic_set(&prof->temp_count_max, n); 367404fe6400SRichard Henderson } 367504fe6400SRichard Henderson } 367604fe6400SRichard Henderson #endif 367704fe6400SRichard Henderson 3678c896fe29Sbellard #ifdef DEBUG_DISAS 3679d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 3680d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 36811ee73216SRichard Henderson qemu_log_lock(); 368293fcfe39Saliguori qemu_log("OP:\n"); 36831894f69aSRichard Henderson tcg_dump_ops(s, false); 368493fcfe39Saliguori qemu_log("\n"); 36851ee73216SRichard Henderson qemu_log_unlock(); 3686c896fe29Sbellard } 3687c896fe29Sbellard #endif 3688c896fe29Sbellard 3689c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 3690c3fac113SEmilio G. Cota atomic_set(&prof->opt_time, prof->opt_time - profile_getclock()); 3691c5cc28ffSAurelien Jarno #endif 3692c5cc28ffSAurelien Jarno 36938f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 3694c45cb8bbSRichard Henderson tcg_optimize(s); 36958f2e8c07SKirill Batuzov #endif 36968f2e8c07SKirill Batuzov 3697a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3698c3fac113SEmilio G. Cota atomic_set(&prof->opt_time, prof->opt_time + profile_getclock()); 3699c3fac113SEmilio G. 
Cota atomic_set(&prof->la_time, prof->la_time - profile_getclock()); 3700a23a9ec6Sbellard #endif 3701c5cc28ffSAurelien Jarno 3702b4fc67c7SRichard Henderson reachable_code_pass(s); 3703b83eabeaSRichard Henderson liveness_pass_1(s); 37045a18407fSRichard Henderson 37055a18407fSRichard Henderson if (s->nb_indirects > 0) { 37065a18407fSRichard Henderson #ifdef DEBUG_DISAS 37075a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 37085a18407fSRichard Henderson && qemu_log_in_addr_range(tb->pc))) { 37091ee73216SRichard Henderson qemu_log_lock(); 37105a18407fSRichard Henderson qemu_log("OP before indirect lowering:\n"); 37111894f69aSRichard Henderson tcg_dump_ops(s, false); 37125a18407fSRichard Henderson qemu_log("\n"); 37131ee73216SRichard Henderson qemu_log_unlock(); 37145a18407fSRichard Henderson } 37155a18407fSRichard Henderson #endif 37165a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 3717b83eabeaSRichard Henderson if (liveness_pass_2(s)) { 37185a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 3719b83eabeaSRichard Henderson liveness_pass_1(s); 37205a18407fSRichard Henderson } 37215a18407fSRichard Henderson } 3722c5cc28ffSAurelien Jarno 3723a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3724c3fac113SEmilio G. 
Cota atomic_set(&prof->la_time, prof->la_time + profile_getclock()); 3725a23a9ec6Sbellard #endif 3726c896fe29Sbellard 3727c896fe29Sbellard #ifdef DEBUG_DISAS 3728d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 3729d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 37301ee73216SRichard Henderson qemu_log_lock(); 3731c5cc28ffSAurelien Jarno qemu_log("OP after optimization and liveness analysis:\n"); 37321894f69aSRichard Henderson tcg_dump_ops(s, true); 373393fcfe39Saliguori qemu_log("\n"); 37341ee73216SRichard Henderson qemu_log_unlock(); 3735c896fe29Sbellard } 3736c896fe29Sbellard #endif 3737c896fe29Sbellard 3738c896fe29Sbellard tcg_reg_alloc_start(s); 3739c896fe29Sbellard 3740e7e168f4SEmilio G. Cota s->code_buf = tb->tc.ptr; 3741e7e168f4SEmilio G. Cota s->code_ptr = tb->tc.ptr; 3742c896fe29Sbellard 3743659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 37446001f772SLaurent Vivier QSIMPLEQ_INIT(&s->ldst_labels); 3745659ef5cbSRichard Henderson #endif 374657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 374757a26946SRichard Henderson s->pool_labels = NULL; 374857a26946SRichard Henderson #endif 37499ecefc84SRichard Henderson 3750fca8a500SRichard Henderson num_insns = -1; 375115fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 3752c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 3753b3db8758Sblueswir1 3754c896fe29Sbellard #ifdef CONFIG_PROFILER 3755c3fac113SEmilio G. 
Cota atomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1); 3756c896fe29Sbellard #endif 3757c45cb8bbSRichard Henderson 3758c896fe29Sbellard switch (opc) { 3759c896fe29Sbellard case INDEX_op_mov_i32: 3760c896fe29Sbellard case INDEX_op_mov_i64: 3761d2fd745fSRichard Henderson case INDEX_op_mov_vec: 3762dd186292SRichard Henderson tcg_reg_alloc_mov(s, op); 3763c896fe29Sbellard break; 3764e8996ee0Sbellard case INDEX_op_movi_i32: 3765e8996ee0Sbellard case INDEX_op_movi_i64: 3766d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 3767dd186292SRichard Henderson tcg_reg_alloc_movi(s, op); 3768e8996ee0Sbellard break; 3769765b842aSRichard Henderson case INDEX_op_insn_start: 3770fca8a500SRichard Henderson if (num_insns >= 0) { 37719f754620SRichard Henderson size_t off = tcg_current_code_size(s); 37729f754620SRichard Henderson s->gen_insn_end_off[num_insns] = off; 37739f754620SRichard Henderson /* Assert that we do not overflow our stored offset. */ 37749f754620SRichard Henderson assert(s->gen_insn_end_off[num_insns] == off); 3775fca8a500SRichard Henderson } 3776fca8a500SRichard Henderson num_insns++; 3777bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 3778bad729e2SRichard Henderson target_ulong a; 3779bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 3780efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 3781bad729e2SRichard Henderson #else 3782efee3746SRichard Henderson a = op->args[i]; 3783bad729e2SRichard Henderson #endif 3784fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 3785bad729e2SRichard Henderson } 3786c896fe29Sbellard break; 37875ff9d6a4Sbellard case INDEX_op_discard: 378843439139SRichard Henderson temp_dead(s, arg_temp(op->args[0])); 37895ff9d6a4Sbellard break; 3790c896fe29Sbellard case INDEX_op_set_label: 3791e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 3792efee3746SRichard Henderson tcg_out_label(s, arg_label(op->args[0]), s->code_ptr); 
3793c896fe29Sbellard break; 3794c896fe29Sbellard case INDEX_op_call: 3795dd186292SRichard Henderson tcg_reg_alloc_call(s, op); 3796c45cb8bbSRichard Henderson break; 3797c896fe29Sbellard default: 379825c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. */ 3799be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 3800c896fe29Sbellard /* Note: in order to speed up the code, it would be much 3801c896fe29Sbellard faster to have specialized register allocator functions for 3802c896fe29Sbellard some common argument patterns */ 3803dd186292SRichard Henderson tcg_reg_alloc_op(s, op); 3804c896fe29Sbellard break; 3805c896fe29Sbellard } 38068d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 3807c896fe29Sbellard check_regs(s); 3808c896fe29Sbellard #endif 3809b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. The assumption is that any 3810b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 3811b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 3812b125f9dcSRichard Henderson generating code without having to check during generation. 
*/ 3813644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 3814b125f9dcSRichard Henderson return -1; 3815b125f9dcSRichard Henderson } 3816c896fe29Sbellard } 3817fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 3818fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 3819c45cb8bbSRichard Henderson 3820b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 3821659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 3822659ef5cbSRichard Henderson if (!tcg_out_ldst_finalize(s)) { 382323dceda6SRichard Henderson return -1; 382423dceda6SRichard Henderson } 3825659ef5cbSRichard Henderson #endif 382657a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 382757a26946SRichard Henderson if (!tcg_out_pool_finalize(s)) { 382857a26946SRichard Henderson return -1; 382957a26946SRichard Henderson } 383057a26946SRichard Henderson #endif 3831c896fe29Sbellard 3832c896fe29Sbellard /* flush instruction cache */ 38331813e175SRichard Henderson flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr); 38342aeabc08SStefan Weil 38351813e175SRichard Henderson return tcg_current_code_size(s); 3836c896fe29Sbellard } 3837c896fe29Sbellard 3838a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3839405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3840a23a9ec6Sbellard { 3841c3fac113SEmilio G. Cota TCGProfile prof = {}; 3842c3fac113SEmilio G. Cota const TCGProfile *s; 3843c3fac113SEmilio G. Cota int64_t tb_count; 3844c3fac113SEmilio G. Cota int64_t tb_div_count; 3845c3fac113SEmilio G. Cota int64_t tot; 3846c3fac113SEmilio G. Cota 3847c3fac113SEmilio G. Cota tcg_profile_snapshot_counters(&prof); 3848c3fac113SEmilio G. Cota s = &prof; 3849c3fac113SEmilio G. Cota tb_count = s->tb_count; 3850c3fac113SEmilio G. Cota tb_div_count = tb_count ? tb_count : 1; 3851c3fac113SEmilio G. 
Cota tot = s->interm_time + s->code_time; 3852a23a9ec6Sbellard 3853a23a9ec6Sbellard cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n", 3854a23a9ec6Sbellard tot, tot / 2.4e9); 3855a23a9ec6Sbellard cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n", 3856fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 3857fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 3858fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 3859a23a9ec6Sbellard cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n", 3860fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 3861a23a9ec6Sbellard cpu_fprintf(f, "deleted ops/TB %0.2f\n", 3862fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 3863a23a9ec6Sbellard cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n", 3864fca8a500SRichard Henderson (double)s->temp_count / tb_div_count, s->temp_count_max); 3865fca8a500SRichard Henderson cpu_fprintf(f, "avg host code/TB %0.1f\n", 3866fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 3867fca8a500SRichard Henderson cpu_fprintf(f, "avg search data/TB %0.1f\n", 3868fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 3869a23a9ec6Sbellard 3870a23a9ec6Sbellard cpu_fprintf(f, "cycles/op %0.1f\n", 3871a23a9ec6Sbellard s->op_count ? (double)tot / s->op_count : 0); 3872a23a9ec6Sbellard cpu_fprintf(f, "cycles/in byte %0.1f\n", 3873a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 3874a23a9ec6Sbellard cpu_fprintf(f, "cycles/out byte %0.1f\n", 3875a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 3876fca8a500SRichard Henderson cpu_fprintf(f, "cycles/search byte %0.1f\n", 3877fca8a500SRichard Henderson s->search_out_len ? 
(double)tot / s->search_out_len : 0); 3878fca8a500SRichard Henderson if (tot == 0) { 3879a23a9ec6Sbellard tot = 1; 3880fca8a500SRichard Henderson } 3881a23a9ec6Sbellard cpu_fprintf(f, " gen_interm time %0.1f%%\n", 3882a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 3883a23a9ec6Sbellard cpu_fprintf(f, " gen_code time %0.1f%%\n", 3884a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 3885c5cc28ffSAurelien Jarno cpu_fprintf(f, "optim./code time %0.1f%%\n", 3886c5cc28ffSAurelien Jarno (double)s->opt_time / (s->code_time ? s->code_time : 1) 3887c5cc28ffSAurelien Jarno * 100.0); 3888a23a9ec6Sbellard cpu_fprintf(f, "liveness/code time %0.1f%%\n", 3889a23a9ec6Sbellard (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0); 3890a23a9ec6Sbellard cpu_fprintf(f, "cpu_restore count %" PRId64 "\n", 3891a23a9ec6Sbellard s->restore_count); 3892a23a9ec6Sbellard cpu_fprintf(f, " avg cycles %0.1f\n", 3893a23a9ec6Sbellard s->restore_count ? (double)s->restore_time / s->restore_count : 0); 3894a23a9ec6Sbellard } 3895a23a9ec6Sbellard #else 3896405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3897a23a9ec6Sbellard { 389824bf7b3aSbellard cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3899a23a9ec6Sbellard } 3900a23a9ec6Sbellard #endif 3901813da627SRichard Henderson 3902813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 39035872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 39045872bbf2SRichard Henderson 39055872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 39065872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 39075872bbf2SRichard Henderson 39085872bbf2SRichard Henderson (2) Define tcg_register_jit. This should create a buffer containing 39095872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 39105872bbf2SRichard Henderson prologue unwind info for the tcg machine. 
39115872bbf2SRichard Henderson 39125872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 39135872bbf2SRichard Henderson */ 3914813da627SRichard Henderson 3915813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */ 3916813da627SRichard Henderson typedef enum { 3917813da627SRichard Henderson JIT_NOACTION = 0, 3918813da627SRichard Henderson JIT_REGISTER_FN, 3919813da627SRichard Henderson JIT_UNREGISTER_FN 3920813da627SRichard Henderson } jit_actions_t; 3921813da627SRichard Henderson 3922813da627SRichard Henderson struct jit_code_entry { 3923813da627SRichard Henderson struct jit_code_entry *next_entry; 3924813da627SRichard Henderson struct jit_code_entry *prev_entry; 3925813da627SRichard Henderson const void *symfile_addr; 3926813da627SRichard Henderson uint64_t symfile_size; 3927813da627SRichard Henderson }; 3928813da627SRichard Henderson 3929813da627SRichard Henderson struct jit_descriptor { 3930813da627SRichard Henderson uint32_t version; 3931813da627SRichard Henderson uint32_t action_flag; 3932813da627SRichard Henderson struct jit_code_entry *relevant_entry; 3933813da627SRichard Henderson struct jit_code_entry *first_entry; 3934813da627SRichard Henderson }; 3935813da627SRichard Henderson 3936813da627SRichard Henderson void __jit_debug_register_code(void) __attribute__((noinline)); 3937813da627SRichard Henderson void __jit_debug_register_code(void) 3938813da627SRichard Henderson { 3939813da627SRichard Henderson asm(""); 3940813da627SRichard Henderson } 3941813da627SRichard Henderson 3942813da627SRichard Henderson /* Must statically initialize the version, because GDB may check 3943813da627SRichard Henderson the version before we can set it. */ 3944813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 }; 3945813da627SRichard Henderson 3946813da627SRichard Henderson /* End GDB interface. 
*/ 3947813da627SRichard Henderson 3948813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 3949813da627SRichard Henderson { 3950813da627SRichard Henderson const char *p = strtab + 1; 3951813da627SRichard Henderson 3952813da627SRichard Henderson while (1) { 3953813da627SRichard Henderson if (strcmp(p, str) == 0) { 3954813da627SRichard Henderson return p - strtab; 3955813da627SRichard Henderson } 3956813da627SRichard Henderson p += strlen(p) + 1; 3957813da627SRichard Henderson } 3958813da627SRichard Henderson } 3959813da627SRichard Henderson 39605872bbf2SRichard Henderson static void tcg_register_jit_int(void *buf_ptr, size_t buf_size, 39612c90784aSRichard Henderson const void *debug_frame, 39622c90784aSRichard Henderson size_t debug_frame_size) 3963813da627SRichard Henderson { 39645872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 39655872bbf2SRichard Henderson uint32_t len; 39665872bbf2SRichard Henderson uint16_t version; 39675872bbf2SRichard Henderson uint32_t abbrev; 39685872bbf2SRichard Henderson uint8_t ptr_size; 39695872bbf2SRichard Henderson uint8_t cu_die; 39705872bbf2SRichard Henderson uint16_t cu_lang; 39715872bbf2SRichard Henderson uintptr_t cu_low_pc; 39725872bbf2SRichard Henderson uintptr_t cu_high_pc; 39735872bbf2SRichard Henderson uint8_t fn_die; 39745872bbf2SRichard Henderson char fn_name[16]; 39755872bbf2SRichard Henderson uintptr_t fn_low_pc; 39765872bbf2SRichard Henderson uintptr_t fn_high_pc; 39775872bbf2SRichard Henderson uint8_t cu_eoc; 39785872bbf2SRichard Henderson }; 3979813da627SRichard Henderson 3980813da627SRichard Henderson struct ElfImage { 3981813da627SRichard Henderson ElfW(Ehdr) ehdr; 3982813da627SRichard Henderson ElfW(Phdr) phdr; 39835872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 39845872bbf2SRichard Henderson ElfW(Sym) sym[2]; 39855872bbf2SRichard Henderson struct DebugInfo di; 39865872bbf2SRichard Henderson uint8_t da[24]; 39875872bbf2SRichard Henderson char str[80]; 
39885872bbf2SRichard Henderson }; 39895872bbf2SRichard Henderson 39905872bbf2SRichard Henderson struct ElfImage *img; 39915872bbf2SRichard Henderson 39925872bbf2SRichard Henderson static const struct ElfImage img_template = { 39935872bbf2SRichard Henderson .ehdr = { 39945872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 39955872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 39965872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 39975872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 39985872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 39995872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 40005872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 40015872bbf2SRichard Henderson .e_type = ET_EXEC, 40025872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 40035872bbf2SRichard Henderson .e_version = EV_CURRENT, 40045872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 40055872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 40065872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 40075872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 40085872bbf2SRichard Henderson .e_phnum = 1, 40095872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 40105872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 40115872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 4012abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 4013abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 4014abbb3eaeSRichard Henderson #endif 4015abbb3eaeSRichard Henderson #ifdef ELF_OSABI 4016abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 4017abbb3eaeSRichard Henderson #endif 40185872bbf2SRichard Henderson }, 40195872bbf2SRichard Henderson .phdr = { 40205872bbf2SRichard Henderson .p_type = PT_LOAD, 40215872bbf2SRichard Henderson .p_flags = PF_X, 40225872bbf2SRichard Henderson }, 40235872bbf2SRichard Henderson .shdr = { 40245872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 
40255872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 40265872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 40275872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 40285872bbf2SRichard Henderson will not look for contents. We can record any address. */ 40295872bbf2SRichard Henderson [1] = { /* .text */ 40305872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 40315872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 40325872bbf2SRichard Henderson }, 40335872bbf2SRichard Henderson [2] = { /* .debug_info */ 40345872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 40355872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 40365872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 40375872bbf2SRichard Henderson }, 40385872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 40395872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 40405872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 40415872bbf2SRichard Henderson .sh_size = sizeof(img->da), 40425872bbf2SRichard Henderson }, 40435872bbf2SRichard Henderson [4] = { /* .debug_frame */ 40445872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 40455872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 40465872bbf2SRichard Henderson }, 40475872bbf2SRichard Henderson [5] = { /* .symtab */ 40485872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 40495872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 40505872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 40515872bbf2SRichard Henderson .sh_info = 1, 40525872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 40535872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 40545872bbf2SRichard Henderson }, 40555872bbf2SRichard Henderson [6] = { /* .strtab */ 40565872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 40575872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, 
str), 40585872bbf2SRichard Henderson .sh_size = sizeof(img->str), 40595872bbf2SRichard Henderson } 40605872bbf2SRichard Henderson }, 40615872bbf2SRichard Henderson .sym = { 40625872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 40635872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 40645872bbf2SRichard Henderson .st_shndx = 1, 40655872bbf2SRichard Henderson } 40665872bbf2SRichard Henderson }, 40675872bbf2SRichard Henderson .di = { 40685872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 40695872bbf2SRichard Henderson .version = 2, 40705872bbf2SRichard Henderson .ptr_size = sizeof(void *), 40715872bbf2SRichard Henderson .cu_die = 1, 40725872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 40735872bbf2SRichard Henderson .fn_die = 2, 40745872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 40755872bbf2SRichard Henderson }, 40765872bbf2SRichard Henderson .da = { 40775872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 40785872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 40795872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 40805872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 40815872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 40825872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 40835872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 40845872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 40855872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 40865872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 40875872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 40885872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 40895872bbf2SRichard Henderson 0 /* no more abbrev */ 40905872bbf2SRichard Henderson }, 40915872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 40925872bbf2SRichard Henderson 
".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 4093813da627SRichard Henderson }; 4094813da627SRichard Henderson 4095813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 4096813da627SRichard Henderson static struct jit_code_entry one_entry; 4097813da627SRichard Henderson 40985872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 4099813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 41002c90784aSRichard Henderson DebugFrameHeader *dfh; 4101813da627SRichard Henderson 41025872bbf2SRichard Henderson img = g_malloc(img_size); 41035872bbf2SRichard Henderson *img = img_template; 4104813da627SRichard Henderson 41055872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 41065872bbf2SRichard Henderson img->phdr.p_paddr = buf; 41075872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 4108813da627SRichard Henderson 41095872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 41105872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 41115872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 4112813da627SRichard Henderson 41135872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 41145872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 41155872bbf2SRichard Henderson 41165872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 41175872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 41185872bbf2SRichard Henderson 41195872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 41205872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 41215872bbf2SRichard Henderson 41225872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 41235872bbf2SRichard Henderson img->sym[1].st_value = buf; 41245872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 
41255872bbf2SRichard Henderson 41265872bbf2SRichard Henderson img->di.cu_low_pc = buf; 412745aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 41285872bbf2SRichard Henderson img->di.fn_low_pc = buf; 412945aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 4130813da627SRichard Henderson 41312c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 41322c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 41332c90784aSRichard Henderson dfh->fde.func_start = buf; 41342c90784aSRichard Henderson dfh->fde.func_len = buf_size; 41352c90784aSRichard Henderson 4136813da627SRichard Henderson #ifdef DEBUG_JIT 4137813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 4138813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 4139813da627SRichard Henderson { 4140813da627SRichard Henderson FILE *f = fopen("/tmp/qemu.jit", "w+b"); 4141813da627SRichard Henderson if (f) { 41425872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 4143813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. */ 4144813da627SRichard Henderson } 4145813da627SRichard Henderson fclose(f); 4146813da627SRichard Henderson } 4147813da627SRichard Henderson } 4148813da627SRichard Henderson #endif 4149813da627SRichard Henderson 4150813da627SRichard Henderson one_entry.symfile_addr = img; 4151813da627SRichard Henderson one_entry.symfile_size = img_size; 4152813da627SRichard Henderson 4153813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 4154813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 4155813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 4156813da627SRichard Henderson __jit_debug_register_code(); 4157813da627SRichard Henderson } 4158813da627SRichard Henderson #else 41595872bbf2SRichard Henderson /* No support for the feature. 
Provide the entry point expected by exec.c, 41605872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 4161813da627SRichard Henderson 4162813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 41632c90784aSRichard Henderson const void *debug_frame, 41642c90784aSRichard Henderson size_t debug_frame_size) 4165813da627SRichard Henderson { 4166813da627SRichard Henderson } 4167813da627SRichard Henderson 4168813da627SRichard Henderson void tcg_register_jit(void *buf, size_t buf_size) 4169813da627SRichard Henderson { 4170813da627SRichard Henderson } 4171813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 4172db432672SRichard Henderson 4173db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec 4174db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...) 4175db432672SRichard Henderson { 4176db432672SRichard Henderson g_assert_not_reached(); 4177db432672SRichard Henderson } 4178db432672SRichard Henderson #endif 4179