/*
 * Tiny Code Generator for QEMU
 *
 * Copyright (c) 2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

/* define it to use liveness analysis (better code) */
#define USE_TCG_OPTIMIZATIONS

#include "qemu/osdep.h"

/*
 * Define to dump the ELF file used to communicate with GDB.
 * NOTE(review): the original wording was "jump the ELF file"; presumably a
 * typo for "dump" -- confirm against the DEBUG_JIT code further down the file.
 */
#undef DEBUG_JIT

#include "qemu/cutils.h"
#include "qemu/host-utils.h"
#include "qemu/timer.h"

/* Note: the long term plan is to reduce the dependencies on the QEMU
   CPU definitions. Currently they are used for qemu_ld/st
   instructions */
#define NO_CPU_IO_DEFS
#include "cpu.h"

#include "exec/cpu-common.h"
#include "exec/exec-all.h"

#include "tcg-op.h"

/*
 * ELF_CLASS follows the host pointer width (32-bit when UINTPTR_MAX equals
 * UINT32_MAX, 64-bit otherwise); ELF_DATA follows the host byte order.
 * Both are defined before "elf.h" is included below.
 */
#if UINTPTR_MAX == UINT32_MAX
# define ELF_CLASS  ELFCLASS32
#else
# define ELF_CLASS  ELFCLASS64
#endif
#ifdef HOST_WORDS_BIGENDIAN
# define ELF_DATA   ELFDATA2MSB
#else
# define ELF_DATA   ELFDATA2LSB
#endif

#include "elf.h"
#include "exec/log.h"
#include "sysemu/sysemu.h"

/* Forward declarations for functions declared in tcg-target.inc.c and
   used here. */
static void tcg_target_init(TCGContext *s);
static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode);
static void tcg_target_qemu_prologue(TCGContext *s);
static void patch_reloc(tcg_insn_unit *code_ptr, int type,
                        intptr_t value, intptr_t addend);

/* The CIE and FDE header definitions will be common to all hosts.  */

/*
 * CIE header.  'len' is aligned to the size of a host pointer; the struct
 * itself is not packed (unlike the FDE header below).
 */
typedef struct {
    uint32_t len __attribute__((aligned((sizeof(void *)))));
    uint32_t id;
    uint8_t version;
    char augmentation[1];
    uint8_t code_align;
    uint8_t data_align;
    uint8_t return_column;
} DebugFrameCIE;

/*
 * FDE header (packed).  func_start/func_len are pointer-sized; presumably
 * they describe the generated-code range -- confirm against the code that
 * fills them in.
 */
typedef struct QEMU_PACKED {
    uint32_t len __attribute__((aligned((sizeof(void *)))));
    uint32_t cie_offset;
    uintptr_t func_start;
    uintptr_t func_len;
} DebugFrameFDEHeader;

/* A CIE immediately followed by one FDE header (packed). */
typedef struct QEMU_PACKED {
    DebugFrameCIE cie;
    DebugFrameFDEHeader fde;
} DebugFrameHeader;

/*
 * Declared with the 'unused' attribute, presumably so that configurations
 * which never call it do not trigger an unused-function warning.
 */
static void tcg_register_jit_int(void *buf, size_t size,
                                 const void *debug_frame,
                                 size_t debug_frame_size)
    __attribute__((unused));

/* Forward declarations for functions declared and used in tcg-target.inc.c. */
static const char *target_parse_constraint(TCGArgConstraint *ct,
                                           const char *ct_str, TCGType type);
static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1,
                       intptr_t arg2);
static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg);
static void tcg_out_movi(TCGContext *s, TCGType type,
                         TCGReg ret, tcg_target_long arg);
static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
                       const int *const_args);
#if TCG_TARGET_MAYBE_vec
static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl,
                           unsigned vece, const TCGArg *args,
                           const int *const_args);
#else
/*
 * Stub used when TCG_TARGET_MAYBE_vec is false: it keeps callers compiling
 * and aborts via g_assert_not_reached() if it is ever actually executed.
 */
static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl,
                                  unsigned vece, const TCGArg *args,
                                  const int *const_args)
{
    g_assert_not_reached();
}
#endif
static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1,
                       intptr_t arg2);
static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
                        TCGReg base, intptr_t ofs);
static void tcg_out_call(TCGContext *s, tcg_insn_unit *target);
static int tcg_target_const_match(tcg_target_long val, TCGType type,
                                  const TCGArgConstraint *arg_ct);
#ifdef TCG_TARGET_NEED_LDST_LABELS
/* Only declared for targets that define TCG_TARGET_NEED_LDST_LABELS. */
static bool tcg_out_ldst_finalize(TCGContext *s);
#endif

/*
 * Distance, in bytes, between the end of a region and the high-water mark
 * that tcg_region_assign() stores in code_gen_highwater.
 */
#define TCG_HIGHWATER 1024

/*
 * Array of TCG contexts and the number of entries in it; both are read with
 * atomic_read() by tcg_region_reset_all().
 */
static TCGContext **tcg_ctxs;
static unsigned int n_tcg_ctxs;
TCGv_env cpu_env = 0;

/*
 * Per-region tree of translation blocks.  'lock' is taken around every
 * access to 'tree' by the tcg_tb_*() and tcg_region_tree_*() functions.
 */
struct tcg_region_tree {
    QemuMutex lock;
    GTree *tree;
    /* padding to avoid false sharing is computed at run-time */
};

/*
 * We divide code_gen_buffer into equally-sized "regions" that TCG threads
 * dynamically allocate from as demand dictates. Given appropriate region
 * sizing, this minimizes flushes even when some TCG threads generate a lot
 * more code than others.
 */
struct tcg_region_state {
    QemuMutex lock;

    /* fields set at init time */
    void *start;
    void *start_aligned;
    void *end;
    size_t n;
    size_t size; /* size of one region */
    size_t stride; /* .size + guard size */

    /* fields protected by the lock */
    size_t current; /* current region index */
    size_t agg_size_full; /* aggregate size of full regions */
};

Cota static struct tcg_region_state region; 167be2cdc5eSEmilio G. Cota /* 168be2cdc5eSEmilio G. Cota * This is an array of struct tcg_region_tree's, with padding. 169be2cdc5eSEmilio G. Cota * We use void * to simplify the computation of region_trees[i]; each 170be2cdc5eSEmilio G. Cota * struct is found every tree_size bytes. 171be2cdc5eSEmilio G. Cota */ 172be2cdc5eSEmilio G. Cota static void *region_trees; 173be2cdc5eSEmilio G. Cota static size_t tree_size; 174d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT]; 175b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 176c896fe29Sbellard 1771813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1784196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 179c896fe29Sbellard { 180c896fe29Sbellard *s->code_ptr++ = v; 181c896fe29Sbellard } 182c896fe29Sbellard 1834196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1844196dca6SPeter Maydell uint8_t v) 1855c53bb81SPeter Maydell { 1861813e175SRichard Henderson *p = v; 1875c53bb81SPeter Maydell } 1881813e175SRichard Henderson #endif 1895c53bb81SPeter Maydell 1901813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1914196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 192c896fe29Sbellard { 1931813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1941813e175SRichard Henderson *s->code_ptr++ = v; 1951813e175SRichard Henderson } else { 1961813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1974387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1981813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 1991813e175SRichard Henderson } 200c896fe29Sbellard } 201c896fe29Sbellard 2024196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 2034196dca6SPeter Maydell uint16_t v) 2045c53bb81SPeter Maydell { 
2051813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 2061813e175SRichard Henderson *p = v; 2071813e175SRichard Henderson } else { 2085c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2095c53bb81SPeter Maydell } 2101813e175SRichard Henderson } 2111813e175SRichard Henderson #endif 2125c53bb81SPeter Maydell 2131813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 2144196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 215c896fe29Sbellard { 2161813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2171813e175SRichard Henderson *s->code_ptr++ = v; 2181813e175SRichard Henderson } else { 2191813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2204387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2211813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 2221813e175SRichard Henderson } 223c896fe29Sbellard } 224c896fe29Sbellard 2254196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 2264196dca6SPeter Maydell uint32_t v) 2275c53bb81SPeter Maydell { 2281813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2291813e175SRichard Henderson *p = v; 2301813e175SRichard Henderson } else { 2315c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2325c53bb81SPeter Maydell } 2331813e175SRichard Henderson } 2341813e175SRichard Henderson #endif 2355c53bb81SPeter Maydell 2361813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 2374196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 238ac26eb69SRichard Henderson { 2391813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2401813e175SRichard Henderson *s->code_ptr++ = v; 2411813e175SRichard Henderson } else { 2421813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2434387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2441813e175SRichard Henderson s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE); 2451813e175SRichard 
Henderson } 246ac26eb69SRichard Henderson } 247ac26eb69SRichard Henderson 2484196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 2494196dca6SPeter Maydell uint64_t v) 2505c53bb81SPeter Maydell { 2511813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2521813e175SRichard Henderson *p = v; 2531813e175SRichard Henderson } else { 2545c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2555c53bb81SPeter Maydell } 2561813e175SRichard Henderson } 2571813e175SRichard Henderson #endif 2585c53bb81SPeter Maydell 259c896fe29Sbellard /* label relocation processing */ 260c896fe29Sbellard 2611813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 262bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 263c896fe29Sbellard { 264c896fe29Sbellard TCGRelocation *r; 265c896fe29Sbellard 266c896fe29Sbellard if (l->has_value) { 267623e265cSpbrook /* FIXME: This may break relocations on RISC targets that 268623e265cSpbrook modify instruction fields in place. The caller may not have 269623e265cSpbrook written the initial value. 
*/ 270f54b3f92Saurel32 patch_reloc(code_ptr, type, l->u.value, addend); 271c896fe29Sbellard } else { 272c896fe29Sbellard /* add a new relocation entry */ 273c896fe29Sbellard r = tcg_malloc(sizeof(TCGRelocation)); 274c896fe29Sbellard r->type = type; 275c896fe29Sbellard r->ptr = code_ptr; 276c896fe29Sbellard r->addend = addend; 277c896fe29Sbellard r->next = l->u.first_reloc; 278c896fe29Sbellard l->u.first_reloc = r; 279c896fe29Sbellard } 280c896fe29Sbellard } 281c896fe29Sbellard 282bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr) 283c896fe29Sbellard { 2842ba7fae2SRichard Henderson intptr_t value = (intptr_t)ptr; 2851813e175SRichard Henderson TCGRelocation *r; 286c896fe29Sbellard 287eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 2881813e175SRichard Henderson 2891813e175SRichard Henderson for (r = l->u.first_reloc; r != NULL; r = r->next) { 290f54b3f92Saurel32 patch_reloc(r->ptr, r->type, value, r->addend); 291c896fe29Sbellard } 2921813e175SRichard Henderson 293c896fe29Sbellard l->has_value = 1; 2941813e175SRichard Henderson l->u.value_ptr = ptr; 295c896fe29Sbellard } 296c896fe29Sbellard 29742a268c2SRichard Henderson TCGLabel *gen_new_label(void) 298c896fe29Sbellard { 299b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 30051e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 301c896fe29Sbellard 30251e3972cSRichard Henderson *l = (TCGLabel){ 30351e3972cSRichard Henderson .id = s->nb_labels++ 30451e3972cSRichard Henderson }; 30542a268c2SRichard Henderson 30642a268c2SRichard Henderson return l; 307c896fe29Sbellard } 308c896fe29Sbellard 309ce151109SPeter Maydell #include "tcg-target.inc.c" 310c896fe29Sbellard 311be2cdc5eSEmilio G. Cota /* compare a pointer @ptr and a tb_tc @s */ 312be2cdc5eSEmilio G. Cota static int ptr_cmp_tb_tc(const void *ptr, const struct tb_tc *s) 313be2cdc5eSEmilio G. Cota { 314be2cdc5eSEmilio G. Cota if (ptr >= s->ptr + s->size) { 315be2cdc5eSEmilio G. 
Cota return 1; 316be2cdc5eSEmilio G. Cota } else if (ptr < s->ptr) { 317be2cdc5eSEmilio G. Cota return -1; 318be2cdc5eSEmilio G. Cota } 319be2cdc5eSEmilio G. Cota return 0; 320be2cdc5eSEmilio G. Cota } 321be2cdc5eSEmilio G. Cota 322be2cdc5eSEmilio G. Cota static gint tb_tc_cmp(gconstpointer ap, gconstpointer bp) 323be2cdc5eSEmilio G. Cota { 324be2cdc5eSEmilio G. Cota const struct tb_tc *a = ap; 325be2cdc5eSEmilio G. Cota const struct tb_tc *b = bp; 326be2cdc5eSEmilio G. Cota 327be2cdc5eSEmilio G. Cota /* 328be2cdc5eSEmilio G. Cota * When both sizes are set, we know this isn't a lookup. 329be2cdc5eSEmilio G. Cota * This is the most likely case: every TB must be inserted; lookups 330be2cdc5eSEmilio G. Cota * are a lot less frequent. 331be2cdc5eSEmilio G. Cota */ 332be2cdc5eSEmilio G. Cota if (likely(a->size && b->size)) { 333be2cdc5eSEmilio G. Cota if (a->ptr > b->ptr) { 334be2cdc5eSEmilio G. Cota return 1; 335be2cdc5eSEmilio G. Cota } else if (a->ptr < b->ptr) { 336be2cdc5eSEmilio G. Cota return -1; 337be2cdc5eSEmilio G. Cota } 338be2cdc5eSEmilio G. Cota /* a->ptr == b->ptr should happen only on deletions */ 339be2cdc5eSEmilio G. Cota g_assert(a->size == b->size); 340be2cdc5eSEmilio G. Cota return 0; 341be2cdc5eSEmilio G. Cota } 342be2cdc5eSEmilio G. Cota /* 343be2cdc5eSEmilio G. Cota * All lookups have either .size field set to 0. 344be2cdc5eSEmilio G. Cota * From the glib sources we see that @ap is always the lookup key. However 345be2cdc5eSEmilio G. Cota * the docs provide no guarantee, so we just mark this case as likely. 346be2cdc5eSEmilio G. Cota */ 347be2cdc5eSEmilio G. Cota if (likely(a->size == 0)) { 348be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(a->ptr, b); 349be2cdc5eSEmilio G. Cota } 350be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(b->ptr, a); 351be2cdc5eSEmilio G. Cota } 352be2cdc5eSEmilio G. Cota 353be2cdc5eSEmilio G. Cota static void tcg_region_trees_init(void) 354be2cdc5eSEmilio G. Cota { 355be2cdc5eSEmilio G. Cota size_t i; 356be2cdc5eSEmilio G. 
Cota 357be2cdc5eSEmilio G. Cota tree_size = ROUND_UP(sizeof(struct tcg_region_tree), qemu_dcache_linesize); 358be2cdc5eSEmilio G. Cota region_trees = qemu_memalign(qemu_dcache_linesize, region.n * tree_size); 359be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 360be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 361be2cdc5eSEmilio G. Cota 362be2cdc5eSEmilio G. Cota qemu_mutex_init(&rt->lock); 363be2cdc5eSEmilio G. Cota rt->tree = g_tree_new(tb_tc_cmp); 364be2cdc5eSEmilio G. Cota } 365be2cdc5eSEmilio G. Cota } 366be2cdc5eSEmilio G. Cota 367be2cdc5eSEmilio G. Cota static struct tcg_region_tree *tc_ptr_to_region_tree(void *p) 368be2cdc5eSEmilio G. Cota { 369be2cdc5eSEmilio G. Cota size_t region_idx; 370be2cdc5eSEmilio G. Cota 371be2cdc5eSEmilio G. Cota if (p < region.start_aligned) { 372be2cdc5eSEmilio G. Cota region_idx = 0; 373be2cdc5eSEmilio G. Cota } else { 374be2cdc5eSEmilio G. Cota ptrdiff_t offset = p - region.start_aligned; 375be2cdc5eSEmilio G. Cota 376be2cdc5eSEmilio G. Cota if (offset > region.stride * (region.n - 1)) { 377be2cdc5eSEmilio G. Cota region_idx = region.n - 1; 378be2cdc5eSEmilio G. Cota } else { 379be2cdc5eSEmilio G. Cota region_idx = offset / region.stride; 380be2cdc5eSEmilio G. Cota } 381be2cdc5eSEmilio G. Cota } 382be2cdc5eSEmilio G. Cota return region_trees + region_idx * tree_size; 383be2cdc5eSEmilio G. Cota } 384be2cdc5eSEmilio G. Cota 385be2cdc5eSEmilio G. Cota void tcg_tb_insert(TranslationBlock *tb) 386be2cdc5eSEmilio G. Cota { 387be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 388be2cdc5eSEmilio G. Cota 389be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 390be2cdc5eSEmilio G. Cota g_tree_insert(rt->tree, &tb->tc, tb); 391be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 392be2cdc5eSEmilio G. Cota } 393be2cdc5eSEmilio G. Cota 394be2cdc5eSEmilio G. Cota void tcg_tb_remove(TranslationBlock *tb) 395be2cdc5eSEmilio G. Cota { 396be2cdc5eSEmilio G. 
Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 397be2cdc5eSEmilio G. Cota 398be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 399be2cdc5eSEmilio G. Cota g_tree_remove(rt->tree, &tb->tc); 400be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 401be2cdc5eSEmilio G. Cota } 402be2cdc5eSEmilio G. Cota 403be2cdc5eSEmilio G. Cota /* 404be2cdc5eSEmilio G. Cota * Find the TB 'tb' such that 405be2cdc5eSEmilio G. Cota * tb->tc.ptr <= tc_ptr < tb->tc.ptr + tb->tc.size 406be2cdc5eSEmilio G. Cota * Return NULL if not found. 407be2cdc5eSEmilio G. Cota */ 408be2cdc5eSEmilio G. Cota TranslationBlock *tcg_tb_lookup(uintptr_t tc_ptr) 409be2cdc5eSEmilio G. Cota { 410be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree((void *)tc_ptr); 411be2cdc5eSEmilio G. Cota TranslationBlock *tb; 412be2cdc5eSEmilio G. Cota struct tb_tc s = { .ptr = (void *)tc_ptr }; 413be2cdc5eSEmilio G. Cota 414be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 415be2cdc5eSEmilio G. Cota tb = g_tree_lookup(rt->tree, &s); 416be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 417be2cdc5eSEmilio G. Cota return tb; 418be2cdc5eSEmilio G. Cota } 419be2cdc5eSEmilio G. Cota 420be2cdc5eSEmilio G. Cota static void tcg_region_tree_lock_all(void) 421be2cdc5eSEmilio G. Cota { 422be2cdc5eSEmilio G. Cota size_t i; 423be2cdc5eSEmilio G. Cota 424be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 425be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 426be2cdc5eSEmilio G. Cota 427be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 428be2cdc5eSEmilio G. Cota } 429be2cdc5eSEmilio G. Cota } 430be2cdc5eSEmilio G. Cota 431be2cdc5eSEmilio G. Cota static void tcg_region_tree_unlock_all(void) 432be2cdc5eSEmilio G. Cota { 433be2cdc5eSEmilio G. Cota size_t i; 434be2cdc5eSEmilio G. Cota 435be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 436be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 437be2cdc5eSEmilio G. 
Cota 438be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 439be2cdc5eSEmilio G. Cota } 440be2cdc5eSEmilio G. Cota } 441be2cdc5eSEmilio G. Cota 442be2cdc5eSEmilio G. Cota void tcg_tb_foreach(GTraverseFunc func, gpointer user_data) 443be2cdc5eSEmilio G. Cota { 444be2cdc5eSEmilio G. Cota size_t i; 445be2cdc5eSEmilio G. Cota 446be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 447be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 448be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 449be2cdc5eSEmilio G. Cota 450be2cdc5eSEmilio G. Cota g_tree_foreach(rt->tree, func, user_data); 451be2cdc5eSEmilio G. Cota } 452be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 453be2cdc5eSEmilio G. Cota } 454be2cdc5eSEmilio G. Cota 455be2cdc5eSEmilio G. Cota size_t tcg_nb_tbs(void) 456be2cdc5eSEmilio G. Cota { 457be2cdc5eSEmilio G. Cota size_t nb_tbs = 0; 458be2cdc5eSEmilio G. Cota size_t i; 459be2cdc5eSEmilio G. Cota 460be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 461be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 462be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 463be2cdc5eSEmilio G. Cota 464be2cdc5eSEmilio G. Cota nb_tbs += g_tree_nnodes(rt->tree); 465be2cdc5eSEmilio G. Cota } 466be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 467be2cdc5eSEmilio G. Cota return nb_tbs; 468be2cdc5eSEmilio G. Cota } 469be2cdc5eSEmilio G. Cota 470be2cdc5eSEmilio G. Cota static void tcg_region_tree_reset_all(void) 471be2cdc5eSEmilio G. Cota { 472be2cdc5eSEmilio G. Cota size_t i; 473be2cdc5eSEmilio G. Cota 474be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 475be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 476be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 477be2cdc5eSEmilio G. Cota 478be2cdc5eSEmilio G. Cota /* Increment the refcount first so that destroy acts as a reset */ 479be2cdc5eSEmilio G. Cota g_tree_ref(rt->tree); 480be2cdc5eSEmilio G. 
Cota g_tree_destroy(rt->tree); 481be2cdc5eSEmilio G. Cota } 482be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 483be2cdc5eSEmilio G. Cota } 484be2cdc5eSEmilio G. Cota 485e8feb96fSEmilio G. Cota static void tcg_region_bounds(size_t curr_region, void **pstart, void **pend) 486e8feb96fSEmilio G. Cota { 487e8feb96fSEmilio G. Cota void *start, *end; 488e8feb96fSEmilio G. Cota 489e8feb96fSEmilio G. Cota start = region.start_aligned + curr_region * region.stride; 490e8feb96fSEmilio G. Cota end = start + region.size; 491e8feb96fSEmilio G. Cota 492e8feb96fSEmilio G. Cota if (curr_region == 0) { 493e8feb96fSEmilio G. Cota start = region.start; 494e8feb96fSEmilio G. Cota } 495e8feb96fSEmilio G. Cota if (curr_region == region.n - 1) { 496e8feb96fSEmilio G. Cota end = region.end; 497e8feb96fSEmilio G. Cota } 498e8feb96fSEmilio G. Cota 499e8feb96fSEmilio G. Cota *pstart = start; 500e8feb96fSEmilio G. Cota *pend = end; 501e8feb96fSEmilio G. Cota } 502e8feb96fSEmilio G. Cota 503e8feb96fSEmilio G. Cota static void tcg_region_assign(TCGContext *s, size_t curr_region) 504e8feb96fSEmilio G. Cota { 505e8feb96fSEmilio G. Cota void *start, *end; 506e8feb96fSEmilio G. Cota 507e8feb96fSEmilio G. Cota tcg_region_bounds(curr_region, &start, &end); 508e8feb96fSEmilio G. Cota 509e8feb96fSEmilio G. Cota s->code_gen_buffer = start; 510e8feb96fSEmilio G. Cota s->code_gen_ptr = start; 511e8feb96fSEmilio G. Cota s->code_gen_buffer_size = end - start; 512e8feb96fSEmilio G. Cota s->code_gen_highwater = end - TCG_HIGHWATER; 513e8feb96fSEmilio G. Cota } 514e8feb96fSEmilio G. Cota 515e8feb96fSEmilio G. Cota static bool tcg_region_alloc__locked(TCGContext *s) 516e8feb96fSEmilio G. Cota { 517e8feb96fSEmilio G. Cota if (region.current == region.n) { 518e8feb96fSEmilio G. Cota return true; 519e8feb96fSEmilio G. Cota } 520e8feb96fSEmilio G. Cota tcg_region_assign(s, region.current); 521e8feb96fSEmilio G. Cota region.current++; 522e8feb96fSEmilio G. Cota return false; 523e8feb96fSEmilio G. 
Cota } 524e8feb96fSEmilio G. Cota 525e8feb96fSEmilio G. Cota /* 526e8feb96fSEmilio G. Cota * Request a new region once the one in use has filled up. 527e8feb96fSEmilio G. Cota * Returns true on error. 528e8feb96fSEmilio G. Cota */ 529e8feb96fSEmilio G. Cota static bool tcg_region_alloc(TCGContext *s) 530e8feb96fSEmilio G. Cota { 531e8feb96fSEmilio G. Cota bool err; 532e8feb96fSEmilio G. Cota /* read the region size now; alloc__locked will overwrite it on success */ 533e8feb96fSEmilio G. Cota size_t size_full = s->code_gen_buffer_size; 534e8feb96fSEmilio G. Cota 535e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 536e8feb96fSEmilio G. Cota err = tcg_region_alloc__locked(s); 537e8feb96fSEmilio G. Cota if (!err) { 538e8feb96fSEmilio G. Cota region.agg_size_full += size_full - TCG_HIGHWATER; 539e8feb96fSEmilio G. Cota } 540e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 541e8feb96fSEmilio G. Cota return err; 542e8feb96fSEmilio G. Cota } 543e8feb96fSEmilio G. Cota 544e8feb96fSEmilio G. Cota /* 545e8feb96fSEmilio G. Cota * Perform a context's first region allocation. 546e8feb96fSEmilio G. Cota * This function does _not_ increment region.agg_size_full. 547e8feb96fSEmilio G. Cota */ 548e8feb96fSEmilio G. Cota static inline bool tcg_region_initial_alloc__locked(TCGContext *s) 549e8feb96fSEmilio G. Cota { 550e8feb96fSEmilio G. Cota return tcg_region_alloc__locked(s); 551e8feb96fSEmilio G. Cota } 552e8feb96fSEmilio G. Cota 553e8feb96fSEmilio G. Cota /* Call from a safe-work context */ 554e8feb96fSEmilio G. Cota void tcg_region_reset_all(void) 555e8feb96fSEmilio G. Cota { 5563468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 557e8feb96fSEmilio G. Cota unsigned int i; 558e8feb96fSEmilio G. Cota 559e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 560e8feb96fSEmilio G. Cota region.current = 0; 561e8feb96fSEmilio G. Cota region.agg_size_full = 0; 562e8feb96fSEmilio G. Cota 5633468b59eSEmilio G. 
Cota for (i = 0; i < n_ctxs; i++) { 5643468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 5653468b59eSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(s); 566e8feb96fSEmilio G. Cota 567e8feb96fSEmilio G. Cota g_assert(!err); 568e8feb96fSEmilio G. Cota } 569e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 570be2cdc5eSEmilio G. Cota 571be2cdc5eSEmilio G. Cota tcg_region_tree_reset_all(); 572e8feb96fSEmilio G. Cota } 573e8feb96fSEmilio G. Cota 5743468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 5753468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5763468b59eSEmilio G. Cota { 5773468b59eSEmilio G. Cota return 1; 5783468b59eSEmilio G. Cota } 5793468b59eSEmilio G. Cota #else 5803468b59eSEmilio G. Cota /* 5813468b59eSEmilio G. Cota * It is likely that some vCPUs will translate more code than others, so we 5823468b59eSEmilio G. Cota * first try to set more regions than max_cpus, with those regions being of 5833468b59eSEmilio G. Cota * reasonable size. If that's not possible we make do by evenly dividing 5843468b59eSEmilio G. Cota * the code_gen_buffer among the vCPUs. 5853468b59eSEmilio G. Cota */ 5863468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5873468b59eSEmilio G. Cota { 5883468b59eSEmilio G. Cota size_t i; 5893468b59eSEmilio G. Cota 5903468b59eSEmilio G. Cota /* Use a single region if all we have is one vCPU thread */ 5913468b59eSEmilio G. Cota if (max_cpus == 1 || !qemu_tcg_mttcg_enabled()) { 5923468b59eSEmilio G. Cota return 1; 5933468b59eSEmilio G. Cota } 5943468b59eSEmilio G. Cota 5953468b59eSEmilio G. Cota /* Try to have more regions than max_cpus, with each region being >= 2 MB */ 5963468b59eSEmilio G. Cota for (i = 8; i > 0; i--) { 5973468b59eSEmilio G. Cota size_t regions_per_thread = i; 5983468b59eSEmilio G. Cota size_t region_size; 5993468b59eSEmilio G. Cota 6003468b59eSEmilio G. Cota region_size = tcg_init_ctx.code_gen_buffer_size; 6013468b59eSEmilio G. 
Cota region_size /= max_cpus * regions_per_thread; 6023468b59eSEmilio G. Cota 6033468b59eSEmilio G. Cota if (region_size >= 2 * 1024u * 1024) { 6043468b59eSEmilio G. Cota return max_cpus * regions_per_thread; 6053468b59eSEmilio G. Cota } 6063468b59eSEmilio G. Cota } 6073468b59eSEmilio G. Cota /* If we can't, then just allocate one region per vCPU thread */ 6083468b59eSEmilio G. Cota return max_cpus; 6093468b59eSEmilio G. Cota } 6103468b59eSEmilio G. Cota #endif 6113468b59eSEmilio G. Cota 612e8feb96fSEmilio G. Cota /* 613e8feb96fSEmilio G. Cota * Initializes region partitioning. 614e8feb96fSEmilio G. Cota * 615e8feb96fSEmilio G. Cota * Called at init time from the parent thread (i.e. the one calling 616e8feb96fSEmilio G. Cota * tcg_context_init), after the target's TCG globals have been set. 6173468b59eSEmilio G. Cota * 6183468b59eSEmilio G. Cota * Region partitioning works by splitting code_gen_buffer into separate regions, 6193468b59eSEmilio G. Cota * and then assigning regions to TCG threads so that the threads can translate 6203468b59eSEmilio G. Cota * code in parallel without synchronization. 6213468b59eSEmilio G. Cota * 6223468b59eSEmilio G. Cota * In softmmu the number of TCG threads is bounded by max_cpus, so we use at 6233468b59eSEmilio G. Cota * least max_cpus regions in MTTCG. In !MTTCG we use a single region. 6243468b59eSEmilio G. Cota * Note that the TCG options from the command-line (i.e. -accel accel=tcg,[...]) 6253468b59eSEmilio G. Cota * must have been parsed before calling this function, since it calls 6263468b59eSEmilio G. Cota * qemu_tcg_mttcg_enabled(). 6273468b59eSEmilio G. Cota * 6283468b59eSEmilio G. Cota * In user-mode we use a single region. Having multiple regions in user-mode 6293468b59eSEmilio G. Cota * is not supported, because the number of vCPU threads (recall that each thread 6303468b59eSEmilio G. Cota * spawned by the guest corresponds to a vCPU thread) is only bounded by the 6313468b59eSEmilio G. 
Cota * OS, and usually this number is huge (tens of thousands is not uncommon). 6323468b59eSEmilio G. Cota * Thus, given this large bound on the number of vCPU threads and the fact 6333468b59eSEmilio G. Cota * that code_gen_buffer is allocated at compile-time, we cannot guarantee 6343468b59eSEmilio G. Cota * that the availability of at least one region per vCPU thread. 6353468b59eSEmilio G. Cota * 6363468b59eSEmilio G. Cota * However, this user-mode limitation is unlikely to be a significant problem 6373468b59eSEmilio G. Cota * in practice. Multi-threaded guests share most if not all of their translated 6383468b59eSEmilio G. Cota * code, which makes parallel code generation less appealing than in softmmu. 639e8feb96fSEmilio G. Cota */ 640e8feb96fSEmilio G. Cota void tcg_region_init(void) 641e8feb96fSEmilio G. Cota { 642e8feb96fSEmilio G. Cota void *buf = tcg_init_ctx.code_gen_buffer; 643e8feb96fSEmilio G. Cota void *aligned; 644e8feb96fSEmilio G. Cota size_t size = tcg_init_ctx.code_gen_buffer_size; 645e8feb96fSEmilio G. Cota size_t page_size = qemu_real_host_page_size; 646e8feb96fSEmilio G. Cota size_t region_size; 647e8feb96fSEmilio G. Cota size_t n_regions; 648e8feb96fSEmilio G. Cota size_t i; 649e8feb96fSEmilio G. Cota 6503468b59eSEmilio G. Cota n_regions = tcg_n_regions(); 651e8feb96fSEmilio G. Cota 652e8feb96fSEmilio G. Cota /* The first region will be 'aligned - buf' bytes larger than the others */ 653e8feb96fSEmilio G. Cota aligned = QEMU_ALIGN_PTR_UP(buf, page_size); 654e8feb96fSEmilio G. Cota g_assert(aligned < tcg_init_ctx.code_gen_buffer + size); 655e8feb96fSEmilio G. Cota /* 656e8feb96fSEmilio G. Cota * Make region_size a multiple of page_size, using aligned as the start. 657e8feb96fSEmilio G. Cota * As a result of this we might end up with a few extra pages at the end of 658e8feb96fSEmilio G. Cota * the buffer; we will assign those to the last region. 659e8feb96fSEmilio G. Cota */ 660e8feb96fSEmilio G. 
Cota region_size = (size - (aligned - buf)) / n_regions; 661e8feb96fSEmilio G. Cota region_size = QEMU_ALIGN_DOWN(region_size, page_size); 662e8feb96fSEmilio G. Cota 663e8feb96fSEmilio G. Cota /* A region must have at least 2 pages; one code, one guard */ 664e8feb96fSEmilio G. Cota g_assert(region_size >= 2 * page_size); 665e8feb96fSEmilio G. Cota 666e8feb96fSEmilio G. Cota /* init the region struct */ 667e8feb96fSEmilio G. Cota qemu_mutex_init(®ion.lock); 668e8feb96fSEmilio G. Cota region.n = n_regions; 669e8feb96fSEmilio G. Cota region.size = region_size - page_size; 670e8feb96fSEmilio G. Cota region.stride = region_size; 671e8feb96fSEmilio G. Cota region.start = buf; 672e8feb96fSEmilio G. Cota region.start_aligned = aligned; 673e8feb96fSEmilio G. Cota /* page-align the end, since its last page will be a guard page */ 674e8feb96fSEmilio G. Cota region.end = QEMU_ALIGN_PTR_DOWN(buf + size, page_size); 675e8feb96fSEmilio G. Cota /* account for that last guard page */ 676e8feb96fSEmilio G. Cota region.end -= page_size; 677e8feb96fSEmilio G. Cota 678e8feb96fSEmilio G. Cota /* set guard pages */ 679e8feb96fSEmilio G. Cota for (i = 0; i < region.n; i++) { 680e8feb96fSEmilio G. Cota void *start, *end; 681e8feb96fSEmilio G. Cota int rc; 682e8feb96fSEmilio G. Cota 683e8feb96fSEmilio G. Cota tcg_region_bounds(i, &start, &end); 684e8feb96fSEmilio G. Cota rc = qemu_mprotect_none(end, page_size); 685e8feb96fSEmilio G. Cota g_assert(!rc); 686e8feb96fSEmilio G. Cota } 687e8feb96fSEmilio G. Cota 688be2cdc5eSEmilio G. Cota tcg_region_trees_init(); 689be2cdc5eSEmilio G. Cota 6903468b59eSEmilio G. Cota /* In user-mode we support only one ctx, so do the initial allocation now */ 6913468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 692e8feb96fSEmilio G. Cota { 693e8feb96fSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(tcg_ctx); 694e8feb96fSEmilio G. Cota 695e8feb96fSEmilio G. Cota g_assert(!err); 696e8feb96fSEmilio G. Cota } 6973468b59eSEmilio G. 
Cota #endif 698e8feb96fSEmilio G. Cota } 699e8feb96fSEmilio G. Cota 700e8feb96fSEmilio G. Cota /* 7013468b59eSEmilio G. Cota * All TCG threads except the parent (i.e. the one that called tcg_context_init 7023468b59eSEmilio G. Cota * and registered the target's TCG globals) must register with this function 7033468b59eSEmilio G. Cota * before initiating translation. 7043468b59eSEmilio G. Cota * 7053468b59eSEmilio G. Cota * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation 7063468b59eSEmilio G. Cota * of tcg_region_init() for the reasoning behind this. 7073468b59eSEmilio G. Cota * 7083468b59eSEmilio G. Cota * In softmmu each caller registers its context in tcg_ctxs[]. Note that in 7093468b59eSEmilio G. Cota * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context 7103468b59eSEmilio G. Cota * is not used anymore for translation once this function is called. 7113468b59eSEmilio G. Cota * 7123468b59eSEmilio G. Cota * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates 7133468b59eSEmilio G. Cota * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode. 7143468b59eSEmilio G. Cota */ 7153468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 7163468b59eSEmilio G. Cota void tcg_register_thread(void) 7173468b59eSEmilio G. Cota { 7183468b59eSEmilio G. Cota tcg_ctx = &tcg_init_ctx; 7193468b59eSEmilio G. Cota } 7203468b59eSEmilio G. Cota #else 7213468b59eSEmilio G. Cota void tcg_register_thread(void) 7223468b59eSEmilio G. Cota { 7233468b59eSEmilio G. Cota TCGContext *s = g_malloc(sizeof(*s)); 7243468b59eSEmilio G. Cota unsigned int i, n; 7253468b59eSEmilio G. Cota bool err; 7263468b59eSEmilio G. Cota 7273468b59eSEmilio G. Cota *s = tcg_init_ctx; 7283468b59eSEmilio G. Cota 7293468b59eSEmilio G. Cota /* Relink mem_base. */ 7303468b59eSEmilio G. Cota for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) { 7313468b59eSEmilio G. Cota if (tcg_init_ctx.temps[i].mem_base) { 7323468b59eSEmilio G. 
Cota ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps; 7333468b59eSEmilio G. Cota tcg_debug_assert(b >= 0 && b < n); 7343468b59eSEmilio G. Cota s->temps[i].mem_base = &s->temps[b]; 7353468b59eSEmilio G. Cota } 7363468b59eSEmilio G. Cota } 7373468b59eSEmilio G. Cota 7383468b59eSEmilio G. Cota /* Claim an entry in tcg_ctxs */ 7393468b59eSEmilio G. Cota n = atomic_fetch_inc(&n_tcg_ctxs); 7403468b59eSEmilio G. Cota g_assert(n < max_cpus); 7413468b59eSEmilio G. Cota atomic_set(&tcg_ctxs[n], s); 7423468b59eSEmilio G. Cota 7433468b59eSEmilio G. Cota tcg_ctx = s; 7443468b59eSEmilio G. Cota qemu_mutex_lock(®ion.lock); 7453468b59eSEmilio G. Cota err = tcg_region_initial_alloc__locked(tcg_ctx); 7463468b59eSEmilio G. Cota g_assert(!err); 7473468b59eSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 7483468b59eSEmilio G. Cota } 7493468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */ 7503468b59eSEmilio G. Cota 7513468b59eSEmilio G. Cota /* 752e8feb96fSEmilio G. Cota * Returns the size (in bytes) of all translated code (i.e. from all regions) 753e8feb96fSEmilio G. Cota * currently in the cache. 754e8feb96fSEmilio G. Cota * See also: tcg_code_capacity() 755e8feb96fSEmilio G. Cota * Do not confuse with tcg_current_code_size(); that one applies to a single 756e8feb96fSEmilio G. Cota * TCG context. 757e8feb96fSEmilio G. Cota */ 758e8feb96fSEmilio G. Cota size_t tcg_code_size(void) 759e8feb96fSEmilio G. Cota { 7603468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 761e8feb96fSEmilio G. Cota unsigned int i; 762e8feb96fSEmilio G. Cota size_t total; 763e8feb96fSEmilio G. Cota 764e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 765e8feb96fSEmilio G. Cota total = region.agg_size_full; 7663468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 7673468b59eSEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 768e8feb96fSEmilio G. Cota size_t size; 769e8feb96fSEmilio G. Cota 770e8feb96fSEmilio G. 
Cota size = atomic_read(&s->code_gen_ptr) - s->code_gen_buffer; 771e8feb96fSEmilio G. Cota g_assert(size <= s->code_gen_buffer_size); 772e8feb96fSEmilio G. Cota total += size; 773e8feb96fSEmilio G. Cota } 774e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 775e8feb96fSEmilio G. Cota return total; 776e8feb96fSEmilio G. Cota } 777e8feb96fSEmilio G. Cota 778e8feb96fSEmilio G. Cota /* 779e8feb96fSEmilio G. Cota * Returns the code capacity (in bytes) of the entire cache, i.e. including all 780e8feb96fSEmilio G. Cota * regions. 781e8feb96fSEmilio G. Cota * See also: tcg_code_size() 782e8feb96fSEmilio G. Cota */ 783e8feb96fSEmilio G. Cota size_t tcg_code_capacity(void) 784e8feb96fSEmilio G. Cota { 785e8feb96fSEmilio G. Cota size_t guard_size, capacity; 786e8feb96fSEmilio G. Cota 787e8feb96fSEmilio G. Cota /* no need for synchronization; these variables are set at init time */ 788e8feb96fSEmilio G. Cota guard_size = region.stride - region.size; 789e8feb96fSEmilio G. Cota capacity = region.end + guard_size - region.start; 790e8feb96fSEmilio G. Cota capacity -= region.n * (guard_size + TCG_HIGHWATER); 791e8feb96fSEmilio G. Cota return capacity; 792e8feb96fSEmilio G. Cota } 793e8feb96fSEmilio G. Cota 794*128ed227SEmilio G. Cota size_t tcg_tb_phys_invalidate_count(void) 795*128ed227SEmilio G. Cota { 796*128ed227SEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 797*128ed227SEmilio G. Cota unsigned int i; 798*128ed227SEmilio G. Cota size_t total = 0; 799*128ed227SEmilio G. Cota 800*128ed227SEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 801*128ed227SEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 802*128ed227SEmilio G. Cota 803*128ed227SEmilio G. Cota total += atomic_read(&s->tb_phys_invalidate_count); 804*128ed227SEmilio G. Cota } 805*128ed227SEmilio G. Cota return total; 806*128ed227SEmilio G. Cota } 807*128ed227SEmilio G. 
Cota 808c896fe29Sbellard /* pool based memory allocation */ 809c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 810c896fe29Sbellard { 811c896fe29Sbellard TCGPool *p; 812c896fe29Sbellard int pool_size; 813c896fe29Sbellard 814c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 815c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 8167267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 817c896fe29Sbellard p->size = size; 8184055299eSKirill Batuzov p->next = s->pool_first_large; 8194055299eSKirill Batuzov s->pool_first_large = p; 8204055299eSKirill Batuzov return p->data; 821c896fe29Sbellard } else { 822c896fe29Sbellard p = s->pool_current; 823c896fe29Sbellard if (!p) { 824c896fe29Sbellard p = s->pool_first; 825c896fe29Sbellard if (!p) 826c896fe29Sbellard goto new_pool; 827c896fe29Sbellard } else { 828c896fe29Sbellard if (!p->next) { 829c896fe29Sbellard new_pool: 830c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 8317267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 832c896fe29Sbellard p->size = pool_size; 833c896fe29Sbellard p->next = NULL; 834c896fe29Sbellard if (s->pool_current) 835c896fe29Sbellard s->pool_current->next = p; 836c896fe29Sbellard else 837c896fe29Sbellard s->pool_first = p; 838c896fe29Sbellard } else { 839c896fe29Sbellard p = p->next; 840c896fe29Sbellard } 841c896fe29Sbellard } 842c896fe29Sbellard } 843c896fe29Sbellard s->pool_current = p; 844c896fe29Sbellard s->pool_cur = p->data + size; 845c896fe29Sbellard s->pool_end = p->data + p->size; 846c896fe29Sbellard return p->data; 847c896fe29Sbellard } 848c896fe29Sbellard 849c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 850c896fe29Sbellard { 8514055299eSKirill Batuzov TCGPool *p, *t; 8524055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 8534055299eSKirill Batuzov t = p->next; 8544055299eSKirill Batuzov g_free(p); 8554055299eSKirill Batuzov } 8564055299eSKirill Batuzov s->pool_first_large = NULL; 857c896fe29Sbellard 
s->pool_cur = s->pool_end = NULL; 858c896fe29Sbellard s->pool_current = NULL; 859c896fe29Sbellard } 860c896fe29Sbellard 861100b5e01SRichard Henderson typedef struct TCGHelperInfo { 862100b5e01SRichard Henderson void *func; 863100b5e01SRichard Henderson const char *name; 864afb49896SRichard Henderson unsigned flags; 865afb49896SRichard Henderson unsigned sizemask; 866100b5e01SRichard Henderson } TCGHelperInfo; 867100b5e01SRichard Henderson 8682ef6175aSRichard Henderson #include "exec/helper-proto.h" 8692ef6175aSRichard Henderson 870100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 8712ef6175aSRichard Henderson #include "exec/helper-tcg.h" 872100b5e01SRichard Henderson }; 873619205fdSEmilio G. Cota static GHashTable *helper_table; 874100b5e01SRichard Henderson 87591478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 876f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 8771c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 8781c2adb95SRichard Henderson TCGReg reg, const char *name); 87991478cefSRichard Henderson 880c896fe29Sbellard void tcg_context_init(TCGContext *s) 881c896fe29Sbellard { 882100b5e01SRichard Henderson int op, total_args, n, i; 883c896fe29Sbellard TCGOpDef *def; 884c896fe29Sbellard TCGArgConstraint *args_ct; 885c896fe29Sbellard int *sorted_args; 8861c2adb95SRichard Henderson TCGTemp *ts; 887c896fe29Sbellard 888c896fe29Sbellard memset(s, 0, sizeof(*s)); 889c896fe29Sbellard s->nb_globals = 0; 890c896fe29Sbellard 891c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 892c896fe29Sbellard space */ 893c896fe29Sbellard total_args = 0; 894c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 895c896fe29Sbellard def = &tcg_op_defs[op]; 896c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 897c896fe29Sbellard total_args += n; 898c896fe29Sbellard } 899c896fe29Sbellard 9007267c094SAnthony Liguori 
args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args); 9017267c094SAnthony Liguori sorted_args = g_malloc(sizeof(int) * total_args); 902c896fe29Sbellard 903c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 904c896fe29Sbellard def = &tcg_op_defs[op]; 905c896fe29Sbellard def->args_ct = args_ct; 906c896fe29Sbellard def->sorted_args = sorted_args; 907c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 908c896fe29Sbellard sorted_args += n; 909c896fe29Sbellard args_ct += n; 910c896fe29Sbellard } 911c896fe29Sbellard 9125cd8f621SRichard Henderson /* Register helpers. */ 91384fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 914619205fdSEmilio G. Cota helper_table = g_hash_table_new(NULL, NULL); 91584fd9dd3SRichard Henderson 916100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 91784fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 91872866e82SRichard Henderson (gpointer)&all_helpers[i]); 919100b5e01SRichard Henderson } 9205cd8f621SRichard Henderson 921c896fe29Sbellard tcg_target_init(s); 922f69d277eSRichard Henderson process_op_defs(s); 92391478cefSRichard Henderson 92491478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 92591478cefSRichard Henderson the start of tcg_target_reg_alloc_order. 
*/ 92691478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 92791478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 92891478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 92991478cefSRichard Henderson break; 93091478cefSRichard Henderson } 93191478cefSRichard Henderson } 93291478cefSRichard Henderson for (i = 0; i < n; ++i) { 93391478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 93491478cefSRichard Henderson } 93591478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 93691478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 93791478cefSRichard Henderson } 938b1311c4aSEmilio G. Cota 939b1311c4aSEmilio G. Cota tcg_ctx = s; 9403468b59eSEmilio G. Cota /* 9413468b59eSEmilio G. Cota * In user-mode we simply share the init context among threads, since we 9423468b59eSEmilio G. Cota * use a single region. See the documentation tcg_region_init() for the 9433468b59eSEmilio G. Cota * reasoning behind this. 9443468b59eSEmilio G. Cota * In softmmu we will have at most max_cpus TCG threads. 9453468b59eSEmilio G. Cota */ 9463468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 947df2cce29SEmilio G. Cota tcg_ctxs = &tcg_ctx; 948df2cce29SEmilio G. Cota n_tcg_ctxs = 1; 9493468b59eSEmilio G. Cota #else 9503468b59eSEmilio G. Cota tcg_ctxs = g_new(TCGContext *, max_cpus); 9513468b59eSEmilio G. Cota #endif 9521c2adb95SRichard Henderson 9531c2adb95SRichard Henderson tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0)); 9541c2adb95SRichard Henderson ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env"); 9551c2adb95SRichard Henderson cpu_env = temp_tcgv_ptr(ts); 9569002ec79SRichard Henderson } 957b03cce8eSbellard 9586e3b2bfdSEmilio G. Cota /* 9596e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 9606e3b2bfdSEmilio G. 
Cota * sure that TBs and code are on different cache lines. 9616e3b2bfdSEmilio G. Cota */ 9626e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 9636e3b2bfdSEmilio G. Cota { 9646e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 9656e3b2bfdSEmilio G. Cota TranslationBlock *tb; 9666e3b2bfdSEmilio G. Cota void *next; 9676e3b2bfdSEmilio G. Cota 968e8feb96fSEmilio G. Cota retry: 9696e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 9706e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 9716e3b2bfdSEmilio G. Cota 9726e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 973e8feb96fSEmilio G. Cota if (tcg_region_alloc(s)) { 9746e3b2bfdSEmilio G. Cota return NULL; 9756e3b2bfdSEmilio G. Cota } 976e8feb96fSEmilio G. Cota goto retry; 977e8feb96fSEmilio G. Cota } 978e8feb96fSEmilio G. Cota atomic_set(&s->code_gen_ptr, next); 97957a26946SRichard Henderson s->data_gen_ptr = NULL; 9806e3b2bfdSEmilio G. Cota return tb; 9816e3b2bfdSEmilio G. Cota } 9826e3b2bfdSEmilio G. Cota 9839002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 9849002ec79SRichard Henderson { 9858163b749SRichard Henderson size_t prologue_size, total_size; 9868163b749SRichard Henderson void *buf0, *buf1; 9878163b749SRichard Henderson 9888163b749SRichard Henderson /* Put the prologue at the beginning of code_gen_buffer. */ 9898163b749SRichard Henderson buf0 = s->code_gen_buffer; 9905b38ee31SRichard Henderson total_size = s->code_gen_buffer_size; 9918163b749SRichard Henderson s->code_ptr = buf0; 9928163b749SRichard Henderson s->code_buf = buf0; 9935b38ee31SRichard Henderson s->data_gen_ptr = NULL; 9948163b749SRichard Henderson s->code_gen_prologue = buf0; 9958163b749SRichard Henderson 9965b38ee31SRichard Henderson /* Compute a high-water mark, at which we voluntarily flush the buffer 9975b38ee31SRichard Henderson and start over. 
The size here is arbitrary, significantly larger 9985b38ee31SRichard Henderson than we expect the code generation for any one opcode to require. */ 9995b38ee31SRichard Henderson s->code_gen_highwater = s->code_gen_buffer + (total_size - TCG_HIGHWATER); 10005b38ee31SRichard Henderson 10015b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 10025b38ee31SRichard Henderson s->pool_labels = NULL; 10035b38ee31SRichard Henderson #endif 10045b38ee31SRichard Henderson 10058163b749SRichard Henderson /* Generate the prologue. */ 1006b03cce8eSbellard tcg_target_qemu_prologue(s); 10075b38ee31SRichard Henderson 10085b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 10095b38ee31SRichard Henderson /* Allow the prologue to put e.g. guest_base into a pool entry. */ 10105b38ee31SRichard Henderson { 10115b38ee31SRichard Henderson bool ok = tcg_out_pool_finalize(s); 10125b38ee31SRichard Henderson tcg_debug_assert(ok); 10135b38ee31SRichard Henderson } 10145b38ee31SRichard Henderson #endif 10155b38ee31SRichard Henderson 10168163b749SRichard Henderson buf1 = s->code_ptr; 10178163b749SRichard Henderson flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1); 10188163b749SRichard Henderson 10198163b749SRichard Henderson /* Deduct the prologue from the buffer. 
*/ 10208163b749SRichard Henderson prologue_size = tcg_current_code_size(s); 10218163b749SRichard Henderson s->code_gen_ptr = buf1; 10228163b749SRichard Henderson s->code_gen_buffer = buf1; 10238163b749SRichard Henderson s->code_buf = buf1; 10245b38ee31SRichard Henderson total_size -= prologue_size; 10258163b749SRichard Henderson s->code_gen_buffer_size = total_size; 10268163b749SRichard Henderson 10278163b749SRichard Henderson tcg_register_jit(s->code_gen_buffer, total_size); 1028d6b64b2bSRichard Henderson 1029d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 1030d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 10311ee73216SRichard Henderson qemu_log_lock(); 10328163b749SRichard Henderson qemu_log("PROLOGUE: [size=%zu]\n", prologue_size); 10335b38ee31SRichard Henderson if (s->data_gen_ptr) { 10345b38ee31SRichard Henderson size_t code_size = s->data_gen_ptr - buf0; 10355b38ee31SRichard Henderson size_t data_size = prologue_size - code_size; 10365b38ee31SRichard Henderson size_t i; 10375b38ee31SRichard Henderson 10385b38ee31SRichard Henderson log_disas(buf0, code_size); 10395b38ee31SRichard Henderson 10405b38ee31SRichard Henderson for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) { 10415b38ee31SRichard Henderson if (sizeof(tcg_target_ulong) == 8) { 10425b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .quad 0x%016" PRIx64 "\n", 10435b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 10445b38ee31SRichard Henderson *(uint64_t *)(s->data_gen_ptr + i)); 10455b38ee31SRichard Henderson } else { 10465b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .long 0x%08x\n", 10475b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 10485b38ee31SRichard Henderson *(uint32_t *)(s->data_gen_ptr + i)); 10495b38ee31SRichard Henderson } 10505b38ee31SRichard Henderson } 10515b38ee31SRichard Henderson } else { 10528163b749SRichard Henderson log_disas(buf0, prologue_size); 10535b38ee31SRichard Henderson } 1054d6b64b2bSRichard Henderson 
qemu_log("\n"); 1055d6b64b2bSRichard Henderson qemu_log_flush(); 10561ee73216SRichard Henderson qemu_log_unlock(); 1057d6b64b2bSRichard Henderson } 1058d6b64b2bSRichard Henderson #endif 1059cedbcb01SEmilio G. Cota 1060cedbcb01SEmilio G. Cota /* Assert that goto_ptr is implemented completely. */ 1061cedbcb01SEmilio G. Cota if (TCG_TARGET_HAS_goto_ptr) { 1062cedbcb01SEmilio G. Cota tcg_debug_assert(s->code_gen_epilogue != NULL); 1063cedbcb01SEmilio G. Cota } 1064c896fe29Sbellard } 1065c896fe29Sbellard 1066c896fe29Sbellard void tcg_func_start(TCGContext *s) 1067c896fe29Sbellard { 1068c896fe29Sbellard tcg_pool_reset(s); 1069c896fe29Sbellard s->nb_temps = s->nb_globals; 10700ec9eabcSRichard Henderson 10710ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. */ 10720ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 10730ec9eabcSRichard Henderson 1074abebf925SRichard Henderson s->nb_ops = 0; 1075c896fe29Sbellard s->nb_labels = 0; 1076c896fe29Sbellard s->current_frame_offset = s->frame_start; 1077c896fe29Sbellard 10780a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 10790a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 10800a209d4bSRichard Henderson #endif 10810a209d4bSRichard Henderson 108215fa08f8SRichard Henderson QTAILQ_INIT(&s->ops); 108315fa08f8SRichard Henderson QTAILQ_INIT(&s->free_ops); 1084c896fe29Sbellard } 1085c896fe29Sbellard 10867ca4b752SRichard Henderson static inline TCGTemp *tcg_temp_alloc(TCGContext *s) 10877ca4b752SRichard Henderson { 10887ca4b752SRichard Henderson int n = s->nb_temps++; 10897ca4b752SRichard Henderson tcg_debug_assert(n < TCG_MAX_TEMPS); 10907ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 10917ca4b752SRichard Henderson } 10927ca4b752SRichard Henderson 10937ca4b752SRichard Henderson static inline TCGTemp *tcg_global_alloc(TCGContext *s) 10947ca4b752SRichard Henderson { 1095fa477d25SRichard Henderson TCGTemp *ts; 1096fa477d25SRichard Henderson 
10977ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 10987ca4b752SRichard Henderson s->nb_globals++; 1099fa477d25SRichard Henderson ts = tcg_temp_alloc(s); 1100fa477d25SRichard Henderson ts->temp_global = 1; 1101fa477d25SRichard Henderson 1102fa477d25SRichard Henderson return ts; 1103c896fe29Sbellard } 1104c896fe29Sbellard 1105085272b3SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 1106b6638662SRichard Henderson TCGReg reg, const char *name) 1107c896fe29Sbellard { 1108c896fe29Sbellard TCGTemp *ts; 1109c896fe29Sbellard 1110b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 1111c896fe29Sbellard tcg_abort(); 1112b3a62939SRichard Henderson } 11137ca4b752SRichard Henderson 11147ca4b752SRichard Henderson ts = tcg_global_alloc(s); 1115c896fe29Sbellard ts->base_type = type; 1116c896fe29Sbellard ts->type = type; 1117c896fe29Sbellard ts->fixed_reg = 1; 1118c896fe29Sbellard ts->reg = reg; 1119c896fe29Sbellard ts->name = name; 1120c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 11217ca4b752SRichard Henderson 1122085272b3SRichard Henderson return ts; 1123a7812ae4Spbrook } 1124a7812ae4Spbrook 1125b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 1126a7812ae4Spbrook { 1127b3a62939SRichard Henderson s->frame_start = start; 1128b3a62939SRichard Henderson s->frame_end = start + size; 1129085272b3SRichard Henderson s->frame_temp 1130085272b3SRichard Henderson = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 1131b3a62939SRichard Henderson } 1132a7812ae4Spbrook 1133085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 1134e1ccc054SRichard Henderson intptr_t offset, const char *name) 1135c896fe29Sbellard { 1136b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 1137dc41aa7dSRichard Henderson TCGTemp *base_ts = tcgv_ptr_temp(base); 11387ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 1139b3915dbbSRichard Henderson int indirect_reg = 0, bigendian = 0; 11407ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 11417ca4b752SRichard Henderson bigendian = 1; 11427ca4b752SRichard Henderson #endif 1143c896fe29Sbellard 1144b3915dbbSRichard Henderson if (!base_ts->fixed_reg) { 11455a18407fSRichard Henderson /* We do not support double-indirect registers. */ 11465a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 1147b3915dbbSRichard Henderson base_ts->indirect_base = 1; 11485a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 11495a18407fSRichard Henderson ? 2 : 1); 11505a18407fSRichard Henderson indirect_reg = 1; 1151b3915dbbSRichard Henderson } 1152b3915dbbSRichard Henderson 11537ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 11547ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 1155c896fe29Sbellard char buf[64]; 11567ca4b752SRichard Henderson 11577ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 1158c896fe29Sbellard ts->type = TCG_TYPE_I32; 1159b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 1160c896fe29Sbellard ts->mem_allocated = 1; 1161b3a62939SRichard Henderson ts->mem_base = base_ts; 11627ca4b752SRichard Henderson ts->mem_offset = offset + bigendian * 4; 1163c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 1164c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 1165c896fe29Sbellard ts->name = strdup(buf); 1166c896fe29Sbellard 11677ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 11687ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 11697ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 1170b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 11717ca4b752SRichard Henderson ts2->mem_allocated = 1; 11727ca4b752SRichard Henderson 
ts2->mem_base = base_ts; 11737ca4b752SRichard Henderson ts2->mem_offset = offset + (1 - bigendian) * 4; 1174c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 1175c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 1176120c1084SRichard Henderson ts2->name = strdup(buf); 11777ca4b752SRichard Henderson } else { 1178c896fe29Sbellard ts->base_type = type; 1179c896fe29Sbellard ts->type = type; 1180b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 1181c896fe29Sbellard ts->mem_allocated = 1; 1182b3a62939SRichard Henderson ts->mem_base = base_ts; 1183c896fe29Sbellard ts->mem_offset = offset; 1184c896fe29Sbellard ts->name = name; 1185c896fe29Sbellard } 1186085272b3SRichard Henderson return ts; 1187c896fe29Sbellard } 1188c896fe29Sbellard 11895bfa8034SRichard Henderson TCGTemp *tcg_temp_new_internal(TCGType type, bool temp_local) 1190c896fe29Sbellard { 1191b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 1192c896fe29Sbellard TCGTemp *ts; 1193641d5fbeSbellard int idx, k; 1194c896fe29Sbellard 11950ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 11960ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 11970ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 11980ec9eabcSRichard Henderson /* There is already an available temp with the right type. 
*/ 11990ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 12000ec9eabcSRichard Henderson 1201e8996ee0Sbellard ts = &s->temps[idx]; 1202e8996ee0Sbellard ts->temp_allocated = 1; 12037ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 12047ca4b752SRichard Henderson tcg_debug_assert(ts->temp_local == temp_local); 1205e8996ee0Sbellard } else { 12067ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 12077ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 12087ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 12097ca4b752SRichard Henderson 1210c896fe29Sbellard ts->base_type = type; 1211c896fe29Sbellard ts->type = TCG_TYPE_I32; 1212e8996ee0Sbellard ts->temp_allocated = 1; 1213641d5fbeSbellard ts->temp_local = temp_local; 12147ca4b752SRichard Henderson 12157ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 12167ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 12177ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 12187ca4b752SRichard Henderson ts2->temp_allocated = 1; 12197ca4b752SRichard Henderson ts2->temp_local = temp_local; 12207ca4b752SRichard Henderson } else { 1221c896fe29Sbellard ts->base_type = type; 1222c896fe29Sbellard ts->type = type; 1223e8996ee0Sbellard ts->temp_allocated = 1; 1224641d5fbeSbellard ts->temp_local = temp_local; 1225c896fe29Sbellard } 1226e8996ee0Sbellard } 122727bfd83cSPeter Maydell 122827bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 122927bfd83cSPeter Maydell s->temps_in_use++; 123027bfd83cSPeter Maydell #endif 1231085272b3SRichard Henderson return ts; 1232c896fe29Sbellard } 1233c896fe29Sbellard 1234d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type) 1235d2fd745fSRichard Henderson { 1236d2fd745fSRichard Henderson TCGTemp *t; 1237d2fd745fSRichard Henderson 1238d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG 1239d2fd745fSRichard Henderson switch (type) { 1240d2fd745fSRichard Henderson case TCG_TYPE_V64: 1241d2fd745fSRichard Henderson 
assert(TCG_TARGET_HAS_v64); 1242d2fd745fSRichard Henderson break; 1243d2fd745fSRichard Henderson case TCG_TYPE_V128: 1244d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v128); 1245d2fd745fSRichard Henderson break; 1246d2fd745fSRichard Henderson case TCG_TYPE_V256: 1247d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v256); 1248d2fd745fSRichard Henderson break; 1249d2fd745fSRichard Henderson default: 1250d2fd745fSRichard Henderson g_assert_not_reached(); 1251d2fd745fSRichard Henderson } 1252d2fd745fSRichard Henderson #endif 1253d2fd745fSRichard Henderson 1254d2fd745fSRichard Henderson t = tcg_temp_new_internal(type, 0); 1255d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1256d2fd745fSRichard Henderson } 1257d2fd745fSRichard Henderson 1258d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp. */ 1259d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match) 1260d2fd745fSRichard Henderson { 1261d2fd745fSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 1262d2fd745fSRichard Henderson 1263d2fd745fSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 1264d2fd745fSRichard Henderson 1265d2fd745fSRichard Henderson t = tcg_temp_new_internal(t->base_type, 0); 1266d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1267d2fd745fSRichard Henderson } 1268d2fd745fSRichard Henderson 12695bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts) 1270c896fe29Sbellard { 1271b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 1272085272b3SRichard Henderson int k, idx; 1273c896fe29Sbellard 127427bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 127527bfd83cSPeter Maydell s->temps_in_use--; 127627bfd83cSPeter Maydell if (s->temps_in_use < 0) { 127727bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 127827bfd83cSPeter Maydell } 127927bfd83cSPeter Maydell #endif 128027bfd83cSPeter Maydell 1281085272b3SRichard Henderson tcg_debug_assert(ts->temp_global == 0); 1282eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 1283e8996ee0Sbellard ts->temp_allocated = 0; 12840ec9eabcSRichard Henderson 1285085272b3SRichard Henderson idx = temp_idx(ts); 128618d13fa2SAlexander Graf k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0); 12870ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 1288e8996ee0Sbellard } 1289e8996ee0Sbellard 1290a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 1291a7812ae4Spbrook { 1292a7812ae4Spbrook TCGv_i32 t0; 1293a7812ae4Spbrook t0 = tcg_temp_new_i32(); 1294e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 1295e8996ee0Sbellard return t0; 1296c896fe29Sbellard } 1297c896fe29Sbellard 1298a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 1299c896fe29Sbellard { 1300a7812ae4Spbrook TCGv_i64 t0; 1301a7812ae4Spbrook t0 = tcg_temp_new_i64(); 1302e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 1303e8996ee0Sbellard return t0; 1304c896fe29Sbellard } 1305c896fe29Sbellard 1306a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 1307bdffd4a9Saurel32 { 1308a7812ae4Spbrook TCGv_i32 t0; 1309a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 1310bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 1311bdffd4a9Saurel32 return t0; 1312bdffd4a9Saurel32 } 1313bdffd4a9Saurel32 1314a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 1315bdffd4a9Saurel32 { 1316a7812ae4Spbrook TCGv_i64 t0; 1317a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 1318bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 1319bdffd4a9Saurel32 return t0; 
1320bdffd4a9Saurel32 } 1321bdffd4a9Saurel32 132227bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 132327bfd83cSPeter Maydell void tcg_clear_temp_count(void) 132427bfd83cSPeter Maydell { 1325b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 132627bfd83cSPeter Maydell s->temps_in_use = 0; 132727bfd83cSPeter Maydell } 132827bfd83cSPeter Maydell 132927bfd83cSPeter Maydell int tcg_check_temp_count(void) 133027bfd83cSPeter Maydell { 1331b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 133227bfd83cSPeter Maydell if (s->temps_in_use) { 133327bfd83cSPeter Maydell /* Clear the count so that we don't give another 133427bfd83cSPeter Maydell * warning immediately next time around. 133527bfd83cSPeter Maydell */ 133627bfd83cSPeter Maydell s->temps_in_use = 0; 133727bfd83cSPeter Maydell return 1; 133827bfd83cSPeter Maydell } 133927bfd83cSPeter Maydell return 0; 134027bfd83cSPeter Maydell } 134127bfd83cSPeter Maydell #endif 134227bfd83cSPeter Maydell 1343be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream. 1344be0f34b5SRichard Henderson Test the runtime variable that controls each opcode. 
*/ 1345be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 1346be0f34b5SRichard Henderson { 1347d2fd745fSRichard Henderson const bool have_vec 1348d2fd745fSRichard Henderson = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256; 1349d2fd745fSRichard Henderson 1350be0f34b5SRichard Henderson switch (op) { 1351be0f34b5SRichard Henderson case INDEX_op_discard: 1352be0f34b5SRichard Henderson case INDEX_op_set_label: 1353be0f34b5SRichard Henderson case INDEX_op_call: 1354be0f34b5SRichard Henderson case INDEX_op_br: 1355be0f34b5SRichard Henderson case INDEX_op_mb: 1356be0f34b5SRichard Henderson case INDEX_op_insn_start: 1357be0f34b5SRichard Henderson case INDEX_op_exit_tb: 1358be0f34b5SRichard Henderson case INDEX_op_goto_tb: 1359be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 1360be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 1361be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 1362be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 1363be0f34b5SRichard Henderson return true; 1364be0f34b5SRichard Henderson 1365be0f34b5SRichard Henderson case INDEX_op_goto_ptr: 1366be0f34b5SRichard Henderson return TCG_TARGET_HAS_goto_ptr; 1367be0f34b5SRichard Henderson 1368be0f34b5SRichard Henderson case INDEX_op_mov_i32: 1369be0f34b5SRichard Henderson case INDEX_op_movi_i32: 1370be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 1371be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 1372be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 1373be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 1374be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 1375be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 1376be0f34b5SRichard Henderson case INDEX_op_ld_i32: 1377be0f34b5SRichard Henderson case INDEX_op_st8_i32: 1378be0f34b5SRichard Henderson case INDEX_op_st16_i32: 1379be0f34b5SRichard Henderson case INDEX_op_st_i32: 1380be0f34b5SRichard Henderson case INDEX_op_add_i32: 1381be0f34b5SRichard Henderson case INDEX_op_sub_i32: 1382be0f34b5SRichard 
Henderson case INDEX_op_mul_i32: 1383be0f34b5SRichard Henderson case INDEX_op_and_i32: 1384be0f34b5SRichard Henderson case INDEX_op_or_i32: 1385be0f34b5SRichard Henderson case INDEX_op_xor_i32: 1386be0f34b5SRichard Henderson case INDEX_op_shl_i32: 1387be0f34b5SRichard Henderson case INDEX_op_shr_i32: 1388be0f34b5SRichard Henderson case INDEX_op_sar_i32: 1389be0f34b5SRichard Henderson return true; 1390be0f34b5SRichard Henderson 1391be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 1392be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 1393be0f34b5SRichard Henderson case INDEX_op_div_i32: 1394be0f34b5SRichard Henderson case INDEX_op_divu_i32: 1395be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 1396be0f34b5SRichard Henderson case INDEX_op_rem_i32: 1397be0f34b5SRichard Henderson case INDEX_op_remu_i32: 1398be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 1399be0f34b5SRichard Henderson case INDEX_op_div2_i32: 1400be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 1401be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 1402be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 1403be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 1404be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 1405be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 1406be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 1407be0f34b5SRichard Henderson case INDEX_op_extract_i32: 1408be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 1409be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 1410be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 1411be0f34b5SRichard Henderson case INDEX_op_add2_i32: 1412be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 1413be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 1414be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 1415be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 1416be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 1417be0f34b5SRichard 
Henderson case INDEX_op_muls2_i32: 1418be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 1419be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 1420be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 1421be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 1422be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 1423be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 1424be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 1425be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 1426be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 1427be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 1428be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 1429be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 1430be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 1431be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 1432be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 1433be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 1434be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 1435be0f34b5SRichard Henderson case INDEX_op_not_i32: 1436be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 1437be0f34b5SRichard Henderson case INDEX_op_neg_i32: 1438be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 1439be0f34b5SRichard Henderson case INDEX_op_andc_i32: 1440be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 1441be0f34b5SRichard Henderson case INDEX_op_orc_i32: 1442be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 1443be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 1444be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 1445be0f34b5SRichard Henderson case INDEX_op_nand_i32: 1446be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 1447be0f34b5SRichard Henderson case INDEX_op_nor_i32: 1448be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 1449be0f34b5SRichard Henderson case INDEX_op_clz_i32: 1450be0f34b5SRichard Henderson return 
TCG_TARGET_HAS_clz_i32; 1451be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 1452be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 1453be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 1454be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 1455be0f34b5SRichard Henderson 1456be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 1457be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 1458be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 1459be0f34b5SRichard Henderson 1460be0f34b5SRichard Henderson case INDEX_op_mov_i64: 1461be0f34b5SRichard Henderson case INDEX_op_movi_i64: 1462be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 1463be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 1464be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 1465be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 1466be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 1467be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 1468be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 1469be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 1470be0f34b5SRichard Henderson case INDEX_op_ld_i64: 1471be0f34b5SRichard Henderson case INDEX_op_st8_i64: 1472be0f34b5SRichard Henderson case INDEX_op_st16_i64: 1473be0f34b5SRichard Henderson case INDEX_op_st32_i64: 1474be0f34b5SRichard Henderson case INDEX_op_st_i64: 1475be0f34b5SRichard Henderson case INDEX_op_add_i64: 1476be0f34b5SRichard Henderson case INDEX_op_sub_i64: 1477be0f34b5SRichard Henderson case INDEX_op_mul_i64: 1478be0f34b5SRichard Henderson case INDEX_op_and_i64: 1479be0f34b5SRichard Henderson case INDEX_op_or_i64: 1480be0f34b5SRichard Henderson case INDEX_op_xor_i64: 1481be0f34b5SRichard Henderson case INDEX_op_shl_i64: 1482be0f34b5SRichard Henderson case INDEX_op_shr_i64: 1483be0f34b5SRichard Henderson case INDEX_op_sar_i64: 1484be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 1485be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 1486be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 
1487be0f34b5SRichard Henderson 1488be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 1489be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 1490be0f34b5SRichard Henderson case INDEX_op_div_i64: 1491be0f34b5SRichard Henderson case INDEX_op_divu_i64: 1492be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 1493be0f34b5SRichard Henderson case INDEX_op_rem_i64: 1494be0f34b5SRichard Henderson case INDEX_op_remu_i64: 1495be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 1496be0f34b5SRichard Henderson case INDEX_op_div2_i64: 1497be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 1498be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 1499be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 1500be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 1501be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 1502be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 1503be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 1504be0f34b5SRichard Henderson case INDEX_op_extract_i64: 1505be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 1506be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 1507be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 1508be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 1509be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 1510be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 1511be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 1512be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 1513be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 1514be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 1515be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i64; 1516be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 1517be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 1518be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 1519be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 1520be0f34b5SRichard Henderson case 
INDEX_op_ext16u_i64: 1521be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 1522be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 1523be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 1524be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 1525be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 1526be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 1527be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 1528be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 1529be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 1530be0f34b5SRichard Henderson case INDEX_op_not_i64: 1531be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 1532be0f34b5SRichard Henderson case INDEX_op_neg_i64: 1533be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 1534be0f34b5SRichard Henderson case INDEX_op_andc_i64: 1535be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 1536be0f34b5SRichard Henderson case INDEX_op_orc_i64: 1537be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 1538be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 1539be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 1540be0f34b5SRichard Henderson case INDEX_op_nand_i64: 1541be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 1542be0f34b5SRichard Henderson case INDEX_op_nor_i64: 1543be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 1544be0f34b5SRichard Henderson case INDEX_op_clz_i64: 1545be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 1546be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 1547be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 1548be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 1549be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 1550be0f34b5SRichard Henderson case INDEX_op_add2_i64: 1551be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 1552be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 1553be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 
1554be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 1555be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 1556be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 1557be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 1558be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 1559be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 1560be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 1561be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 1562be0f34b5SRichard Henderson 1563d2fd745fSRichard Henderson case INDEX_op_mov_vec: 1564d2fd745fSRichard Henderson case INDEX_op_dup_vec: 1565d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 1566d2fd745fSRichard Henderson case INDEX_op_ld_vec: 1567d2fd745fSRichard Henderson case INDEX_op_st_vec: 1568d2fd745fSRichard Henderson case INDEX_op_add_vec: 1569d2fd745fSRichard Henderson case INDEX_op_sub_vec: 1570d2fd745fSRichard Henderson case INDEX_op_and_vec: 1571d2fd745fSRichard Henderson case INDEX_op_or_vec: 1572d2fd745fSRichard Henderson case INDEX_op_xor_vec: 1573212be173SRichard Henderson case INDEX_op_cmp_vec: 1574d2fd745fSRichard Henderson return have_vec; 1575d2fd745fSRichard Henderson case INDEX_op_dup2_vec: 1576d2fd745fSRichard Henderson return have_vec && TCG_TARGET_REG_BITS == 32; 1577d2fd745fSRichard Henderson case INDEX_op_not_vec: 1578d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_not_vec; 1579d2fd745fSRichard Henderson case INDEX_op_neg_vec: 1580d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_neg_vec; 1581d2fd745fSRichard Henderson case INDEX_op_andc_vec: 1582d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_andc_vec; 1583d2fd745fSRichard Henderson case INDEX_op_orc_vec: 1584d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_orc_vec; 15853774030aSRichard Henderson case INDEX_op_mul_vec: 15863774030aSRichard Henderson return have_vec && TCG_TARGET_HAS_mul_vec; 1587d0ec9796SRichard Henderson case INDEX_op_shli_vec: 
1588d0ec9796SRichard Henderson case INDEX_op_shri_vec: 1589d0ec9796SRichard Henderson case INDEX_op_sari_vec: 1590d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shi_vec; 1591d0ec9796SRichard Henderson case INDEX_op_shls_vec: 1592d0ec9796SRichard Henderson case INDEX_op_shrs_vec: 1593d0ec9796SRichard Henderson case INDEX_op_sars_vec: 1594d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shs_vec; 1595d0ec9796SRichard Henderson case INDEX_op_shlv_vec: 1596d0ec9796SRichard Henderson case INDEX_op_shrv_vec: 1597d0ec9796SRichard Henderson case INDEX_op_sarv_vec: 1598d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shv_vec; 1599d2fd745fSRichard Henderson 1600db432672SRichard Henderson default: 1601db432672SRichard Henderson tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS); 1602db432672SRichard Henderson return true; 1603be0f34b5SRichard Henderson } 1604be0f34b5SRichard Henderson } 1605be0f34b5SRichard Henderson 160639cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 160739cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 160839cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 1609ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args) 1610c896fe29Sbellard { 161175e8b9b7SRichard Henderson int i, real_args, nb_rets, pi; 1612bbb8a1b4SRichard Henderson unsigned sizemask, flags; 1613afb49896SRichard Henderson TCGHelperInfo *info; 161475e8b9b7SRichard Henderson TCGOp *op; 1615afb49896SRichard Henderson 1616619205fdSEmilio G. 
Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 1617bbb8a1b4SRichard Henderson flags = info->flags; 1618bbb8a1b4SRichard Henderson sizemask = info->sizemask; 16192bece2c8SRichard Henderson 162034b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 162134b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 162234b1a49cSRichard Henderson /* We have 64-bit values in one register, but need to pass as two 162334b1a49cSRichard Henderson separate parameters. Split them. */ 162434b1a49cSRichard Henderson int orig_sizemask = sizemask; 162534b1a49cSRichard Henderson int orig_nargs = nargs; 162634b1a49cSRichard Henderson TCGv_i64 retl, reth; 1627ae8b75dcSRichard Henderson TCGTemp *split_args[MAX_OPC_PARAM]; 162834b1a49cSRichard Henderson 1629f764718dSRichard Henderson retl = NULL; 1630f764718dSRichard Henderson reth = NULL; 163134b1a49cSRichard Henderson if (sizemask != 0) { 163234b1a49cSRichard Henderson for (i = real_args = 0; i < nargs; ++i) { 163334b1a49cSRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 163434b1a49cSRichard Henderson if (is_64bit) { 1635085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 163634b1a49cSRichard Henderson TCGv_i32 h = tcg_temp_new_i32(); 163734b1a49cSRichard Henderson TCGv_i32 l = tcg_temp_new_i32(); 163834b1a49cSRichard Henderson tcg_gen_extr_i64_i32(l, h, orig); 1639ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(h); 1640ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(l); 164134b1a49cSRichard Henderson } else { 164234b1a49cSRichard Henderson split_args[real_args++] = args[i]; 164334b1a49cSRichard Henderson } 164434b1a49cSRichard Henderson } 164534b1a49cSRichard Henderson nargs = real_args; 164634b1a49cSRichard Henderson args = split_args; 164734b1a49cSRichard Henderson sizemask = 0; 164834b1a49cSRichard Henderson } 164934b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 16502bece2c8SRichard 
Henderson for (i = 0; i < nargs; ++i) { 16512bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 16522bece2c8SRichard Henderson int is_signed = sizemask & (2 << (i+1)*2); 16532bece2c8SRichard Henderson if (!is_64bit) { 16542bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 1655085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 16562bece2c8SRichard Henderson if (is_signed) { 16572bece2c8SRichard Henderson tcg_gen_ext32s_i64(temp, orig); 16582bece2c8SRichard Henderson } else { 16592bece2c8SRichard Henderson tcg_gen_ext32u_i64(temp, orig); 16602bece2c8SRichard Henderson } 1661ae8b75dcSRichard Henderson args[i] = tcgv_i64_temp(temp); 16622bece2c8SRichard Henderson } 16632bece2c8SRichard Henderson } 16642bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 16652bece2c8SRichard Henderson 166615fa08f8SRichard Henderson op = tcg_emit_op(INDEX_op_call); 166775e8b9b7SRichard Henderson 166875e8b9b7SRichard Henderson pi = 0; 1669ae8b75dcSRichard Henderson if (ret != NULL) { 167034b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 167134b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 167234b1a49cSRichard Henderson if (orig_sizemask & 1) { 167334b1a49cSRichard Henderson /* The 32-bit ABI is going to return the 64-bit value in 167434b1a49cSRichard Henderson the %o0/%o1 register pair. Prepare for this by using 167534b1a49cSRichard Henderson two return temporaries, and reassemble below. 
*/ 167634b1a49cSRichard Henderson retl = tcg_temp_new_i64(); 167734b1a49cSRichard Henderson reth = tcg_temp_new_i64(); 1678ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(reth); 1679ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(retl); 168034b1a49cSRichard Henderson nb_rets = 2; 168134b1a49cSRichard Henderson } else { 1682ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 168334b1a49cSRichard Henderson nb_rets = 1; 168434b1a49cSRichard Henderson } 168534b1a49cSRichard Henderson #else 168634b1a49cSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) { 168702eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 1688ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1689ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1690a7812ae4Spbrook #else 1691ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1692ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1693a7812ae4Spbrook #endif 1694a7812ae4Spbrook nb_rets = 2; 169534b1a49cSRichard Henderson } else { 1696ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1697a7812ae4Spbrook nb_rets = 1; 1698a7812ae4Spbrook } 169934b1a49cSRichard Henderson #endif 1700a7812ae4Spbrook } else { 1701a7812ae4Spbrook nb_rets = 0; 1702a7812ae4Spbrook } 1703cd9090aaSRichard Henderson TCGOP_CALLO(op) = nb_rets; 170475e8b9b7SRichard Henderson 1705a7812ae4Spbrook real_args = 0; 1706a7812ae4Spbrook for (i = 0; i < nargs; i++) { 17072bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 1708bbb8a1b4SRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 170939cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS 171039cf05d3Sbellard /* some targets want aligned 64 bit args */ 1711ebd486d5Smalc if (real_args & 1) { 171275e8b9b7SRichard Henderson op->args[pi++] = TCG_CALL_DUMMY_ARG; 1713ebd486d5Smalc real_args++; 171439cf05d3Sbellard } 171539cf05d3Sbellard #endif 17163f90f252SRichard Henderson /* If stack grows up, then we will be placing 
successive 17173f90f252SRichard Henderson arguments at lower addresses, which means we need to 17183f90f252SRichard Henderson reverse the order compared to how we would normally 17193f90f252SRichard Henderson treat either big or little-endian. For those arguments 17203f90f252SRichard Henderson that will wind up in registers, this still works for 17213f90f252SRichard Henderson HPPA (the only current STACK_GROWSUP target) since the 17223f90f252SRichard Henderson argument registers are *also* allocated in decreasing 17233f90f252SRichard Henderson order. If another such target is added, this logic may 17243f90f252SRichard Henderson have to get more complicated to differentiate between 17253f90f252SRichard Henderson stack arguments and register arguments. */ 172602eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP) 1727ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1728ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1729c896fe29Sbellard #else 1730ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1731ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1732c896fe29Sbellard #endif 1733a7812ae4Spbrook real_args += 2; 17342bece2c8SRichard Henderson continue; 17352bece2c8SRichard Henderson } 17362bece2c8SRichard Henderson 1737ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1738a7812ae4Spbrook real_args++; 1739c896fe29Sbellard } 174075e8b9b7SRichard Henderson op->args[pi++] = (uintptr_t)func; 174175e8b9b7SRichard Henderson op->args[pi++] = flags; 1742cd9090aaSRichard Henderson TCGOP_CALLI(op) = real_args; 1743a7812ae4Spbrook 174475e8b9b7SRichard Henderson /* Make sure the fields didn't overflow. 
*/ 1745cd9090aaSRichard Henderson tcg_debug_assert(TCGOP_CALLI(op) == real_args); 174675e8b9b7SRichard Henderson tcg_debug_assert(pi <= ARRAY_SIZE(op->args)); 17472bece2c8SRichard Henderson 174834b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 174934b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 175034b1a49cSRichard Henderson /* Free all of the parts we allocated above. */ 175134b1a49cSRichard Henderson for (i = real_args = 0; i < orig_nargs; ++i) { 175234b1a49cSRichard Henderson int is_64bit = orig_sizemask & (1 << (i+1)*2); 175334b1a49cSRichard Henderson if (is_64bit) { 1754085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 1755085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 175634b1a49cSRichard Henderson } else { 175734b1a49cSRichard Henderson real_args++; 175834b1a49cSRichard Henderson } 175934b1a49cSRichard Henderson } 176034b1a49cSRichard Henderson if (orig_sizemask & 1) { 176134b1a49cSRichard Henderson /* The 32-bit ABI returned two 32-bit pieces. Re-assemble them. 176234b1a49cSRichard Henderson Note that describing these as TCGv_i64 eliminates an unnecessary 176334b1a49cSRichard Henderson zero-extension that tcg_gen_concat_i32_i64 would create. 
*/ 1764085272b3SRichard Henderson tcg_gen_concat32_i64(temp_tcgv_i64(ret), retl, reth); 176534b1a49cSRichard Henderson tcg_temp_free_i64(retl); 176634b1a49cSRichard Henderson tcg_temp_free_i64(reth); 176734b1a49cSRichard Henderson } 176834b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 17692bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 17702bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 17712bece2c8SRichard Henderson if (!is_64bit) { 1772085272b3SRichard Henderson tcg_temp_free_internal(args[i]); 17732bece2c8SRichard Henderson } 17742bece2c8SRichard Henderson } 17752bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1776a7812ae4Spbrook } 1777c896fe29Sbellard 17788fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1779c896fe29Sbellard { 1780ac3b8891SRichard Henderson int i, n; 1781c896fe29Sbellard TCGTemp *ts; 1782ac3b8891SRichard Henderson 1783ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 1784c896fe29Sbellard ts = &s->temps[i]; 1785ac3b8891SRichard Henderson ts->val_type = (ts->fixed_reg ? TEMP_VAL_REG : TEMP_VAL_MEM); 1786c896fe29Sbellard } 1787ac3b8891SRichard Henderson for (n = s->nb_temps; i < n; i++) { 1788e8996ee0Sbellard ts = &s->temps[i]; 1789ac3b8891SRichard Henderson ts->val_type = (ts->temp_local ? 
TEMP_VAL_MEM : TEMP_VAL_DEAD); 1790e8996ee0Sbellard ts->mem_allocated = 0; 1791e8996ee0Sbellard ts->fixed_reg = 0; 1792e8996ee0Sbellard } 1793f8b2f202SRichard Henderson 1794f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1795c896fe29Sbellard } 1796c896fe29Sbellard 1797f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1798f8b2f202SRichard Henderson TCGTemp *ts) 1799c896fe29Sbellard { 18001807f4c4SRichard Henderson int idx = temp_idx(ts); 1801ac56dd48Spbrook 1802fa477d25SRichard Henderson if (ts->temp_global) { 1803ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1804f8b2f202SRichard Henderson } else if (ts->temp_local) { 1805641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1806f8b2f202SRichard Henderson } else { 1807ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1808c896fe29Sbellard } 1809c896fe29Sbellard return buf; 1810c896fe29Sbellard } 1811c896fe29Sbellard 181243439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf, 181343439139SRichard Henderson int buf_size, TCGArg arg) 1814f8b2f202SRichard Henderson { 181543439139SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg)); 1816f8b2f202SRichard Henderson } 1817f8b2f202SRichard Henderson 18186e085f72SRichard Henderson /* Find helper name. */ 18196e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val) 1820e8996ee0Sbellard { 18216e085f72SRichard Henderson const char *ret = NULL; 1822619205fdSEmilio G. Cota if (helper_table) { 1823619205fdSEmilio G. 
Cota TCGHelperInfo *info = g_hash_table_lookup(helper_table, (gpointer)val); 182472866e82SRichard Henderson if (info) { 182572866e82SRichard Henderson ret = info->name; 182672866e82SRichard Henderson } 1827e8996ee0Sbellard } 18286e085f72SRichard Henderson return ret; 18294dc81f28Sbellard } 18304dc81f28Sbellard 1831f48f3edeSblueswir1 static const char * const cond_name[] = 1832f48f3edeSblueswir1 { 18330aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 18340aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1835f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1836f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1837f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1838f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1839f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1840f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1841f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1842f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1843f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1844f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1845f48f3edeSblueswir1 }; 1846f48f3edeSblueswir1 1847f713d6adSRichard Henderson static const char * const ldst_name[] = 1848f713d6adSRichard Henderson { 1849f713d6adSRichard Henderson [MO_UB] = "ub", 1850f713d6adSRichard Henderson [MO_SB] = "sb", 1851f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1852f713d6adSRichard Henderson [MO_LESW] = "lesw", 1853f713d6adSRichard Henderson [MO_LEUL] = "leul", 1854f713d6adSRichard Henderson [MO_LESL] = "lesl", 1855f713d6adSRichard Henderson [MO_LEQ] = "leq", 1856f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1857f713d6adSRichard Henderson [MO_BESW] = "besw", 1858f713d6adSRichard Henderson [MO_BEUL] = "beul", 1859f713d6adSRichard Henderson [MO_BESL] = "besl", 1860f713d6adSRichard Henderson [MO_BEQ] = "beq", 1861f713d6adSRichard Henderson }; 1862f713d6adSRichard Henderson 18631f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 18641f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY 18651f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = 
"un+", 18661f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 18671f00b27fSSergey Sorokin #else 18681f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 18691f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 18701f00b27fSSergey Sorokin #endif 18711f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 18721f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 18731f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 18741f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 18751f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 18761f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 18771f00b27fSSergey Sorokin }; 18781f00b27fSSergey Sorokin 1879eeacee4dSBlue Swirl void tcg_dump_ops(TCGContext *s) 1880c896fe29Sbellard { 1881c896fe29Sbellard char buf[128]; 1882c45cb8bbSRichard Henderson TCGOp *op; 1883c896fe29Sbellard 188415fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 1885c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1886c45cb8bbSRichard Henderson const TCGOpDef *def; 1887c45cb8bbSRichard Henderson TCGOpcode c; 1888bdfb460eSRichard Henderson int col = 0; 1889c45cb8bbSRichard Henderson 1890c45cb8bbSRichard Henderson c = op->opc; 1891c896fe29Sbellard def = &tcg_op_defs[c]; 1892c45cb8bbSRichard Henderson 1893765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 189415fa08f8SRichard Henderson col += qemu_log("\n ----"); 18959aef40edSRichard Henderson 18969aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 18979aef40edSRichard Henderson target_ulong a; 18987e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 1899efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 19007e4597d7Sbellard #else 1901efee3746SRichard Henderson a = op->args[i]; 19027e4597d7Sbellard #endif 1903bdfb460eSRichard Henderson col += qemu_log(" " TARGET_FMT_lx, a); 1904eeacee4dSBlue Swirl } 19057e4597d7Sbellard } else if (c == INDEX_op_call) { 
1906c896fe29Sbellard /* variable number of arguments */ 1907cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 1908cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 1909c896fe29Sbellard nb_cargs = def->nb_cargs; 1910b03cce8eSbellard 1911cf066674SRichard Henderson /* function name, flags, out args */ 1912bdfb460eSRichard Henderson col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name, 1913efee3746SRichard Henderson tcg_find_helper(s, op->args[nb_oargs + nb_iargs]), 1914efee3746SRichard Henderson op->args[nb_oargs + nb_iargs + 1], nb_oargs); 1915b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 191643439139SRichard Henderson col += qemu_log(",%s", tcg_get_arg_str(s, buf, sizeof(buf), 1917efee3746SRichard Henderson op->args[i])); 1918b03cce8eSbellard } 1919cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1920efee3746SRichard Henderson TCGArg arg = op->args[nb_oargs + i]; 1921cf066674SRichard Henderson const char *t = "<dummy>"; 1922cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 192343439139SRichard Henderson t = tcg_get_arg_str(s, buf, sizeof(buf), arg); 1924b03cce8eSbellard } 1925bdfb460eSRichard Henderson col += qemu_log(",%s", t); 1926e8996ee0Sbellard } 1927b03cce8eSbellard } else { 1928bdfb460eSRichard Henderson col += qemu_log(" %s ", def->name); 1929c45cb8bbSRichard Henderson 1930c896fe29Sbellard nb_oargs = def->nb_oargs; 1931c896fe29Sbellard nb_iargs = def->nb_iargs; 1932c896fe29Sbellard nb_cargs = def->nb_cargs; 1933c896fe29Sbellard 1934d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 1935d2fd745fSRichard Henderson col += qemu_log("v%d,e%d,", 64 << TCGOP_VECL(op), 1936d2fd745fSRichard Henderson 8 << TCGOP_VECE(op)); 1937d2fd745fSRichard Henderson } 1938d2fd745fSRichard Henderson 1939c896fe29Sbellard k = 0; 1940c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1941eeacee4dSBlue Swirl if (k != 0) { 1942bdfb460eSRichard Henderson col += qemu_log(","); 1943eeacee4dSBlue Swirl } 194443439139SRichard Henderson col += 
qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1945efee3746SRichard Henderson op->args[k++])); 1946c896fe29Sbellard } 1947c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1948eeacee4dSBlue Swirl if (k != 0) { 1949bdfb460eSRichard Henderson col += qemu_log(","); 1950eeacee4dSBlue Swirl } 195143439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1952efee3746SRichard Henderson op->args[k++])); 1953c896fe29Sbellard } 1954be210acbSRichard Henderson switch (c) { 1955be210acbSRichard Henderson case INDEX_op_brcond_i32: 1956ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1957ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1958be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1959be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1960ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1961be210acbSRichard Henderson case INDEX_op_setcond_i64: 1962ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1963212be173SRichard Henderson case INDEX_op_cmp_vec: 1964efee3746SRichard Henderson if (op->args[k] < ARRAY_SIZE(cond_name) 1965efee3746SRichard Henderson && cond_name[op->args[k]]) { 1966efee3746SRichard Henderson col += qemu_log(",%s", cond_name[op->args[k++]]); 1967eeacee4dSBlue Swirl } else { 1968efee3746SRichard Henderson col += qemu_log(",$0x%" TCG_PRIlx, op->args[k++]); 1969eeacee4dSBlue Swirl } 1970f48f3edeSblueswir1 i = 1; 1971be210acbSRichard Henderson break; 1972f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1973f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 1974f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 1975f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 197659227d5dSRichard Henderson { 1977efee3746SRichard Henderson TCGMemOpIdx oi = op->args[k++]; 197859227d5dSRichard Henderson TCGMemOp op = get_memop(oi); 197959227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 198059227d5dSRichard Henderson 198159c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 
1982bdfb460eSRichard Henderson col += qemu_log(",$0x%x,%u", op, ix); 198359c4b7e8SRichard Henderson } else { 19841f00b27fSSergey Sorokin const char *s_al, *s_op; 19851f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 198659c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 1987bdfb460eSRichard Henderson col += qemu_log(",%s%s,%u", s_al, s_op, ix); 1988f713d6adSRichard Henderson } 1989f713d6adSRichard Henderson i = 1; 199059227d5dSRichard Henderson } 1991f713d6adSRichard Henderson break; 1992be210acbSRichard Henderson default: 1993f48f3edeSblueswir1 i = 0; 1994be210acbSRichard Henderson break; 1995be210acbSRichard Henderson } 199651e3972cSRichard Henderson switch (c) { 199751e3972cSRichard Henderson case INDEX_op_set_label: 199851e3972cSRichard Henderson case INDEX_op_br: 199951e3972cSRichard Henderson case INDEX_op_brcond_i32: 200051e3972cSRichard Henderson case INDEX_op_brcond_i64: 200151e3972cSRichard Henderson case INDEX_op_brcond2_i32: 2002efee3746SRichard Henderson col += qemu_log("%s$L%d", k ? "," : "", 2003efee3746SRichard Henderson arg_label(op->args[k])->id); 200451e3972cSRichard Henderson i++, k++; 200551e3972cSRichard Henderson break; 200651e3972cSRichard Henderson default: 200751e3972cSRichard Henderson break; 2008eeacee4dSBlue Swirl } 200951e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 2010efee3746SRichard Henderson col += qemu_log("%s$0x%" TCG_PRIlx, k ? 
"," : "", op->args[k]); 2011bdfb460eSRichard Henderson } 2012bdfb460eSRichard Henderson } 2013bdfb460eSRichard Henderson if (op->life) { 2014bdfb460eSRichard Henderson unsigned life = op->life; 2015bdfb460eSRichard Henderson 2016bdfb460eSRichard Henderson for (; col < 48; ++col) { 2017bdfb460eSRichard Henderson putc(' ', qemu_logfile); 2018bdfb460eSRichard Henderson } 2019bdfb460eSRichard Henderson 2020bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 2021bdfb460eSRichard Henderson qemu_log(" sync:"); 2022bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 2023bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 2024bdfb460eSRichard Henderson qemu_log(" %d", i); 2025bdfb460eSRichard Henderson } 2026bdfb460eSRichard Henderson } 2027bdfb460eSRichard Henderson } 2028bdfb460eSRichard Henderson life /= DEAD_ARG; 2029bdfb460eSRichard Henderson if (life) { 2030bdfb460eSRichard Henderson qemu_log(" dead:"); 2031bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 2032bdfb460eSRichard Henderson if (life & 1) { 2033bdfb460eSRichard Henderson qemu_log(" %d", i); 2034bdfb460eSRichard Henderson } 2035bdfb460eSRichard Henderson } 2036c896fe29Sbellard } 2037b03cce8eSbellard } 2038eeacee4dSBlue Swirl qemu_log("\n"); 2039c896fe29Sbellard } 2040c896fe29Sbellard } 2041c896fe29Sbellard 2042c896fe29Sbellard /* we give more priority to constraints with less registers */ 2043c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 2044c896fe29Sbellard { 2045c896fe29Sbellard const TCGArgConstraint *arg_ct; 2046c896fe29Sbellard 2047c896fe29Sbellard int i, n; 2048c896fe29Sbellard arg_ct = &def->args_ct[k]; 2049c896fe29Sbellard if (arg_ct->ct & TCG_CT_ALIAS) { 2050c896fe29Sbellard /* an alias is equivalent to a single register */ 2051c896fe29Sbellard n = 1; 2052c896fe29Sbellard } else { 2053c896fe29Sbellard if (!(arg_ct->ct & TCG_CT_REG)) 2054c896fe29Sbellard return 0; 2055c896fe29Sbellard n = 0; 2056c896fe29Sbellard for(i = 0; i < 
TCG_TARGET_NB_REGS; i++) { 2057c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, i)) 2058c896fe29Sbellard n++; 2059c896fe29Sbellard } 2060c896fe29Sbellard } 2061c896fe29Sbellard return TCG_TARGET_NB_REGS - n + 1; 2062c896fe29Sbellard } 2063c896fe29Sbellard 2064c896fe29Sbellard /* sort from highest priority to lowest */ 2065c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 2066c896fe29Sbellard { 2067c896fe29Sbellard int i, j, p1, p2, tmp; 2068c896fe29Sbellard 2069c896fe29Sbellard for(i = 0; i < n; i++) 2070c896fe29Sbellard def->sorted_args[start + i] = start + i; 2071c896fe29Sbellard if (n <= 1) 2072c896fe29Sbellard return; 2073c896fe29Sbellard for(i = 0; i < n - 1; i++) { 2074c896fe29Sbellard for(j = i + 1; j < n; j++) { 2075c896fe29Sbellard p1 = get_constraint_priority(def, def->sorted_args[start + i]); 2076c896fe29Sbellard p2 = get_constraint_priority(def, def->sorted_args[start + j]); 2077c896fe29Sbellard if (p1 < p2) { 2078c896fe29Sbellard tmp = def->sorted_args[start + i]; 2079c896fe29Sbellard def->sorted_args[start + i] = def->sorted_args[start + j]; 2080c896fe29Sbellard def->sorted_args[start + j] = tmp; 2081c896fe29Sbellard } 2082c896fe29Sbellard } 2083c896fe29Sbellard } 2084c896fe29Sbellard } 2085c896fe29Sbellard 2086f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 2087c896fe29Sbellard { 2088a9751609SRichard Henderson TCGOpcode op; 2089c896fe29Sbellard 2090f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 2091f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 2092f69d277eSRichard Henderson const TCGTargetOpDef *tdefs; 2093069ea736SRichard Henderson TCGType type; 2094069ea736SRichard Henderson int i, nb_args; 2095f69d277eSRichard Henderson 2096f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 2097f69d277eSRichard Henderson continue; 2098f69d277eSRichard Henderson } 2099f69d277eSRichard Henderson 2100c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 
2101f69d277eSRichard Henderson if (nb_args == 0) { 2102f69d277eSRichard Henderson continue; 2103f69d277eSRichard Henderson } 2104f69d277eSRichard Henderson 2105f69d277eSRichard Henderson tdefs = tcg_target_op_def(op); 2106f69d277eSRichard Henderson /* Missing TCGTargetOpDef entry. */ 2107f69d277eSRichard Henderson tcg_debug_assert(tdefs != NULL); 2108f69d277eSRichard Henderson 2109069ea736SRichard Henderson type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32); 2110c896fe29Sbellard for (i = 0; i < nb_args; i++) { 2111f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 2112f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 2113eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 2114f69d277eSRichard Henderson 2115ccb1bb66SRichard Henderson def->args_ct[i].u.regs = 0; 2116c896fe29Sbellard def->args_ct[i].ct = 0; 211717280ff4SRichard Henderson while (*ct_str != '\0') { 211817280ff4SRichard Henderson switch(*ct_str) { 211917280ff4SRichard Henderson case '0' ... '9': 212017280ff4SRichard Henderson { 212117280ff4SRichard Henderson int oarg = *ct_str - '0'; 212217280ff4SRichard Henderson tcg_debug_assert(ct_str == tdefs->args_ct_str[i]); 2123eabb7b91SAurelien Jarno tcg_debug_assert(oarg < def->nb_oargs); 2124eabb7b91SAurelien Jarno tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG); 212517280ff4SRichard Henderson /* TCG_CT_ALIAS is for the output arguments. 212617280ff4SRichard Henderson The input is tagged with TCG_CT_IALIAS. 
*/ 2127c896fe29Sbellard def->args_ct[i] = def->args_ct[oarg]; 212817280ff4SRichard Henderson def->args_ct[oarg].ct |= TCG_CT_ALIAS; 21295ff9d6a4Sbellard def->args_ct[oarg].alias_index = i; 2130c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_IALIAS; 21315ff9d6a4Sbellard def->args_ct[i].alias_index = oarg; 213217280ff4SRichard Henderson } 213317280ff4SRichard Henderson ct_str++; 2134c896fe29Sbellard break; 213582790a87SRichard Henderson case '&': 213682790a87SRichard Henderson def->args_ct[i].ct |= TCG_CT_NEWREG; 213782790a87SRichard Henderson ct_str++; 213882790a87SRichard Henderson break; 2139c896fe29Sbellard case 'i': 2140c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 2141c896fe29Sbellard ct_str++; 2142c896fe29Sbellard break; 2143c896fe29Sbellard default: 2144069ea736SRichard Henderson ct_str = target_parse_constraint(&def->args_ct[i], 2145069ea736SRichard Henderson ct_str, type); 2146f69d277eSRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 2147069ea736SRichard Henderson tcg_debug_assert(ct_str != NULL); 2148c896fe29Sbellard } 2149c896fe29Sbellard } 2150c896fe29Sbellard } 2151c896fe29Sbellard 2152c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? 
*/ 2153eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 2154c68aaa18SStefan Weil 2155c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 2156c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 2157c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 2158c896fe29Sbellard } 2159c896fe29Sbellard } 2160c896fe29Sbellard 21610c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 21620c627cdcSRichard Henderson { 216315fa08f8SRichard Henderson QTAILQ_REMOVE(&s->ops, op, link); 216415fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&s->free_ops, op, link); 2165abebf925SRichard Henderson s->nb_ops--; 21660c627cdcSRichard Henderson 21670c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 2168c3fac113SEmilio G. Cota atomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1); 21690c627cdcSRichard Henderson #endif 21700c627cdcSRichard Henderson } 21710c627cdcSRichard Henderson 217215fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc) 217315fa08f8SRichard Henderson { 217415fa08f8SRichard Henderson TCGContext *s = tcg_ctx; 217515fa08f8SRichard Henderson TCGOp *op; 217615fa08f8SRichard Henderson 217715fa08f8SRichard Henderson if (likely(QTAILQ_EMPTY(&s->free_ops))) { 217815fa08f8SRichard Henderson op = tcg_malloc(sizeof(TCGOp)); 217915fa08f8SRichard Henderson } else { 218015fa08f8SRichard Henderson op = QTAILQ_FIRST(&s->free_ops); 218115fa08f8SRichard Henderson QTAILQ_REMOVE(&s->free_ops, op, link); 218215fa08f8SRichard Henderson } 218315fa08f8SRichard Henderson memset(op, 0, offsetof(TCGOp, link)); 218415fa08f8SRichard Henderson op->opc = opc; 2185abebf925SRichard Henderson s->nb_ops++; 218615fa08f8SRichard Henderson 218715fa08f8SRichard Henderson return op; 218815fa08f8SRichard Henderson } 218915fa08f8SRichard Henderson 219015fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc) 219115fa08f8SRichard Henderson { 219215fa08f8SRichard Henderson TCGOp *op = 
tcg_op_alloc(opc); 219315fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link); 219415fa08f8SRichard Henderson return op; 219515fa08f8SRichard Henderson } 219615fa08f8SRichard Henderson 21975a18407fSRichard Henderson TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, 21985a18407fSRichard Henderson TCGOpcode opc, int nargs) 21995a18407fSRichard Henderson { 220015fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 220115fa08f8SRichard Henderson QTAILQ_INSERT_BEFORE(old_op, new_op, link); 22025a18407fSRichard Henderson return new_op; 22035a18407fSRichard Henderson } 22045a18407fSRichard Henderson 22055a18407fSRichard Henderson TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, 22065a18407fSRichard Henderson TCGOpcode opc, int nargs) 22075a18407fSRichard Henderson { 220815fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 220915fa08f8SRichard Henderson QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link); 22105a18407fSRichard Henderson return new_op; 22115a18407fSRichard Henderson } 22125a18407fSRichard Henderson 2213c70fbf0aSRichard Henderson #define TS_DEAD 1 2214c70fbf0aSRichard Henderson #define TS_MEM 2 2215c70fbf0aSRichard Henderson 22165a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 22175a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 22185a18407fSRichard Henderson 22199c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 22209c43b68dSAurelien Jarno should be in memory. 
*/ 2221b83eabeaSRichard Henderson static void tcg_la_func_end(TCGContext *s) 2222c896fe29Sbellard { 2223b83eabeaSRichard Henderson int ng = s->nb_globals; 2224b83eabeaSRichard Henderson int nt = s->nb_temps; 2225b83eabeaSRichard Henderson int i; 2226b83eabeaSRichard Henderson 2227b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2228b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2229b83eabeaSRichard Henderson } 2230b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2231b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD; 2232b83eabeaSRichard Henderson } 2233c896fe29Sbellard } 2234c896fe29Sbellard 22359c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 22369c43b68dSAurelien Jarno and local temps should be in memory. */ 2237b83eabeaSRichard Henderson static void tcg_la_bb_end(TCGContext *s) 2238641d5fbeSbellard { 2239b83eabeaSRichard Henderson int ng = s->nb_globals; 2240b83eabeaSRichard Henderson int nt = s->nb_temps; 2241b83eabeaSRichard Henderson int i; 2242641d5fbeSbellard 2243b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2244b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2245c70fbf0aSRichard Henderson } 2246b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2247b83eabeaSRichard Henderson s->temps[i].state = (s->temps[i].temp_local 2248b83eabeaSRichard Henderson ? TS_DEAD | TS_MEM 2249b83eabeaSRichard Henderson : TS_DEAD); 2250641d5fbeSbellard } 2251641d5fbeSbellard } 2252641d5fbeSbellard 2253a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 2254c896fe29Sbellard given input arguments is dead. Instructions updating dead 2255c896fe29Sbellard temporaries are removed. 
*/
static void liveness_pass_1(TCGContext *s)
{
    int nb_globals = s->nb_globals;
    TCGOp *op, *op_prev;

    /* Seed every temp with its end-of-function state. */
    tcg_la_func_end(s);

    /* Walk the ops from last to first; the _SAFE variant is needed
       because tcg_op_remove() may unlink the current op. */
    QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, TCGOpHead, link, op_prev) {
        int i, nb_iargs, nb_oargs;
        TCGOpcode opc_new, opc_new2;
        bool have_opc_new2;
        /* Bit set of DEAD_ARG / SYNC_ARG flags, stored in op->life below. */
        TCGLifeData arg_life = 0;
        TCGTemp *arg_ts;
        TCGOpcode opc = op->opc;
        const TCGOpDef *def = &tcg_op_defs[opc];

        switch (opc) {
        case INDEX_op_call:
            {
                int call_flags;

                /* Calls keep their arg counts in the op itself; the
                   flags word follows the function pointer argument. */
                nb_oargs = TCGOP_CALLO(op);
                nb_iargs = TCGOP_CALLI(op);
                call_flags = op->args[nb_oargs + nb_iargs + 1];

                /* pure functions can be removed if their result is unused */
                if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) {
                    for (i = 0; i < nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        if (arg_ts->state != TS_DEAD) {
                            goto do_not_remove_call;
                        }
                    }
                    /* do_remove lives in the default case below. */
                    goto do_remove;
                } else {
                do_not_remove_call:

                    /* output args are dead */
                    for (i = 0; i < nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        if (arg_ts->state & TS_DEAD) {
                            arg_life |= DEAD_ARG << i;
                        }
                        if (arg_ts->state & TS_MEM) {
                            arg_life |= SYNC_ARG << i;
                        }
                        arg_ts->state = TS_DEAD;
                    }

                    if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS |
                                        TCG_CALL_NO_READ_GLOBALS))) {
                        /* globals should go back to memory */
                        for (i = 0; i < nb_globals; i++) {
                            s->temps[i].state = TS_DEAD | TS_MEM;
                        }
                    } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) {
                        /* globals should be synced to memory */
                        for (i = 0; i < nb_globals; i++) {
                            s->temps[i].state |= TS_MEM;
                        }
                    }

                    /* record arguments that die in this helper */
                    for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        /* arg_temp() can yield NULL for call inputs. */
                        if (arg_ts && arg_ts->state & TS_DEAD) {
                            arg_life |= DEAD_ARG << i;
                        }
                    }
                    /* input arguments are live for preceding opcodes */
                    for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        if (arg_ts) {
                            arg_ts->state &= ~TS_DEAD;
                        }
                    }
                }
            }
            break;
        case INDEX_op_insn_start:
            /* No temps involved; nothing to track. */
            break;
        case INDEX_op_discard:
            /* mark the temporary as dead */
            arg_temp(op->args[0])->state = TS_DEAD;
            break;

        /* Double-word add/sub: pick the single-word opcode that
           replaces the op when its high half turns out to be unused. */
        case INDEX_op_add2_i32:
            opc_new = INDEX_op_add_i32;
            goto do_addsub2;
        case INDEX_op_sub2_i32:
            opc_new = INDEX_op_sub_i32;
            goto do_addsub2;
        case INDEX_op_add2_i64:
            opc_new = INDEX_op_add_i64;
            goto do_addsub2;
        case INDEX_op_sub2_i64:
            opc_new = INDEX_op_sub_i64;
        do_addsub2:
            nb_iargs = 4;
            nb_oargs = 2;
            /* Test if the high part of the operation is dead, but not
               the low part.  The result can be optimized to a simple
               add or sub.  This happens often for x86_64 guest when the
               cpu mode is set to 32 bit.  */
            if (arg_temp(op->args[1])->state == TS_DEAD) {
                if (arg_temp(op->args[0])->state == TS_DEAD) {
                    goto do_remove;
                }
                /* Replace the opcode and adjust the args in place,
                   leaving 3 unused args at the end.  */
                op->opc = opc = opc_new;
                op->args[1] = op->args[2];
                op->args[2] = op->args[4];
                /* Fall through and mark the single-word operation live.  */
                nb_iargs = 2;
                nb_oargs = 1;
            }
            goto do_not_remove;

        /* Double-word multiply: opc_new yields the low half, opc_new2
           the high half if the backend provides it (have_opc_new2). */
        case INDEX_op_mulu2_i32:
            opc_new = INDEX_op_mul_i32;
            opc_new2 = INDEX_op_muluh_i32;
            have_opc_new2 = TCG_TARGET_HAS_muluh_i32;
            goto do_mul2;
        case INDEX_op_muls2_i32:
            opc_new = INDEX_op_mul_i32;
            opc_new2 = INDEX_op_mulsh_i32;
            have_opc_new2 = TCG_TARGET_HAS_mulsh_i32;
            goto do_mul2;
        case INDEX_op_mulu2_i64:
            opc_new = INDEX_op_mul_i64;
            opc_new2 = INDEX_op_muluh_i64;
            have_opc_new2 = TCG_TARGET_HAS_muluh_i64;
            goto do_mul2;
        case INDEX_op_muls2_i64:
            opc_new = INDEX_op_mul_i64;
            opc_new2 = INDEX_op_mulsh_i64;
            have_opc_new2 = TCG_TARGET_HAS_mulsh_i64;
            goto do_mul2;
        do_mul2:
            nb_iargs = 2;
            nb_oargs = 2;
            if (arg_temp(op->args[1])->state == TS_DEAD) {
                if (arg_temp(op->args[0])->state == TS_DEAD) {
                    /* Both parts of the operation are dead.  */
                    goto do_remove;
                }
                /* The high part of the operation is dead; generate the low. */
                op->opc = opc = opc_new;
                op->args[1] = op->args[2];
                op->args[2] = op->args[3];
            } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) {
                /* The low part of the operation is dead; generate the high. */
                op->opc = opc = opc_new2;
                op->args[0] = op->args[1];
                op->args[1] = op->args[2];
                op->args[2] = op->args[3];
            } else {
                goto do_not_remove;
            }
            /* Mark the single-word operation live.  */
            nb_oargs = 1;
            goto do_not_remove;

        default:
            /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */
            nb_iargs = def->nb_iargs;
            nb_oargs = def->nb_oargs;

            /* Test if the operation can be removed because all
               its outputs are dead. We assume that nb_oargs == 0
               implies side effects */
            if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) {
                for (i = 0; i < nb_oargs; i++) {
                    if (arg_temp(op->args[i])->state != TS_DEAD) {
                        goto do_not_remove;
                    }
                }
            /* Also the target of the "goto do_remove" statements in
               the call, add2/sub2 and mul2 cases above. */
            do_remove:
                tcg_op_remove(s, op);
            } else {
            /* Also reached by goto from the add2/sub2 and mul2 cases,
               with nb_iargs / nb_oargs already set by them; def still
               refers to the opcode the op had on entry. */
            do_not_remove:
                /* output args are dead */
                for (i = 0; i < nb_oargs; i++) {
                    arg_ts = arg_temp(op->args[i]);
                    if (arg_ts->state & TS_DEAD) {
                        arg_life |= DEAD_ARG << i;
                    }
                    if (arg_ts->state & TS_MEM) {
                        arg_life |= SYNC_ARG << i;
                    }
                    arg_ts->state = TS_DEAD;
                }

                /* if end of basic block, update */
                if (def->flags & TCG_OPF_BB_END) {
                    tcg_la_bb_end(s);
                } else if (def->flags & TCG_OPF_SIDE_EFFECTS) {
                    /* globals should be synced to memory */
                    for (i = 0; i < nb_globals; i++) {
                        s->temps[i].state |= TS_MEM;
                    }
                }

                /* record arguments that die in this opcode */
                for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
                    arg_ts = arg_temp(op->args[i]);
                    if (arg_ts->state & TS_DEAD) {
                        arg_life |= DEAD_ARG << i;
                    }
                }
                /* input arguments are live for preceding opcodes */
                for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
                    arg_temp(op->args[i])->state &= ~TS_DEAD;
                }
            }
            break;
        }
        /* Stored even for an op that was just removed. */
        op->life = arg_life;
    }
}

/* Liveness analysis: Convert indirect regs to direct temporaries.  */
static bool liveness_pass_2(TCGContext *s)
{
    int nb_globals = s->nb_globals;
    int nb_temps, i;
    bool changes = false;
    TCGOp *op, *op_next;

    /* Create a temporary for each indirect global.  */
    for (i = 0; i < nb_globals; ++i) {
        TCGTemp *its = &s->temps[i];
        if (its->indirect_reg) {
            TCGTemp *dts = tcg_temp_alloc(s);
            dts->type = its->type;
            dts->base_type = its->base_type;
            its->state_ptr = dts;
        } else {
            its->state_ptr = NULL;
        }
        /* All globals begin dead.
*/ 2498b83eabeaSRichard Henderson its->state = TS_DEAD; 24995a18407fSRichard Henderson } 2500b83eabeaSRichard Henderson for (nb_temps = s->nb_temps; i < nb_temps; ++i) { 2501b83eabeaSRichard Henderson TCGTemp *its = &s->temps[i]; 2502b83eabeaSRichard Henderson its->state_ptr = NULL; 2503b83eabeaSRichard Henderson its->state = TS_DEAD; 2504b83eabeaSRichard Henderson } 25055a18407fSRichard Henderson 250615fa08f8SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 25075a18407fSRichard Henderson TCGOpcode opc = op->opc; 25085a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 25095a18407fSRichard Henderson TCGLifeData arg_life = op->life; 25105a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 2511b83eabeaSRichard Henderson TCGTemp *arg_ts, *dir_ts; 25125a18407fSRichard Henderson 25135a18407fSRichard Henderson if (opc == INDEX_op_call) { 2514cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2515cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 2516efee3746SRichard Henderson call_flags = op->args[nb_oargs + nb_iargs + 1]; 25175a18407fSRichard Henderson } else { 25185a18407fSRichard Henderson nb_iargs = def->nb_iargs; 25195a18407fSRichard Henderson nb_oargs = def->nb_oargs; 25205a18407fSRichard Henderson 25215a18407fSRichard Henderson /* Set flags similar to how calls require. */ 25225a18407fSRichard Henderson if (def->flags & TCG_OPF_BB_END) { 25235a18407fSRichard Henderson /* Like writing globals: save_globals */ 25245a18407fSRichard Henderson call_flags = 0; 25255a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 25265a18407fSRichard Henderson /* Like reading globals: sync_globals */ 25275a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 25285a18407fSRichard Henderson } else { 25295a18407fSRichard Henderson /* No effect on globals. 
*/ 25305a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 25315a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 25325a18407fSRichard Henderson } 25335a18407fSRichard Henderson } 25345a18407fSRichard Henderson 25355a18407fSRichard Henderson /* Make sure that input arguments are available. */ 25365a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2537b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2538b83eabeaSRichard Henderson if (arg_ts) { 2539b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2540b83eabeaSRichard Henderson if (dir_ts && arg_ts->state == TS_DEAD) { 2541b83eabeaSRichard Henderson TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32 25425a18407fSRichard Henderson ? INDEX_op_ld_i32 25435a18407fSRichard Henderson : INDEX_op_ld_i64); 25445a18407fSRichard Henderson TCGOp *lop = tcg_op_insert_before(s, op, lopc, 3); 25455a18407fSRichard Henderson 2546b83eabeaSRichard Henderson lop->args[0] = temp_arg(dir_ts); 2547b83eabeaSRichard Henderson lop->args[1] = temp_arg(arg_ts->mem_base); 2548b83eabeaSRichard Henderson lop->args[2] = arg_ts->mem_offset; 25495a18407fSRichard Henderson 25505a18407fSRichard Henderson /* Loaded, but synced with memory. */ 2551b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 25525a18407fSRichard Henderson } 25535a18407fSRichard Henderson } 25545a18407fSRichard Henderson } 25555a18407fSRichard Henderson 25565a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 25575a18407fSRichard Henderson No action is required except keeping temp_state up to date 25585a18407fSRichard Henderson so that we reload when needed. 
*/ 25595a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2560b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2561b83eabeaSRichard Henderson if (arg_ts) { 2562b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2563b83eabeaSRichard Henderson if (dir_ts) { 2564b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 25655a18407fSRichard Henderson changes = true; 25665a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2567b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 25685a18407fSRichard Henderson } 25695a18407fSRichard Henderson } 25705a18407fSRichard Henderson } 25715a18407fSRichard Henderson } 25725a18407fSRichard Henderson 25735a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 25745a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 25755a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 25765a18407fSRichard Henderson /* Nothing to do */ 25775a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 25785a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 25795a18407fSRichard Henderson /* Liveness should see that globals are synced back, 25805a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. */ 2581b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2582b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2583b83eabeaSRichard Henderson || arg_ts->state != 0); 25845a18407fSRichard Henderson } 25855a18407fSRichard Henderson } else { 25865a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 25875a18407fSRichard Henderson /* Liveness should see that globals are saved back, 25885a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. 
*/ 2589b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2590b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2591b83eabeaSRichard Henderson || arg_ts->state == TS_DEAD); 25925a18407fSRichard Henderson } 25935a18407fSRichard Henderson } 25945a18407fSRichard Henderson 25955a18407fSRichard Henderson /* Outputs become available. */ 25965a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 2597b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2598b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2599b83eabeaSRichard Henderson if (!dir_ts) { 26005a18407fSRichard Henderson continue; 26015a18407fSRichard Henderson } 2602b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 26035a18407fSRichard Henderson changes = true; 26045a18407fSRichard Henderson 26055a18407fSRichard Henderson /* The output is now live and modified. */ 2606b83eabeaSRichard Henderson arg_ts->state = 0; 26075a18407fSRichard Henderson 26085a18407fSRichard Henderson /* Sync outputs upon their last write. */ 26095a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 2610b83eabeaSRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 26115a18407fSRichard Henderson ? INDEX_op_st_i32 26125a18407fSRichard Henderson : INDEX_op_st_i64); 26135a18407fSRichard Henderson TCGOp *sop = tcg_op_insert_after(s, op, sopc, 3); 26145a18407fSRichard Henderson 2615b83eabeaSRichard Henderson sop->args[0] = temp_arg(dir_ts); 2616b83eabeaSRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 2617b83eabeaSRichard Henderson sop->args[2] = arg_ts->mem_offset; 26185a18407fSRichard Henderson 2619b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 26205a18407fSRichard Henderson } 26215a18407fSRichard Henderson /* Drop outputs that are dead. 
*/ 26225a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2623b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 26245a18407fSRichard Henderson } 26255a18407fSRichard Henderson } 26265a18407fSRichard Henderson } 26275a18407fSRichard Henderson 26285a18407fSRichard Henderson return changes; 26295a18407fSRichard Henderson } 26305a18407fSRichard Henderson 26318d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2632c896fe29Sbellard static void dump_regs(TCGContext *s) 2633c896fe29Sbellard { 2634c896fe29Sbellard TCGTemp *ts; 2635c896fe29Sbellard int i; 2636c896fe29Sbellard char buf[64]; 2637c896fe29Sbellard 2638c896fe29Sbellard for(i = 0; i < s->nb_temps; i++) { 2639c896fe29Sbellard ts = &s->temps[i]; 264043439139SRichard Henderson printf(" %10s: ", tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2641c896fe29Sbellard switch(ts->val_type) { 2642c896fe29Sbellard case TEMP_VAL_REG: 2643c896fe29Sbellard printf("%s", tcg_target_reg_names[ts->reg]); 2644c896fe29Sbellard break; 2645c896fe29Sbellard case TEMP_VAL_MEM: 2646b3a62939SRichard Henderson printf("%d(%s)", (int)ts->mem_offset, 2647b3a62939SRichard Henderson tcg_target_reg_names[ts->mem_base->reg]); 2648c896fe29Sbellard break; 2649c896fe29Sbellard case TEMP_VAL_CONST: 2650c896fe29Sbellard printf("$0x%" TCG_PRIlx, ts->val); 2651c896fe29Sbellard break; 2652c896fe29Sbellard case TEMP_VAL_DEAD: 2653c896fe29Sbellard printf("D"); 2654c896fe29Sbellard break; 2655c896fe29Sbellard default: 2656c896fe29Sbellard printf("???"); 2657c896fe29Sbellard break; 2658c896fe29Sbellard } 2659c896fe29Sbellard printf("\n"); 2660c896fe29Sbellard } 2661c896fe29Sbellard 2662c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2663f8b2f202SRichard Henderson if (s->reg_to_temp[i] != NULL) { 2664c896fe29Sbellard printf("%s: %s\n", 2665c896fe29Sbellard tcg_target_reg_names[i], 2666f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i])); 2667c896fe29Sbellard } 2668c896fe29Sbellard } 2669c896fe29Sbellard } 
2670c896fe29Sbellard 2671c896fe29Sbellard static void check_regs(TCGContext *s) 2672c896fe29Sbellard { 2673869938aeSRichard Henderson int reg; 2674b6638662SRichard Henderson int k; 2675c896fe29Sbellard TCGTemp *ts; 2676c896fe29Sbellard char buf[64]; 2677c896fe29Sbellard 2678c896fe29Sbellard for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) { 2679f8b2f202SRichard Henderson ts = s->reg_to_temp[reg]; 2680f8b2f202SRichard Henderson if (ts != NULL) { 2681f8b2f202SRichard Henderson if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) { 2682c896fe29Sbellard printf("Inconsistency for register %s:\n", 2683c896fe29Sbellard tcg_target_reg_names[reg]); 2684b03cce8eSbellard goto fail; 2685c896fe29Sbellard } 2686c896fe29Sbellard } 2687c896fe29Sbellard } 2688c896fe29Sbellard for (k = 0; k < s->nb_temps; k++) { 2689c896fe29Sbellard ts = &s->temps[k]; 2690f8b2f202SRichard Henderson if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg 2691f8b2f202SRichard Henderson && s->reg_to_temp[ts->reg] != ts) { 2692c896fe29Sbellard printf("Inconsistency for temp %s:\n", 2693f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2694b03cce8eSbellard fail: 2695c896fe29Sbellard printf("reg state:\n"); 2696c896fe29Sbellard dump_regs(s); 2697c896fe29Sbellard tcg_abort(); 2698c896fe29Sbellard } 2699c896fe29Sbellard } 2700c896fe29Sbellard } 2701c896fe29Sbellard #endif 2702c896fe29Sbellard 27032272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts) 2704c896fe29Sbellard { 27059b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64) 27069b9c37c3SRichard Henderson /* Sparc64 stack is accessed with offset of 2047 */ 2707b591dc59SBlue Swirl s->current_frame_offset = (s->current_frame_offset + 2708b591dc59SBlue Swirl (tcg_target_long)sizeof(tcg_target_long) - 1) & 2709b591dc59SBlue Swirl ~(sizeof(tcg_target_long) - 1); 2710f44c9960SBlue Swirl #endif 2711b591dc59SBlue Swirl if (s->current_frame_offset + 
(tcg_target_long)sizeof(tcg_target_long) > 2712b591dc59SBlue Swirl s->frame_end) { 27135ff9d6a4Sbellard tcg_abort(); 2714b591dc59SBlue Swirl } 2715c896fe29Sbellard ts->mem_offset = s->current_frame_offset; 2716b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 2717c896fe29Sbellard ts->mem_allocated = 1; 2718e2c6d1b4SRichard Henderson s->current_frame_offset += sizeof(tcg_target_long); 2719c896fe29Sbellard } 2720c896fe29Sbellard 2721b3915dbbSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet); 2722b3915dbbSRichard Henderson 272359d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 272459d7c14eSRichard Henderson mark it free; otherwise mark it dead. */ 272559d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 2726c896fe29Sbellard { 272759d7c14eSRichard Henderson if (ts->fixed_reg) { 272859d7c14eSRichard Henderson return; 272959d7c14eSRichard Henderson } 273059d7c14eSRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 273159d7c14eSRichard Henderson s->reg_to_temp[ts->reg] = NULL; 273259d7c14eSRichard Henderson } 273359d7c14eSRichard Henderson ts->val_type = (free_or_dead < 0 273459d7c14eSRichard Henderson || ts->temp_local 2735fa477d25SRichard Henderson || ts->temp_global 273659d7c14eSRichard Henderson ? TEMP_VAL_MEM : TEMP_VAL_DEAD); 273759d7c14eSRichard Henderson } 2738c896fe29Sbellard 273959d7c14eSRichard Henderson /* Mark a temporary as dead. */ 274059d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 274159d7c14eSRichard Henderson { 274259d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 274359d7c14eSRichard Henderson } 274459d7c14eSRichard Henderson 274559d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 274659d7c14eSRichard Henderson registers needs to be allocated to store a constant. 
If 'free_or_dead' 274759d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 274859d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. */ 274959d7c14eSRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, 275059d7c14eSRichard Henderson TCGRegSet allocated_regs, int free_or_dead) 275159d7c14eSRichard Henderson { 275259d7c14eSRichard Henderson if (ts->fixed_reg) { 275359d7c14eSRichard Henderson return; 275459d7c14eSRichard Henderson } 275559d7c14eSRichard Henderson if (!ts->mem_coherent) { 27567f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 27572272e4a7SRichard Henderson temp_allocate_frame(s, ts); 275859d7c14eSRichard Henderson } 275959d7c14eSRichard Henderson switch (ts->val_type) { 276059d7c14eSRichard Henderson case TEMP_VAL_CONST: 276159d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 276259d7c14eSRichard Henderson require it later in a register, so attempt to store the 276359d7c14eSRichard Henderson constant to memory directly. 
*/ 276459d7c14eSRichard Henderson if (free_or_dead 276559d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 276659d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 276759d7c14eSRichard Henderson break; 276859d7c14eSRichard Henderson } 276959d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 277059d7c14eSRichard Henderson allocated_regs); 277159d7c14eSRichard Henderson /* fallthrough */ 277259d7c14eSRichard Henderson 277359d7c14eSRichard Henderson case TEMP_VAL_REG: 277459d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 277559d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 277659d7c14eSRichard Henderson break; 277759d7c14eSRichard Henderson 277859d7c14eSRichard Henderson case TEMP_VAL_MEM: 277959d7c14eSRichard Henderson break; 278059d7c14eSRichard Henderson 278159d7c14eSRichard Henderson case TEMP_VAL_DEAD: 278259d7c14eSRichard Henderson default: 278359d7c14eSRichard Henderson tcg_abort(); 2784c896fe29Sbellard } 27857f6ceedfSAurelien Jarno ts->mem_coherent = 1; 27867f6ceedfSAurelien Jarno } 278759d7c14eSRichard Henderson if (free_or_dead) { 278859d7c14eSRichard Henderson temp_free_or_dead(s, ts, free_or_dead); 278959d7c14eSRichard Henderson } 279059d7c14eSRichard Henderson } 27917f6ceedfSAurelien Jarno 27927f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 2793b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 27947f6ceedfSAurelien Jarno { 2795f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 2796f8b2f202SRichard Henderson if (ts != NULL) { 279759d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, -1); 2798c896fe29Sbellard } 2799c896fe29Sbellard } 2800c896fe29Sbellard 2801c896fe29Sbellard /* Allocate a register belonging to reg1 & ~reg2 */ 2802b3915dbbSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet desired_regs, 280391478cefSRichard Henderson 
TCGRegSet allocated_regs, bool rev) 2804c896fe29Sbellard { 280591478cefSRichard Henderson int i, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 280691478cefSRichard Henderson const int *order; 2807b6638662SRichard Henderson TCGReg reg; 2808c896fe29Sbellard TCGRegSet reg_ct; 2809c896fe29Sbellard 281007ddf036SRichard Henderson reg_ct = desired_regs & ~allocated_regs; 281191478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 2812c896fe29Sbellard 2813c896fe29Sbellard /* first try free registers */ 281491478cefSRichard Henderson for(i = 0; i < n; i++) { 281591478cefSRichard Henderson reg = order[i]; 2816f8b2f202SRichard Henderson if (tcg_regset_test_reg(reg_ct, reg) && s->reg_to_temp[reg] == NULL) 2817c896fe29Sbellard return reg; 2818c896fe29Sbellard } 2819c896fe29Sbellard 2820c896fe29Sbellard /* XXX: do better spill choice */ 282191478cefSRichard Henderson for(i = 0; i < n; i++) { 282291478cefSRichard Henderson reg = order[i]; 2823c896fe29Sbellard if (tcg_regset_test_reg(reg_ct, reg)) { 2824b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 2825c896fe29Sbellard return reg; 2826c896fe29Sbellard } 2827c896fe29Sbellard } 2828c896fe29Sbellard 2829c896fe29Sbellard tcg_abort(); 2830c896fe29Sbellard } 2831c896fe29Sbellard 283240ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 283340ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. 
*/ 283440ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 283540ae5c62SRichard Henderson TCGRegSet allocated_regs) 283640ae5c62SRichard Henderson { 283740ae5c62SRichard Henderson TCGReg reg; 283840ae5c62SRichard Henderson 283940ae5c62SRichard Henderson switch (ts->val_type) { 284040ae5c62SRichard Henderson case TEMP_VAL_REG: 284140ae5c62SRichard Henderson return; 284240ae5c62SRichard Henderson case TEMP_VAL_CONST: 284391478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 284440ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 284540ae5c62SRichard Henderson ts->mem_coherent = 0; 284640ae5c62SRichard Henderson break; 284740ae5c62SRichard Henderson case TEMP_VAL_MEM: 284891478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 284940ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 285040ae5c62SRichard Henderson ts->mem_coherent = 1; 285140ae5c62SRichard Henderson break; 285240ae5c62SRichard Henderson case TEMP_VAL_DEAD: 285340ae5c62SRichard Henderson default: 285440ae5c62SRichard Henderson tcg_abort(); 285540ae5c62SRichard Henderson } 285640ae5c62SRichard Henderson ts->reg = reg; 285740ae5c62SRichard Henderson ts->val_type = TEMP_VAL_REG; 285840ae5c62SRichard Henderson s->reg_to_temp[reg] = ts; 285940ae5c62SRichard Henderson } 286040ae5c62SRichard Henderson 286159d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 2862e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 286359d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 28641ad80729SAurelien Jarno { 28652c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 2866eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. 
*/ 2867f8bf00f1SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg); 28681ad80729SAurelien Jarno } 28691ad80729SAurelien Jarno 28709814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 2871641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 2872641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 2873641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 2874641d5fbeSbellard { 2875ac3b8891SRichard Henderson int i, n; 2876641d5fbeSbellard 2877ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 2878b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 2879641d5fbeSbellard } 2880e5097dc8Sbellard } 2881e5097dc8Sbellard 28823d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 28833d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 28843d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 28853d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 28863d5c5f87SAurelien Jarno { 2887ac3b8891SRichard Henderson int i, n; 28883d5c5f87SAurelien Jarno 2889ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 289012b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 289112b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 289212b9b11aSRichard Henderson || ts->fixed_reg 289312b9b11aSRichard Henderson || ts->mem_coherent); 28943d5c5f87SAurelien Jarno } 28953d5c5f87SAurelien Jarno } 28963d5c5f87SAurelien Jarno 2897e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 2898e8996ee0Sbellard all globals are stored at their canonical location. 
*/ 2899e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 2900e5097dc8Sbellard { 2901e5097dc8Sbellard int i; 2902e5097dc8Sbellard 2903c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 2904b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 2905641d5fbeSbellard if (ts->temp_local) { 2906b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 2907641d5fbeSbellard } else { 29082c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 2909eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 2910eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 2911c896fe29Sbellard } 2912641d5fbeSbellard } 2913e8996ee0Sbellard 2914e8996ee0Sbellard save_globals(s, allocated_regs); 2915c896fe29Sbellard } 2916c896fe29Sbellard 29170fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 29180fe4fca4SPaolo Bonzini tcg_target_ulong val, TCGLifeData arg_life) 2919e8996ee0Sbellard { 2920e8996ee0Sbellard if (ots->fixed_reg) { 292159d7c14eSRichard Henderson /* For fixed registers, we do not do any constant propagation. */ 2922e8996ee0Sbellard tcg_out_movi(s, ots->type, ots->reg, val); 292359d7c14eSRichard Henderson return; 292459d7c14eSRichard Henderson } 292559d7c14eSRichard Henderson 292659d7c14eSRichard Henderson /* The movi is not explicitly generated here. 
*/ 2927f8b2f202SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 2928f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 2929f8b2f202SRichard Henderson } 2930e8996ee0Sbellard ots->val_type = TEMP_VAL_CONST; 2931e8996ee0Sbellard ots->val = val; 293259d7c14eSRichard Henderson ots->mem_coherent = 0; 2933ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 293459d7c14eSRichard Henderson temp_sync(s, ots, s->reserved_regs, IS_DEAD_ARG(0)); 293559d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 2936f8bf00f1SRichard Henderson temp_dead(s, ots); 29374c4e1ab2SAurelien Jarno } 2938e8996ee0Sbellard } 2939e8996ee0Sbellard 2940dd186292SRichard Henderson static void tcg_reg_alloc_movi(TCGContext *s, const TCGOp *op) 29410fe4fca4SPaolo Bonzini { 294243439139SRichard Henderson TCGTemp *ots = arg_temp(op->args[0]); 2943dd186292SRichard Henderson tcg_target_ulong val = op->args[1]; 29440fe4fca4SPaolo Bonzini 2945dd186292SRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, op->life); 29460fe4fca4SPaolo Bonzini } 29470fe4fca4SPaolo Bonzini 2948dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op) 2949c896fe29Sbellard { 2950dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 2951c29c1d7eSAurelien Jarno TCGRegSet allocated_regs; 2952c896fe29Sbellard TCGTemp *ts, *ots; 2953450445d5SRichard Henderson TCGType otype, itype; 2954c896fe29Sbellard 2955d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 295643439139SRichard Henderson ots = arg_temp(op->args[0]); 295743439139SRichard Henderson ts = arg_temp(op->args[1]); 2958450445d5SRichard Henderson 2959450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. 
*/ 2960450445d5SRichard Henderson otype = ots->type; 2961450445d5SRichard Henderson itype = ts->type; 2962c896fe29Sbellard 29630fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 29640fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 29650fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 29660fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 29670fe4fca4SPaolo Bonzini temp_dead(s, ts); 29680fe4fca4SPaolo Bonzini } 29690fe4fca4SPaolo Bonzini tcg_reg_alloc_do_movi(s, ots, val, arg_life); 29700fe4fca4SPaolo Bonzini return; 29710fe4fca4SPaolo Bonzini } 29720fe4fca4SPaolo Bonzini 29730fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 29740fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 29750fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 29760fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 29770fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 297840ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], allocated_regs); 2979c29c1d7eSAurelien Jarno } 2980c29c1d7eSAurelien Jarno 29810fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 2982c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(0) && !ots->fixed_reg) { 2983c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 2984c29c1d7eSAurelien Jarno liveness analysis disabled). 
*/ 2985eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 2986c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 29872272e4a7SRichard Henderson temp_allocate_frame(s, ots); 2988c29c1d7eSAurelien Jarno } 2989b3a62939SRichard Henderson tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset); 2990c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 2991f8bf00f1SRichard Henderson temp_dead(s, ts); 2992c29c1d7eSAurelien Jarno } 2993f8bf00f1SRichard Henderson temp_dead(s, ots); 2994e8996ee0Sbellard } else { 2995c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) { 2996c29c1d7eSAurelien Jarno /* the mov can be suppressed */ 2997c29c1d7eSAurelien Jarno if (ots->val_type == TEMP_VAL_REG) { 2998f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 2999c896fe29Sbellard } 3000c29c1d7eSAurelien Jarno ots->reg = ts->reg; 3001f8bf00f1SRichard Henderson temp_dead(s, ts); 3002c29c1d7eSAurelien Jarno } else { 3003c29c1d7eSAurelien Jarno if (ots->val_type != TEMP_VAL_REG) { 3004c29c1d7eSAurelien Jarno /* When allocating a new register, make sure to not spill the 3005c29c1d7eSAurelien Jarno input one. 
*/ 3006c29c1d7eSAurelien Jarno tcg_regset_set_reg(allocated_regs, ts->reg); 3007450445d5SRichard Henderson ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 300891478cefSRichard Henderson allocated_regs, ots->indirect_base); 3009c29c1d7eSAurelien Jarno } 3010450445d5SRichard Henderson tcg_out_mov(s, otype, ots->reg, ts->reg); 3011c29c1d7eSAurelien Jarno } 3012c896fe29Sbellard ots->val_type = TEMP_VAL_REG; 3013c896fe29Sbellard ots->mem_coherent = 0; 3014f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = ots; 3015ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 301659d7c14eSRichard Henderson temp_sync(s, ots, allocated_regs, 0); 3017c29c1d7eSAurelien Jarno } 3018ec7a869dSAurelien Jarno } 3019c896fe29Sbellard } 3020c896fe29Sbellard 3021dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op) 3022c896fe29Sbellard { 3023dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3024dd186292SRichard Henderson const TCGOpDef * const def = &tcg_op_defs[op->opc]; 302582790a87SRichard Henderson TCGRegSet i_allocated_regs; 302682790a87SRichard Henderson TCGRegSet o_allocated_regs; 3027b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 3028b6638662SRichard Henderson TCGReg reg; 3029c896fe29Sbellard TCGArg arg; 3030c896fe29Sbellard const TCGArgConstraint *arg_ct; 3031c896fe29Sbellard TCGTemp *ts; 3032c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 3033c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 3034c896fe29Sbellard 3035c896fe29Sbellard nb_oargs = def->nb_oargs; 3036c896fe29Sbellard nb_iargs = def->nb_iargs; 3037c896fe29Sbellard 3038c896fe29Sbellard /* copy constants */ 3039c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 3040dd186292SRichard Henderson op->args + nb_oargs + nb_iargs, 3041c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 3042c896fe29Sbellard 3043d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 3044d21369f5SRichard Henderson o_allocated_regs = s->reserved_regs; 
304582790a87SRichard Henderson 3046c896fe29Sbellard /* satisfy input constraints */ 3047c896fe29Sbellard for (k = 0; k < nb_iargs; k++) { 3048c896fe29Sbellard i = def->sorted_args[nb_oargs + k]; 3049dd186292SRichard Henderson arg = op->args[i]; 3050c896fe29Sbellard arg_ct = &def->args_ct[i]; 305143439139SRichard Henderson ts = arg_temp(arg); 305240ae5c62SRichard Henderson 305340ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 305440ae5c62SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct)) { 3055c896fe29Sbellard /* constant is OK for instruction */ 3056c896fe29Sbellard const_args[i] = 1; 3057c896fe29Sbellard new_args[i] = ts->val; 3058c896fe29Sbellard goto iarg_end; 3059c896fe29Sbellard } 306040ae5c62SRichard Henderson 306182790a87SRichard Henderson temp_load(s, ts, arg_ct->u.regs, i_allocated_regs); 306240ae5c62SRichard Henderson 30635ff9d6a4Sbellard if (arg_ct->ct & TCG_CT_IALIAS) { 30645ff9d6a4Sbellard if (ts->fixed_reg) { 30655ff9d6a4Sbellard /* if fixed register, we must allocate a new register 30665ff9d6a4Sbellard if the alias is not the same register */ 3067dd186292SRichard Henderson if (arg != op->args[arg_ct->alias_index]) 30685ff9d6a4Sbellard goto allocate_in_reg; 30695ff9d6a4Sbellard } else { 3070c896fe29Sbellard /* if the input is aliased to an output and if it is 3071c896fe29Sbellard not dead after the instruction, we must allocate 3072c896fe29Sbellard a new register and move it */ 3073866cb6cbSAurelien Jarno if (!IS_DEAD_ARG(i)) { 3074c896fe29Sbellard goto allocate_in_reg; 3075c896fe29Sbellard } 30767e1df267SAurelien Jarno /* check if the current register has already been allocated 30777e1df267SAurelien Jarno for another input aliased to an output */ 30787e1df267SAurelien Jarno int k2, i2; 30797e1df267SAurelien Jarno for (k2 = 0 ; k2 < k ; k2++) { 30807e1df267SAurelien Jarno i2 = def->sorted_args[nb_oargs + k2]; 30817e1df267SAurelien Jarno if ((def->args_ct[i2].ct & TCG_CT_IALIAS) && 30827e1df267SAurelien Jarno 
(new_args[i2] == ts->reg)) { 30837e1df267SAurelien Jarno goto allocate_in_reg; 30847e1df267SAurelien Jarno } 30857e1df267SAurelien Jarno } 30865ff9d6a4Sbellard } 3087866cb6cbSAurelien Jarno } 3088c896fe29Sbellard reg = ts->reg; 3089c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3090c896fe29Sbellard /* nothing to do : the constraint is satisfied */ 3091c896fe29Sbellard } else { 3092c896fe29Sbellard allocate_in_reg: 3093c896fe29Sbellard /* allocate a new register matching the constraint 3094c896fe29Sbellard and move the temporary register into it */ 309582790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs, 309691478cefSRichard Henderson ts->indirect_base); 30973b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3098c896fe29Sbellard } 3099c896fe29Sbellard new_args[i] = reg; 3100c896fe29Sbellard const_args[i] = 0; 310182790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 3102c896fe29Sbellard iarg_end: ; 3103c896fe29Sbellard } 3104c896fe29Sbellard 3105c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3106866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 3107866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 310843439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3109c896fe29Sbellard } 3110c896fe29Sbellard } 3111c896fe29Sbellard 3112a52ad07eSAurelien Jarno if (def->flags & TCG_OPF_BB_END) { 311382790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 3114a52ad07eSAurelien Jarno } else { 3115c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 3116b03cce8eSbellard /* XXX: permit generic clobber register list ? 
*/ 3117c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3118c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 311982790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 3120c896fe29Sbellard } 3121c896fe29Sbellard } 31223d5c5f87SAurelien Jarno } 31233d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 31243d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 31253d5c5f87SAurelien Jarno an exception. */ 312682790a87SRichard Henderson sync_globals(s, i_allocated_regs); 3127c896fe29Sbellard } 3128c896fe29Sbellard 3129c896fe29Sbellard /* satisfy the output constraints */ 3130c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 3131c896fe29Sbellard i = def->sorted_args[k]; 3132dd186292SRichard Henderson arg = op->args[i]; 3133c896fe29Sbellard arg_ct = &def->args_ct[i]; 313443439139SRichard Henderson ts = arg_temp(arg); 313517280ff4SRichard Henderson if ((arg_ct->ct & TCG_CT_ALIAS) 313617280ff4SRichard Henderson && !const_args[arg_ct->alias_index]) { 31375ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 313882790a87SRichard Henderson } else if (arg_ct->ct & TCG_CT_NEWREG) { 313982790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, 314082790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 314182790a87SRichard Henderson ts->indirect_base); 3142c896fe29Sbellard } else { 3143c896fe29Sbellard /* if fixed register, we try to use it */ 3144c896fe29Sbellard reg = ts->reg; 3145c896fe29Sbellard if (ts->fixed_reg && 3146c896fe29Sbellard tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3147c896fe29Sbellard goto oarg_end; 3148c896fe29Sbellard } 314982790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs, 315091478cefSRichard Henderson ts->indirect_base); 3151c896fe29Sbellard } 315282790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 3153c896fe29Sbellard /* if a fixed register is used, then a move will be done 
afterwards */ 3154c896fe29Sbellard if (!ts->fixed_reg) { 3155639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3156f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3157639368ddSAurelien Jarno } 3158c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3159c896fe29Sbellard ts->reg = reg; 3160c896fe29Sbellard /* temp value is modified, so the value kept in memory is 3161c896fe29Sbellard potentially not the same */ 3162c896fe29Sbellard ts->mem_coherent = 0; 3163f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3164c896fe29Sbellard } 3165c896fe29Sbellard oarg_end: 3166c896fe29Sbellard new_args[i] = reg; 3167c896fe29Sbellard } 3168e8996ee0Sbellard } 3169c896fe29Sbellard 3170c896fe29Sbellard /* emit instruction */ 3171d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 3172d2fd745fSRichard Henderson tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op), 3173d2fd745fSRichard Henderson new_args, const_args); 3174d2fd745fSRichard Henderson } else { 3175dd186292SRichard Henderson tcg_out_op(s, op->opc, new_args, const_args); 3176d2fd745fSRichard Henderson } 3177c896fe29Sbellard 3178c896fe29Sbellard /* move the outputs in the correct register if needed */ 3179c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 318043439139SRichard Henderson ts = arg_temp(op->args[i]); 3181c896fe29Sbellard reg = new_args[i]; 3182c896fe29Sbellard if (ts->fixed_reg && ts->reg != reg) { 31833b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3184c896fe29Sbellard } 3185ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 318682790a87SRichard Henderson temp_sync(s, ts, o_allocated_regs, IS_DEAD_ARG(i)); 318759d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3188f8bf00f1SRichard Henderson temp_dead(s, ts); 3189ec7a869dSAurelien Jarno } 3190c896fe29Sbellard } 3191c896fe29Sbellard } 3192c896fe29Sbellard 3193b03cce8eSbellard #ifdef TCG_TARGET_STACK_GROWSUP 3194b03cce8eSbellard #define STACK_DIR(x) (-(x)) 3195b03cce8eSbellard #else 3196b03cce8eSbellard #define 
STACK_DIR(x) (x) 3197b03cce8eSbellard #endif 3198b03cce8eSbellard 3199dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op) 3200c896fe29Sbellard { 3201cd9090aaSRichard Henderson const int nb_oargs = TCGOP_CALLO(op); 3202cd9090aaSRichard Henderson const int nb_iargs = TCGOP_CALLI(op); 3203dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3204b6638662SRichard Henderson int flags, nb_regs, i; 3205b6638662SRichard Henderson TCGReg reg; 3206cf066674SRichard Henderson TCGArg arg; 3207c896fe29Sbellard TCGTemp *ts; 3208d3452f1fSRichard Henderson intptr_t stack_offset; 3209d3452f1fSRichard Henderson size_t call_stack_size; 3210cf066674SRichard Henderson tcg_insn_unit *func_addr; 3211cf066674SRichard Henderson int allocate_args; 3212c896fe29Sbellard TCGRegSet allocated_regs; 3213c896fe29Sbellard 3214dd186292SRichard Henderson func_addr = (tcg_insn_unit *)(intptr_t)op->args[nb_oargs + nb_iargs]; 3215dd186292SRichard Henderson flags = op->args[nb_oargs + nb_iargs + 1]; 3216c896fe29Sbellard 32176e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 3218c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 3219c45cb8bbSRichard Henderson nb_regs = nb_iargs; 3220cf066674SRichard Henderson } 3221c896fe29Sbellard 3222c896fe29Sbellard /* assign stack slots first */ 3223c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 3224c896fe29Sbellard call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) & 3225c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 3226b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 3227b03cce8eSbellard if (allocate_args) { 3228345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 3229345649c0SBlue Swirl preallocate call stack */ 3230345649c0SBlue Swirl tcg_abort(); 3231b03cce8eSbellard } 323239cf05d3Sbellard 323339cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 3234c45cb8bbSRichard Henderson 
for (i = nb_regs; i < nb_iargs; i++) { 3235dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 323639cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP 323739cf05d3Sbellard stack_offset -= sizeof(tcg_target_long); 323839cf05d3Sbellard #endif 323939cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 324043439139SRichard Henderson ts = arg_temp(arg); 324140ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 324240ae5c62SRichard Henderson s->reserved_regs); 3243e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 324439cf05d3Sbellard } 324539cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP 324639cf05d3Sbellard stack_offset += sizeof(tcg_target_long); 324739cf05d3Sbellard #endif 3248c896fe29Sbellard } 3249c896fe29Sbellard 3250c896fe29Sbellard /* assign input registers */ 3251d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 3252c896fe29Sbellard for (i = 0; i < nb_regs; i++) { 3253dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 325439cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 325543439139SRichard Henderson ts = arg_temp(arg); 3256c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 3257b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 325840ae5c62SRichard Henderson 3259c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 3260c896fe29Sbellard if (ts->reg != reg) { 32613b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3262c896fe29Sbellard } 3263c896fe29Sbellard } else { 3264ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 326540ae5c62SRichard Henderson 326640ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 326740ae5c62SRichard Henderson temp_load(s, ts, arg_set, allocated_regs); 3268c896fe29Sbellard } 326940ae5c62SRichard Henderson 3270c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 3271c896fe29Sbellard } 327239cf05d3Sbellard } 3273c896fe29Sbellard 3274c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 
3275866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 3276866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 327743439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3278c896fe29Sbellard } 3279c896fe29Sbellard } 3280c896fe29Sbellard 3281c896fe29Sbellard /* clobber call registers */ 3282c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3283c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 3284b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 3285c896fe29Sbellard } 3286c896fe29Sbellard } 3287c896fe29Sbellard 328878505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 328978505279SAurelien Jarno they might be read. */ 329078505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 329178505279SAurelien Jarno /* Nothing to do */ 329278505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 329378505279SAurelien Jarno sync_globals(s, allocated_regs); 329478505279SAurelien Jarno } else { 3295e8996ee0Sbellard save_globals(s, allocated_regs); 3296b9c18f56Saurel32 } 3297c896fe29Sbellard 3298cf066674SRichard Henderson tcg_out_call(s, func_addr); 3299c896fe29Sbellard 3300c896fe29Sbellard /* assign output registers and emit moves if needed */ 3301c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 3302dd186292SRichard Henderson arg = op->args[i]; 330343439139SRichard Henderson ts = arg_temp(arg); 3304c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 3305eabb7b91SAurelien Jarno tcg_debug_assert(s->reg_to_temp[reg] == NULL); 330634b1a49cSRichard Henderson 3307c896fe29Sbellard if (ts->fixed_reg) { 3308c896fe29Sbellard if (ts->reg != reg) { 33093b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3310c896fe29Sbellard } 3311c896fe29Sbellard } else { 3312639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3313f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3314639368ddSAurelien Jarno } 
3315c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3316c896fe29Sbellard ts->reg = reg; 3317c896fe29Sbellard ts->mem_coherent = 0; 3318f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3319ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 332059d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i)); 332159d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3322f8bf00f1SRichard Henderson temp_dead(s, ts); 3323c896fe29Sbellard } 3324c896fe29Sbellard } 33258c11ad25SAurelien Jarno } 3326c896fe29Sbellard } 3327c896fe29Sbellard 3328c896fe29Sbellard #ifdef CONFIG_PROFILER 3329c896fe29Sbellard 3330c3fac113SEmilio G. Cota /* avoid copy/paste errors */ 3331c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field) \ 3332c3fac113SEmilio G. Cota do { \ 3333c3fac113SEmilio G. Cota (to)->field += atomic_read(&((from)->field)); \ 3334c3fac113SEmilio G. Cota } while (0) 3335c896fe29Sbellard 3336c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field) \ 3337c3fac113SEmilio G. Cota do { \ 3338c3fac113SEmilio G. Cota typeof((from)->field) val__ = atomic_read(&((from)->field)); \ 3339c3fac113SEmilio G. Cota if (val__ > (to)->field) { \ 3340c3fac113SEmilio G. Cota (to)->field = val__; \ 3341c3fac113SEmilio G. Cota } \ 3342c3fac113SEmilio G. Cota } while (0) 3343c3fac113SEmilio G. Cota 3344c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */ 3345c3fac113SEmilio G. Cota static inline 3346c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table) 3347c896fe29Sbellard { 33483468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 3349c3fac113SEmilio G. Cota unsigned int i; 3350c3fac113SEmilio G. Cota 33513468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 33523468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 33533468b59eSEmilio G. Cota const TCGProfile *orig = &s->prof; 3354c3fac113SEmilio G. Cota 3355c3fac113SEmilio G. Cota if (counters) { 3356c3fac113SEmilio G. 
Cota PROF_ADD(prof, orig, tb_count1); 3357c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count); 3358c3fac113SEmilio G. Cota PROF_ADD(prof, orig, op_count); 3359c3fac113SEmilio G. Cota PROF_MAX(prof, orig, op_count_max); 3360c3fac113SEmilio G. Cota PROF_ADD(prof, orig, temp_count); 3361c3fac113SEmilio G. Cota PROF_MAX(prof, orig, temp_count_max); 3362c3fac113SEmilio G. Cota PROF_ADD(prof, orig, del_op_count); 3363c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_in_len); 3364c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_out_len); 3365c3fac113SEmilio G. Cota PROF_ADD(prof, orig, search_out_len); 3366c3fac113SEmilio G. Cota PROF_ADD(prof, orig, interm_time); 3367c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_time); 3368c3fac113SEmilio G. Cota PROF_ADD(prof, orig, la_time); 3369c3fac113SEmilio G. Cota PROF_ADD(prof, orig, opt_time); 3370c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_count); 3371c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_time); 3372c3fac113SEmilio G. Cota } 3373c3fac113SEmilio G. Cota if (table) { 3374c896fe29Sbellard int i; 3375d70724ceSzhanghailiang 337615fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 3377c3fac113SEmilio G. Cota PROF_ADD(prof, orig, table_op_count[i]); 3378c3fac113SEmilio G. Cota } 3379c3fac113SEmilio G. Cota } 3380c3fac113SEmilio G. Cota } 3381c3fac113SEmilio G. Cota } 3382c3fac113SEmilio G. Cota 3383c3fac113SEmilio G. Cota #undef PROF_ADD 3384c3fac113SEmilio G. Cota #undef PROF_MAX 3385c3fac113SEmilio G. Cota 3386c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof) 3387c3fac113SEmilio G. Cota { 3388c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, true, false); 3389c3fac113SEmilio G. Cota } 3390c3fac113SEmilio G. Cota 3391c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof) 3392c3fac113SEmilio G. Cota { 3393c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, false, true); 3394c3fac113SEmilio G. Cota } 3395c3fac113SEmilio G. 
Cota 3396c3fac113SEmilio G. Cota void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3397c3fac113SEmilio G. Cota { 3398c3fac113SEmilio G. Cota TCGProfile prof = {}; 3399c3fac113SEmilio G. Cota int i; 3400c3fac113SEmilio G. Cota 3401c3fac113SEmilio G. Cota tcg_profile_snapshot_table(&prof); 3402c3fac113SEmilio G. Cota for (i = 0; i < NB_OPS; i++) { 3403246ae24dSMax Filippov cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, 3404c3fac113SEmilio G. Cota prof.table_op_count[i]); 3405c896fe29Sbellard } 3406c896fe29Sbellard } 3407246ae24dSMax Filippov #else 3408246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3409246ae24dSMax Filippov { 3410246ae24dSMax Filippov cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3411246ae24dSMax Filippov } 3412c896fe29Sbellard #endif 3413c896fe29Sbellard 3414c896fe29Sbellard 34155bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb) 3416c896fe29Sbellard { 3417c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER 3418c3fac113SEmilio G. Cota TCGProfile *prof = &s->prof; 3419c3fac113SEmilio G. Cota #endif 342015fa08f8SRichard Henderson int i, num_insns; 342115fa08f8SRichard Henderson TCGOp *op; 3422c896fe29Sbellard 342304fe6400SRichard Henderson #ifdef CONFIG_PROFILER 342404fe6400SRichard Henderson { 342504fe6400SRichard Henderson int n; 342604fe6400SRichard Henderson 342715fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 342815fa08f8SRichard Henderson n++; 342915fa08f8SRichard Henderson } 3430c3fac113SEmilio G. Cota atomic_set(&prof->op_count, prof->op_count + n); 3431c3fac113SEmilio G. Cota if (n > prof->op_count_max) { 3432c3fac113SEmilio G. Cota atomic_set(&prof->op_count_max, n); 343304fe6400SRichard Henderson } 343404fe6400SRichard Henderson 343504fe6400SRichard Henderson n = s->nb_temps; 3436c3fac113SEmilio G. Cota atomic_set(&prof->temp_count, prof->temp_count + n); 3437c3fac113SEmilio G. Cota if (n > prof->temp_count_max) { 3438c3fac113SEmilio G. 
Cota atomic_set(&prof->temp_count_max, n); 343904fe6400SRichard Henderson } 344004fe6400SRichard Henderson } 344104fe6400SRichard Henderson #endif 344204fe6400SRichard Henderson 3443c896fe29Sbellard #ifdef DEBUG_DISAS 3444d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 3445d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 34461ee73216SRichard Henderson qemu_log_lock(); 344793fcfe39Saliguori qemu_log("OP:\n"); 3448eeacee4dSBlue Swirl tcg_dump_ops(s); 344993fcfe39Saliguori qemu_log("\n"); 34501ee73216SRichard Henderson qemu_log_unlock(); 3451c896fe29Sbellard } 3452c896fe29Sbellard #endif 3453c896fe29Sbellard 3454c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 3455c3fac113SEmilio G. Cota atomic_set(&prof->opt_time, prof->opt_time - profile_getclock()); 3456c5cc28ffSAurelien Jarno #endif 3457c5cc28ffSAurelien Jarno 34588f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 3459c45cb8bbSRichard Henderson tcg_optimize(s); 34608f2e8c07SKirill Batuzov #endif 34618f2e8c07SKirill Batuzov 3462a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3463c3fac113SEmilio G. Cota atomic_set(&prof->opt_time, prof->opt_time + profile_getclock()); 3464c3fac113SEmilio G. 
Cota atomic_set(&prof->la_time, prof->la_time - profile_getclock()); 3465a23a9ec6Sbellard #endif 3466c5cc28ffSAurelien Jarno 3467b83eabeaSRichard Henderson liveness_pass_1(s); 34685a18407fSRichard Henderson 34695a18407fSRichard Henderson if (s->nb_indirects > 0) { 34705a18407fSRichard Henderson #ifdef DEBUG_DISAS 34715a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 34725a18407fSRichard Henderson && qemu_log_in_addr_range(tb->pc))) { 34731ee73216SRichard Henderson qemu_log_lock(); 34745a18407fSRichard Henderson qemu_log("OP before indirect lowering:\n"); 34755a18407fSRichard Henderson tcg_dump_ops(s); 34765a18407fSRichard Henderson qemu_log("\n"); 34771ee73216SRichard Henderson qemu_log_unlock(); 34785a18407fSRichard Henderson } 34795a18407fSRichard Henderson #endif 34805a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 3481b83eabeaSRichard Henderson if (liveness_pass_2(s)) { 34825a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 3483b83eabeaSRichard Henderson liveness_pass_1(s); 34845a18407fSRichard Henderson } 34855a18407fSRichard Henderson } 3486c5cc28ffSAurelien Jarno 3487a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3488c3fac113SEmilio G. Cota atomic_set(&prof->la_time, prof->la_time + profile_getclock()); 3489a23a9ec6Sbellard #endif 3490c896fe29Sbellard 3491c896fe29Sbellard #ifdef DEBUG_DISAS 3492d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 3493d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 34941ee73216SRichard Henderson qemu_log_lock(); 3495c5cc28ffSAurelien Jarno qemu_log("OP after optimization and liveness analysis:\n"); 3496eeacee4dSBlue Swirl tcg_dump_ops(s); 349793fcfe39Saliguori qemu_log("\n"); 34981ee73216SRichard Henderson qemu_log_unlock(); 3499c896fe29Sbellard } 3500c896fe29Sbellard #endif 3501c896fe29Sbellard 3502c896fe29Sbellard tcg_reg_alloc_start(s); 3503c896fe29Sbellard 3504e7e168f4SEmilio G. 
Cota s->code_buf = tb->tc.ptr; 3505e7e168f4SEmilio G. Cota s->code_ptr = tb->tc.ptr; 3506c896fe29Sbellard 3507659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 35086001f772SLaurent Vivier QSIMPLEQ_INIT(&s->ldst_labels); 3509659ef5cbSRichard Henderson #endif 351057a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 351157a26946SRichard Henderson s->pool_labels = NULL; 351257a26946SRichard Henderson #endif 35139ecefc84SRichard Henderson 3514fca8a500SRichard Henderson num_insns = -1; 351515fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 3516c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 3517b3db8758Sblueswir1 3518c896fe29Sbellard #ifdef CONFIG_PROFILER 3519c3fac113SEmilio G. Cota atomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1); 3520c896fe29Sbellard #endif 3521c45cb8bbSRichard Henderson 3522c896fe29Sbellard switch (opc) { 3523c896fe29Sbellard case INDEX_op_mov_i32: 3524c896fe29Sbellard case INDEX_op_mov_i64: 3525d2fd745fSRichard Henderson case INDEX_op_mov_vec: 3526dd186292SRichard Henderson tcg_reg_alloc_mov(s, op); 3527c896fe29Sbellard break; 3528e8996ee0Sbellard case INDEX_op_movi_i32: 3529e8996ee0Sbellard case INDEX_op_movi_i64: 3530d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 3531dd186292SRichard Henderson tcg_reg_alloc_movi(s, op); 3532e8996ee0Sbellard break; 3533765b842aSRichard Henderson case INDEX_op_insn_start: 3534fca8a500SRichard Henderson if (num_insns >= 0) { 3535fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 3536fca8a500SRichard Henderson } 3537fca8a500SRichard Henderson num_insns++; 3538bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 3539bad729e2SRichard Henderson target_ulong a; 3540bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 3541efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 3542bad729e2SRichard Henderson #else 3543efee3746SRichard Henderson a = 
op->args[i]; 3544bad729e2SRichard Henderson #endif 3545fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 3546bad729e2SRichard Henderson } 3547c896fe29Sbellard break; 35485ff9d6a4Sbellard case INDEX_op_discard: 354943439139SRichard Henderson temp_dead(s, arg_temp(op->args[0])); 35505ff9d6a4Sbellard break; 3551c896fe29Sbellard case INDEX_op_set_label: 3552e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 3553efee3746SRichard Henderson tcg_out_label(s, arg_label(op->args[0]), s->code_ptr); 3554c896fe29Sbellard break; 3555c896fe29Sbellard case INDEX_op_call: 3556dd186292SRichard Henderson tcg_reg_alloc_call(s, op); 3557c45cb8bbSRichard Henderson break; 3558c896fe29Sbellard default: 355925c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. */ 3560be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 3561c896fe29Sbellard /* Note: in order to speed up the code, it would be much 3562c896fe29Sbellard faster to have specialized register allocator functions for 3563c896fe29Sbellard some common argument patterns */ 3564dd186292SRichard Henderson tcg_reg_alloc_op(s, op); 3565c896fe29Sbellard break; 3566c896fe29Sbellard } 35678d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 3568c896fe29Sbellard check_regs(s); 3569c896fe29Sbellard #endif 3570b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. The assumption is that any 3571b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 3572b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 3573b125f9dcSRichard Henderson generating code without having to check during generation. 
*/ 3574644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 3575b125f9dcSRichard Henderson return -1; 3576b125f9dcSRichard Henderson } 3577c896fe29Sbellard } 3578fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 3579fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 3580c45cb8bbSRichard Henderson 3581b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 3582659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 3583659ef5cbSRichard Henderson if (!tcg_out_ldst_finalize(s)) { 358423dceda6SRichard Henderson return -1; 358523dceda6SRichard Henderson } 3586659ef5cbSRichard Henderson #endif 358757a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 358857a26946SRichard Henderson if (!tcg_out_pool_finalize(s)) { 358957a26946SRichard Henderson return -1; 359057a26946SRichard Henderson } 359157a26946SRichard Henderson #endif 3592c896fe29Sbellard 3593c896fe29Sbellard /* flush instruction cache */ 35941813e175SRichard Henderson flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr); 35952aeabc08SStefan Weil 35961813e175SRichard Henderson return tcg_current_code_size(s); 3597c896fe29Sbellard } 3598c896fe29Sbellard 3599a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3600405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3601a23a9ec6Sbellard { 3602c3fac113SEmilio G. Cota TCGProfile prof = {}; 3603c3fac113SEmilio G. Cota const TCGProfile *s; 3604c3fac113SEmilio G. Cota int64_t tb_count; 3605c3fac113SEmilio G. Cota int64_t tb_div_count; 3606c3fac113SEmilio G. Cota int64_t tot; 3607c3fac113SEmilio G. Cota 3608c3fac113SEmilio G. Cota tcg_profile_snapshot_counters(&prof); 3609c3fac113SEmilio G. Cota s = &prof; 3610c3fac113SEmilio G. Cota tb_count = s->tb_count; 3611c3fac113SEmilio G. Cota tb_div_count = tb_count ? tb_count : 1; 3612c3fac113SEmilio G. 
Cota tot = s->interm_time + s->code_time; 3613a23a9ec6Sbellard 3614a23a9ec6Sbellard cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n", 3615a23a9ec6Sbellard tot, tot / 2.4e9); 3616a23a9ec6Sbellard cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n", 3617fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 3618fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 3619fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 3620a23a9ec6Sbellard cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n", 3621fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 3622a23a9ec6Sbellard cpu_fprintf(f, "deleted ops/TB %0.2f\n", 3623fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 3624a23a9ec6Sbellard cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n", 3625fca8a500SRichard Henderson (double)s->temp_count / tb_div_count, s->temp_count_max); 3626fca8a500SRichard Henderson cpu_fprintf(f, "avg host code/TB %0.1f\n", 3627fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 3628fca8a500SRichard Henderson cpu_fprintf(f, "avg search data/TB %0.1f\n", 3629fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 3630a23a9ec6Sbellard 3631a23a9ec6Sbellard cpu_fprintf(f, "cycles/op %0.1f\n", 3632a23a9ec6Sbellard s->op_count ? (double)tot / s->op_count : 0); 3633a23a9ec6Sbellard cpu_fprintf(f, "cycles/in byte %0.1f\n", 3634a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 3635a23a9ec6Sbellard cpu_fprintf(f, "cycles/out byte %0.1f\n", 3636a23a9ec6Sbellard s->code_out_len ? (double)tot / s->code_out_len : 0); 3637fca8a500SRichard Henderson cpu_fprintf(f, "cycles/search byte %0.1f\n", 3638fca8a500SRichard Henderson s->search_out_len ? 
(double)tot / s->search_out_len : 0); 3639fca8a500SRichard Henderson if (tot == 0) { 3640a23a9ec6Sbellard tot = 1; 3641fca8a500SRichard Henderson } 3642a23a9ec6Sbellard cpu_fprintf(f, " gen_interm time %0.1f%%\n", 3643a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 3644a23a9ec6Sbellard cpu_fprintf(f, " gen_code time %0.1f%%\n", 3645a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 3646c5cc28ffSAurelien Jarno cpu_fprintf(f, "optim./code time %0.1f%%\n", 3647c5cc28ffSAurelien Jarno (double)s->opt_time / (s->code_time ? s->code_time : 1) 3648c5cc28ffSAurelien Jarno * 100.0); 3649a23a9ec6Sbellard cpu_fprintf(f, "liveness/code time %0.1f%%\n", 3650a23a9ec6Sbellard (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0); 3651a23a9ec6Sbellard cpu_fprintf(f, "cpu_restore count %" PRId64 "\n", 3652a23a9ec6Sbellard s->restore_count); 3653a23a9ec6Sbellard cpu_fprintf(f, " avg cycles %0.1f\n", 3654a23a9ec6Sbellard s->restore_count ? (double)s->restore_time / s->restore_count : 0); 3655a23a9ec6Sbellard } 3656a23a9ec6Sbellard #else 3657405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3658a23a9ec6Sbellard { 365924bf7b3aSbellard cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3660a23a9ec6Sbellard } 3661a23a9ec6Sbellard #endif 3662813da627SRichard Henderson 3663813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 36645872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 36655872bbf2SRichard Henderson 36665872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 36675872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 36685872bbf2SRichard Henderson 36695872bbf2SRichard Henderson (2) Define tcg_register_jit. This should create a buffer containing 36705872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 36715872bbf2SRichard Henderson prologue unwind info for the tcg machine. 
36725872bbf2SRichard Henderson 36735872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 36745872bbf2SRichard Henderson */ 3675813da627SRichard Henderson 3676813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */ 3677813da627SRichard Henderson typedef enum { 3678813da627SRichard Henderson JIT_NOACTION = 0, 3679813da627SRichard Henderson JIT_REGISTER_FN, 3680813da627SRichard Henderson JIT_UNREGISTER_FN 3681813da627SRichard Henderson } jit_actions_t; 3682813da627SRichard Henderson 3683813da627SRichard Henderson struct jit_code_entry { 3684813da627SRichard Henderson struct jit_code_entry *next_entry; 3685813da627SRichard Henderson struct jit_code_entry *prev_entry; 3686813da627SRichard Henderson const void *symfile_addr; 3687813da627SRichard Henderson uint64_t symfile_size; 3688813da627SRichard Henderson }; 3689813da627SRichard Henderson 3690813da627SRichard Henderson struct jit_descriptor { 3691813da627SRichard Henderson uint32_t version; 3692813da627SRichard Henderson uint32_t action_flag; 3693813da627SRichard Henderson struct jit_code_entry *relevant_entry; 3694813da627SRichard Henderson struct jit_code_entry *first_entry; 3695813da627SRichard Henderson }; 3696813da627SRichard Henderson 3697813da627SRichard Henderson void __jit_debug_register_code(void) __attribute__((noinline)); 3698813da627SRichard Henderson void __jit_debug_register_code(void) 3699813da627SRichard Henderson { 3700813da627SRichard Henderson asm(""); 3701813da627SRichard Henderson } 3702813da627SRichard Henderson 3703813da627SRichard Henderson /* Must statically initialize the version, because GDB may check 3704813da627SRichard Henderson the version before we can set it. */ 3705813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 }; 3706813da627SRichard Henderson 3707813da627SRichard Henderson /* End GDB interface. 
*/ 3708813da627SRichard Henderson 3709813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 3710813da627SRichard Henderson { 3711813da627SRichard Henderson const char *p = strtab + 1; 3712813da627SRichard Henderson 3713813da627SRichard Henderson while (1) { 3714813da627SRichard Henderson if (strcmp(p, str) == 0) { 3715813da627SRichard Henderson return p - strtab; 3716813da627SRichard Henderson } 3717813da627SRichard Henderson p += strlen(p) + 1; 3718813da627SRichard Henderson } 3719813da627SRichard Henderson } 3720813da627SRichard Henderson 37215872bbf2SRichard Henderson static void tcg_register_jit_int(void *buf_ptr, size_t buf_size, 37222c90784aSRichard Henderson const void *debug_frame, 37232c90784aSRichard Henderson size_t debug_frame_size) 3724813da627SRichard Henderson { 37255872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 37265872bbf2SRichard Henderson uint32_t len; 37275872bbf2SRichard Henderson uint16_t version; 37285872bbf2SRichard Henderson uint32_t abbrev; 37295872bbf2SRichard Henderson uint8_t ptr_size; 37305872bbf2SRichard Henderson uint8_t cu_die; 37315872bbf2SRichard Henderson uint16_t cu_lang; 37325872bbf2SRichard Henderson uintptr_t cu_low_pc; 37335872bbf2SRichard Henderson uintptr_t cu_high_pc; 37345872bbf2SRichard Henderson uint8_t fn_die; 37355872bbf2SRichard Henderson char fn_name[16]; 37365872bbf2SRichard Henderson uintptr_t fn_low_pc; 37375872bbf2SRichard Henderson uintptr_t fn_high_pc; 37385872bbf2SRichard Henderson uint8_t cu_eoc; 37395872bbf2SRichard Henderson }; 3740813da627SRichard Henderson 3741813da627SRichard Henderson struct ElfImage { 3742813da627SRichard Henderson ElfW(Ehdr) ehdr; 3743813da627SRichard Henderson ElfW(Phdr) phdr; 37445872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 37455872bbf2SRichard Henderson ElfW(Sym) sym[2]; 37465872bbf2SRichard Henderson struct DebugInfo di; 37475872bbf2SRichard Henderson uint8_t da[24]; 37485872bbf2SRichard Henderson char str[80]; 
37495872bbf2SRichard Henderson }; 37505872bbf2SRichard Henderson 37515872bbf2SRichard Henderson struct ElfImage *img; 37525872bbf2SRichard Henderson 37535872bbf2SRichard Henderson static const struct ElfImage img_template = { 37545872bbf2SRichard Henderson .ehdr = { 37555872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 37565872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 37575872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 37585872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 37595872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 37605872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 37615872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 37625872bbf2SRichard Henderson .e_type = ET_EXEC, 37635872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 37645872bbf2SRichard Henderson .e_version = EV_CURRENT, 37655872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 37665872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 37675872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 37685872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 37695872bbf2SRichard Henderson .e_phnum = 1, 37705872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 37715872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 37725872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 3773abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 3774abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 3775abbb3eaeSRichard Henderson #endif 3776abbb3eaeSRichard Henderson #ifdef ELF_OSABI 3777abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 3778abbb3eaeSRichard Henderson #endif 37795872bbf2SRichard Henderson }, 37805872bbf2SRichard Henderson .phdr = { 37815872bbf2SRichard Henderson .p_type = PT_LOAD, 37825872bbf2SRichard Henderson .p_flags = PF_X, 37835872bbf2SRichard Henderson }, 37845872bbf2SRichard Henderson .shdr = { 37855872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 
37865872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 37875872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 37885872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 37895872bbf2SRichard Henderson will not look for contents. We can record any address. */ 37905872bbf2SRichard Henderson [1] = { /* .text */ 37915872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 37925872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 37935872bbf2SRichard Henderson }, 37945872bbf2SRichard Henderson [2] = { /* .debug_info */ 37955872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 37965872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 37975872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 37985872bbf2SRichard Henderson }, 37995872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 38005872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 38015872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 38025872bbf2SRichard Henderson .sh_size = sizeof(img->da), 38035872bbf2SRichard Henderson }, 38045872bbf2SRichard Henderson [4] = { /* .debug_frame */ 38055872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 38065872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 38075872bbf2SRichard Henderson }, 38085872bbf2SRichard Henderson [5] = { /* .symtab */ 38095872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 38105872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 38115872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 38125872bbf2SRichard Henderson .sh_info = 1, 38135872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 38145872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 38155872bbf2SRichard Henderson }, 38165872bbf2SRichard Henderson [6] = { /* .strtab */ 38175872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 38185872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, 
str), 38195872bbf2SRichard Henderson .sh_size = sizeof(img->str), 38205872bbf2SRichard Henderson } 38215872bbf2SRichard Henderson }, 38225872bbf2SRichard Henderson .sym = { 38235872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 38245872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 38255872bbf2SRichard Henderson .st_shndx = 1, 38265872bbf2SRichard Henderson } 38275872bbf2SRichard Henderson }, 38285872bbf2SRichard Henderson .di = { 38295872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 38305872bbf2SRichard Henderson .version = 2, 38315872bbf2SRichard Henderson .ptr_size = sizeof(void *), 38325872bbf2SRichard Henderson .cu_die = 1, 38335872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 38345872bbf2SRichard Henderson .fn_die = 2, 38355872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 38365872bbf2SRichard Henderson }, 38375872bbf2SRichard Henderson .da = { 38385872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 38395872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 38405872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 38415872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 38425872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 38435872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 38445872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 38455872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 38465872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 38475872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 38485872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 38495872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 38505872bbf2SRichard Henderson 0 /* no more abbrev */ 38515872bbf2SRichard Henderson }, 38525872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 38535872bbf2SRichard Henderson 
".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 3854813da627SRichard Henderson }; 3855813da627SRichard Henderson 3856813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 3857813da627SRichard Henderson static struct jit_code_entry one_entry; 3858813da627SRichard Henderson 38595872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 3860813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 38612c90784aSRichard Henderson DebugFrameHeader *dfh; 3862813da627SRichard Henderson 38635872bbf2SRichard Henderson img = g_malloc(img_size); 38645872bbf2SRichard Henderson *img = img_template; 3865813da627SRichard Henderson 38665872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 38675872bbf2SRichard Henderson img->phdr.p_paddr = buf; 38685872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 3869813da627SRichard Henderson 38705872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 38715872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 38725872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 3873813da627SRichard Henderson 38745872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 38755872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 38765872bbf2SRichard Henderson 38775872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 38785872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 38795872bbf2SRichard Henderson 38805872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 38815872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 38825872bbf2SRichard Henderson 38835872bbf2SRichard Henderson img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 38845872bbf2SRichard Henderson img->sym[1].st_value = buf; 38855872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 
38865872bbf2SRichard Henderson 38875872bbf2SRichard Henderson img->di.cu_low_pc = buf; 388845aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 38895872bbf2SRichard Henderson img->di.fn_low_pc = buf; 389045aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 3891813da627SRichard Henderson 38922c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 38932c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 38942c90784aSRichard Henderson dfh->fde.func_start = buf; 38952c90784aSRichard Henderson dfh->fde.func_len = buf_size; 38962c90784aSRichard Henderson 3897813da627SRichard Henderson #ifdef DEBUG_JIT 3898813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 3899813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 3900813da627SRichard Henderson { 3901813da627SRichard Henderson FILE *f = fopen("/tmp/qemu.jit", "w+b"); 3902813da627SRichard Henderson if (f) { 39035872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 3904813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. */ 3905813da627SRichard Henderson } 3906813da627SRichard Henderson fclose(f); 3907813da627SRichard Henderson } 3908813da627SRichard Henderson } 3909813da627SRichard Henderson #endif 3910813da627SRichard Henderson 3911813da627SRichard Henderson one_entry.symfile_addr = img; 3912813da627SRichard Henderson one_entry.symfile_size = img_size; 3913813da627SRichard Henderson 3914813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 3915813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 3916813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 3917813da627SRichard Henderson __jit_debug_register_code(); 3918813da627SRichard Henderson } 3919813da627SRichard Henderson #else 39205872bbf2SRichard Henderson /* No support for the feature. 
Provide the entry point expected by exec.c, 39215872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 3922813da627SRichard Henderson 3923813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 39242c90784aSRichard Henderson const void *debug_frame, 39252c90784aSRichard Henderson size_t debug_frame_size) 3926813da627SRichard Henderson { 3927813da627SRichard Henderson } 3928813da627SRichard Henderson 3929813da627SRichard Henderson void tcg_register_jit(void *buf, size_t buf_size) 3930813da627SRichard Henderson { 3931813da627SRichard Henderson } 3932813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 3933db432672SRichard Henderson 3934db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec 3935db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...) 3936db432672SRichard Henderson { 3937db432672SRichard Henderson g_assert_not_reached(); 3938db432672SRichard Henderson } 3939db432672SRichard Henderson #endif 3940