1c896fe29Sbellard /* 2c896fe29Sbellard * Tiny Code Generator for QEMU 3c896fe29Sbellard * 4c896fe29Sbellard * Copyright (c) 2008 Fabrice Bellard 5c896fe29Sbellard * 6c896fe29Sbellard * Permission is hereby granted, free of charge, to any person obtaining a copy 7c896fe29Sbellard * of this software and associated documentation files (the "Software"), to deal 8c896fe29Sbellard * in the Software without restriction, including without limitation the rights 9c896fe29Sbellard * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10c896fe29Sbellard * copies of the Software, and to permit persons to whom the Software is 11c896fe29Sbellard * furnished to do so, subject to the following conditions: 12c896fe29Sbellard * 13c896fe29Sbellard * The above copyright notice and this permission notice shall be included in 14c896fe29Sbellard * all copies or substantial portions of the Software. 15c896fe29Sbellard * 16c896fe29Sbellard * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17c896fe29Sbellard * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18c896fe29Sbellard * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19c896fe29Sbellard * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20c896fe29Sbellard * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21c896fe29Sbellard * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 22c896fe29Sbellard * THE SOFTWARE. 23c896fe29Sbellard */ 24c896fe29Sbellard 25c896fe29Sbellard /* define it to use liveness analysis (better code) */ 268f2e8c07SKirill Batuzov #define USE_TCG_OPTIMIZATIONS 27c896fe29Sbellard 28757e725bSPeter Maydell #include "qemu/osdep.h" 29cca82982Saurel32 30813da627SRichard Henderson /* Define to jump the ELF file used to communicate with GDB. 
*/ 31813da627SRichard Henderson #undef DEBUG_JIT 32813da627SRichard Henderson 33f348b6d1SVeronia Bahaa #include "qemu/cutils.h" 341de7afc9SPaolo Bonzini #include "qemu/host-utils.h" 351de7afc9SPaolo Bonzini #include "qemu/timer.h" 36c896fe29Sbellard 37c5d3c498SStefan Weil /* Note: the long term plan is to reduce the dependencies on the QEMU 38c896fe29Sbellard CPU definitions. Currently they are used for qemu_ld/st 39c896fe29Sbellard instructions */ 40c896fe29Sbellard #define NO_CPU_IO_DEFS 41c896fe29Sbellard #include "cpu.h" 42c896fe29Sbellard 4363c91552SPaolo Bonzini #include "exec/cpu-common.h" 4463c91552SPaolo Bonzini #include "exec/exec-all.h" 4563c91552SPaolo Bonzini 46c896fe29Sbellard #include "tcg-op.h" 47813da627SRichard Henderson 48edee2579SRichard Henderson #if UINTPTR_MAX == UINT32_MAX 49813da627SRichard Henderson # define ELF_CLASS ELFCLASS32 50edee2579SRichard Henderson #else 51edee2579SRichard Henderson # define ELF_CLASS ELFCLASS64 52813da627SRichard Henderson #endif 53813da627SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 54813da627SRichard Henderson # define ELF_DATA ELFDATA2MSB 55813da627SRichard Henderson #else 56813da627SRichard Henderson # define ELF_DATA ELFDATA2LSB 57813da627SRichard Henderson #endif 58813da627SRichard Henderson 59c896fe29Sbellard #include "elf.h" 60508127e2SPaolo Bonzini #include "exec/log.h" 613468b59eSEmilio G. Cota #include "sysemu/sysemu.h" 62c896fe29Sbellard 63ce151109SPeter Maydell /* Forward declarations for functions declared in tcg-target.inc.c and 64ce151109SPeter Maydell used here. 
*/ 65e4d58b41SRichard Henderson static void tcg_target_init(TCGContext *s); 66f69d277eSRichard Henderson static const TCGTargetOpDef *tcg_target_op_def(TCGOpcode); 67e4d58b41SRichard Henderson static void tcg_target_qemu_prologue(TCGContext *s); 681813e175SRichard Henderson static void patch_reloc(tcg_insn_unit *code_ptr, int type, 692ba7fae2SRichard Henderson intptr_t value, intptr_t addend); 70c896fe29Sbellard 71497a22ebSRichard Henderson /* The CIE and FDE header definitions will be common to all hosts. */ 72497a22ebSRichard Henderson typedef struct { 73497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 74497a22ebSRichard Henderson uint32_t id; 75497a22ebSRichard Henderson uint8_t version; 76497a22ebSRichard Henderson char augmentation[1]; 77497a22ebSRichard Henderson uint8_t code_align; 78497a22ebSRichard Henderson uint8_t data_align; 79497a22ebSRichard Henderson uint8_t return_column; 80497a22ebSRichard Henderson } DebugFrameCIE; 81497a22ebSRichard Henderson 82497a22ebSRichard Henderson typedef struct QEMU_PACKED { 83497a22ebSRichard Henderson uint32_t len __attribute__((aligned((sizeof(void *))))); 84497a22ebSRichard Henderson uint32_t cie_offset; 85edee2579SRichard Henderson uintptr_t func_start; 86edee2579SRichard Henderson uintptr_t func_len; 87497a22ebSRichard Henderson } DebugFrameFDEHeader; 88497a22ebSRichard Henderson 892c90784aSRichard Henderson typedef struct QEMU_PACKED { 902c90784aSRichard Henderson DebugFrameCIE cie; 912c90784aSRichard Henderson DebugFrameFDEHeader fde; 922c90784aSRichard Henderson } DebugFrameHeader; 932c90784aSRichard Henderson 94813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 952c90784aSRichard Henderson const void *debug_frame, 962c90784aSRichard Henderson size_t debug_frame_size) 97813da627SRichard Henderson __attribute__((unused)); 98813da627SRichard Henderson 99ce151109SPeter Maydell /* Forward declarations for functions declared and used in 
tcg-target.inc.c. */ 100069ea736SRichard Henderson static const char *target_parse_constraint(TCGArgConstraint *ct, 101069ea736SRichard Henderson const char *ct_str, TCGType type); 1022a534affSRichard Henderson static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg1, 103a05b5b9bSRichard Henderson intptr_t arg2); 1042a534affSRichard Henderson static void tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg); 105c0ad3001SStefan Weil static void tcg_out_movi(TCGContext *s, TCGType type, 1062a534affSRichard Henderson TCGReg ret, tcg_target_long arg); 107c0ad3001SStefan Weil static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args, 108c0ad3001SStefan Weil const int *const_args); 109d2fd745fSRichard Henderson #if TCG_TARGET_MAYBE_vec 110d2fd745fSRichard Henderson static void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl, 111d2fd745fSRichard Henderson unsigned vece, const TCGArg *args, 112d2fd745fSRichard Henderson const int *const_args); 113d2fd745fSRichard Henderson #else 114d2fd745fSRichard Henderson static inline void tcg_out_vec_op(TCGContext *s, TCGOpcode opc, unsigned vecl, 115d2fd745fSRichard Henderson unsigned vece, const TCGArg *args, 116d2fd745fSRichard Henderson const int *const_args) 117d2fd745fSRichard Henderson { 118d2fd745fSRichard Henderson g_assert_not_reached(); 119d2fd745fSRichard Henderson } 120d2fd745fSRichard Henderson #endif 1212a534affSRichard Henderson static void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, TCGReg arg1, 122a05b5b9bSRichard Henderson intptr_t arg2); 12359d7c14eSRichard Henderson static bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val, 12459d7c14eSRichard Henderson TCGReg base, intptr_t ofs); 125cf066674SRichard Henderson static void tcg_out_call(TCGContext *s, tcg_insn_unit *target); 126f6c6afc1SRichard Henderson static int tcg_target_const_match(tcg_target_long val, TCGType type, 127c0ad3001SStefan Weil const TCGArgConstraint *arg_ct); 128659ef5cbSRichard 
Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 129659ef5cbSRichard Henderson static bool tcg_out_ldst_finalize(TCGContext *s); 130659ef5cbSRichard Henderson #endif 131c896fe29Sbellard 132a505785cSEmilio G. Cota #define TCG_HIGHWATER 1024 133a505785cSEmilio G. Cota 134df2cce29SEmilio G. Cota static TCGContext **tcg_ctxs; 135df2cce29SEmilio G. Cota static unsigned int n_tcg_ctxs; 1361c2adb95SRichard Henderson TCGv_env cpu_env = 0; 137df2cce29SEmilio G. Cota 138be2cdc5eSEmilio G. Cota struct tcg_region_tree { 139be2cdc5eSEmilio G. Cota QemuMutex lock; 140be2cdc5eSEmilio G. Cota GTree *tree; 141be2cdc5eSEmilio G. Cota /* padding to avoid false sharing is computed at run-time */ 142be2cdc5eSEmilio G. Cota }; 143be2cdc5eSEmilio G. Cota 144e8feb96fSEmilio G. Cota /* 145e8feb96fSEmilio G. Cota * We divide code_gen_buffer into equally-sized "regions" that TCG threads 146e8feb96fSEmilio G. Cota * dynamically allocate from as demand dictates. Given appropriate region 147e8feb96fSEmilio G. Cota * sizing, this minimizes flushes even when some TCG threads generate a lot 148e8feb96fSEmilio G. Cota * more code than others. 149e8feb96fSEmilio G. Cota */ 150e8feb96fSEmilio G. Cota struct tcg_region_state { 151e8feb96fSEmilio G. Cota QemuMutex lock; 152e8feb96fSEmilio G. Cota 153e8feb96fSEmilio G. Cota /* fields set at init time */ 154e8feb96fSEmilio G. Cota void *start; 155e8feb96fSEmilio G. Cota void *start_aligned; 156e8feb96fSEmilio G. Cota void *end; 157e8feb96fSEmilio G. Cota size_t n; 158e8feb96fSEmilio G. Cota size_t size; /* size of one region */ 159e8feb96fSEmilio G. Cota size_t stride; /* .size + guard size */ 160e8feb96fSEmilio G. Cota 161e8feb96fSEmilio G. Cota /* fields protected by the lock */ 162e8feb96fSEmilio G. Cota size_t current; /* current region index */ 163e8feb96fSEmilio G. Cota size_t agg_size_full; /* aggregate size of full regions */ 164e8feb96fSEmilio G. Cota }; 165e8feb96fSEmilio G. Cota 166e8feb96fSEmilio G. 
Cota static struct tcg_region_state region; 167be2cdc5eSEmilio G. Cota /* 168be2cdc5eSEmilio G. Cota * This is an array of struct tcg_region_tree's, with padding. 169be2cdc5eSEmilio G. Cota * We use void * to simplify the computation of region_trees[i]; each 170be2cdc5eSEmilio G. Cota * struct is found every tree_size bytes. 171be2cdc5eSEmilio G. Cota */ 172be2cdc5eSEmilio G. Cota static void *region_trees; 173be2cdc5eSEmilio G. Cota static size_t tree_size; 174d2fd745fSRichard Henderson static TCGRegSet tcg_target_available_regs[TCG_TYPE_COUNT]; 175b1d8e52eSblueswir1 static TCGRegSet tcg_target_call_clobber_regs; 176c896fe29Sbellard 1771813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE == 1 1784196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out8(TCGContext *s, uint8_t v) 179c896fe29Sbellard { 180c896fe29Sbellard *s->code_ptr++ = v; 181c896fe29Sbellard } 182c896fe29Sbellard 1834196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch8(tcg_insn_unit *p, 1844196dca6SPeter Maydell uint8_t v) 1855c53bb81SPeter Maydell { 1861813e175SRichard Henderson *p = v; 1875c53bb81SPeter Maydell } 1881813e175SRichard Henderson #endif 1895c53bb81SPeter Maydell 1901813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 2 1914196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out16(TCGContext *s, uint16_t v) 192c896fe29Sbellard { 1931813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 1941813e175SRichard Henderson *s->code_ptr++ = v; 1951813e175SRichard Henderson } else { 1961813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 1974387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 1981813e175SRichard Henderson s->code_ptr = p + (2 / TCG_TARGET_INSN_UNIT_SIZE); 1991813e175SRichard Henderson } 200c896fe29Sbellard } 201c896fe29Sbellard 2024196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch16(tcg_insn_unit *p, 2034196dca6SPeter Maydell uint16_t v) 2045c53bb81SPeter Maydell { 
2051813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 2) { 2061813e175SRichard Henderson *p = v; 2071813e175SRichard Henderson } else { 2085c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2095c53bb81SPeter Maydell } 2101813e175SRichard Henderson } 2111813e175SRichard Henderson #endif 2125c53bb81SPeter Maydell 2131813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 4 2144196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out32(TCGContext *s, uint32_t v) 215c896fe29Sbellard { 2161813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2171813e175SRichard Henderson *s->code_ptr++ = v; 2181813e175SRichard Henderson } else { 2191813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2204387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2211813e175SRichard Henderson s->code_ptr = p + (4 / TCG_TARGET_INSN_UNIT_SIZE); 2221813e175SRichard Henderson } 223c896fe29Sbellard } 224c896fe29Sbellard 2254196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch32(tcg_insn_unit *p, 2264196dca6SPeter Maydell uint32_t v) 2275c53bb81SPeter Maydell { 2281813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 4) { 2291813e175SRichard Henderson *p = v; 2301813e175SRichard Henderson } else { 2315c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2325c53bb81SPeter Maydell } 2331813e175SRichard Henderson } 2341813e175SRichard Henderson #endif 2355c53bb81SPeter Maydell 2361813e175SRichard Henderson #if TCG_TARGET_INSN_UNIT_SIZE <= 8 2374196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_out64(TCGContext *s, uint64_t v) 238ac26eb69SRichard Henderson { 2391813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2401813e175SRichard Henderson *s->code_ptr++ = v; 2411813e175SRichard Henderson } else { 2421813e175SRichard Henderson tcg_insn_unit *p = s->code_ptr; 2434387345aSPeter Maydell memcpy(p, &v, sizeof(v)); 2441813e175SRichard Henderson s->code_ptr = p + (8 / TCG_TARGET_INSN_UNIT_SIZE); 2451813e175SRichard 
Henderson } 246ac26eb69SRichard Henderson } 247ac26eb69SRichard Henderson 2484196dca6SPeter Maydell static __attribute__((unused)) inline void tcg_patch64(tcg_insn_unit *p, 2494196dca6SPeter Maydell uint64_t v) 2505c53bb81SPeter Maydell { 2511813e175SRichard Henderson if (TCG_TARGET_INSN_UNIT_SIZE == 8) { 2521813e175SRichard Henderson *p = v; 2531813e175SRichard Henderson } else { 2545c53bb81SPeter Maydell memcpy(p, &v, sizeof(v)); 2555c53bb81SPeter Maydell } 2561813e175SRichard Henderson } 2571813e175SRichard Henderson #endif 2585c53bb81SPeter Maydell 259c896fe29Sbellard /* label relocation processing */ 260c896fe29Sbellard 2611813e175SRichard Henderson static void tcg_out_reloc(TCGContext *s, tcg_insn_unit *code_ptr, int type, 262bec16311SRichard Henderson TCGLabel *l, intptr_t addend) 263c896fe29Sbellard { 264c896fe29Sbellard TCGRelocation *r; 265c896fe29Sbellard 266c896fe29Sbellard if (l->has_value) { 267623e265cSpbrook /* FIXME: This may break relocations on RISC targets that 268623e265cSpbrook modify instruction fields in place. The caller may not have 269623e265cSpbrook written the initial value. 
*/ 270f54b3f92Saurel32 patch_reloc(code_ptr, type, l->u.value, addend); 271c896fe29Sbellard } else { 272c896fe29Sbellard /* add a new relocation entry */ 273c896fe29Sbellard r = tcg_malloc(sizeof(TCGRelocation)); 274c896fe29Sbellard r->type = type; 275c896fe29Sbellard r->ptr = code_ptr; 276c896fe29Sbellard r->addend = addend; 277c896fe29Sbellard r->next = l->u.first_reloc; 278c896fe29Sbellard l->u.first_reloc = r; 279c896fe29Sbellard } 280c896fe29Sbellard } 281c896fe29Sbellard 282bec16311SRichard Henderson static void tcg_out_label(TCGContext *s, TCGLabel *l, tcg_insn_unit *ptr) 283c896fe29Sbellard { 2842ba7fae2SRichard Henderson intptr_t value = (intptr_t)ptr; 2851813e175SRichard Henderson TCGRelocation *r; 286c896fe29Sbellard 287eabb7b91SAurelien Jarno tcg_debug_assert(!l->has_value); 2881813e175SRichard Henderson 2891813e175SRichard Henderson for (r = l->u.first_reloc; r != NULL; r = r->next) { 290f54b3f92Saurel32 patch_reloc(r->ptr, r->type, value, r->addend); 291c896fe29Sbellard } 2921813e175SRichard Henderson 293c896fe29Sbellard l->has_value = 1; 2941813e175SRichard Henderson l->u.value_ptr = ptr; 295c896fe29Sbellard } 296c896fe29Sbellard 29742a268c2SRichard Henderson TCGLabel *gen_new_label(void) 298c896fe29Sbellard { 299b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 30051e3972cSRichard Henderson TCGLabel *l = tcg_malloc(sizeof(TCGLabel)); 301c896fe29Sbellard 30251e3972cSRichard Henderson *l = (TCGLabel){ 30351e3972cSRichard Henderson .id = s->nb_labels++ 30451e3972cSRichard Henderson }; 30542a268c2SRichard Henderson 30642a268c2SRichard Henderson return l; 307c896fe29Sbellard } 308c896fe29Sbellard 3099f754620SRichard Henderson static void set_jmp_reset_offset(TCGContext *s, int which) 3109f754620SRichard Henderson { 3119f754620SRichard Henderson size_t off = tcg_current_code_size(s); 3129f754620SRichard Henderson s->tb_jmp_reset_offset[which] = off; 3139f754620SRichard Henderson /* Make sure that we didn't overflow the stored offset. 
*/ 3149f754620SRichard Henderson assert(s->tb_jmp_reset_offset[which] == off); 3159f754620SRichard Henderson } 3169f754620SRichard Henderson 317ce151109SPeter Maydell #include "tcg-target.inc.c" 318c896fe29Sbellard 319be2cdc5eSEmilio G. Cota /* compare a pointer @ptr and a tb_tc @s */ 320be2cdc5eSEmilio G. Cota static int ptr_cmp_tb_tc(const void *ptr, const struct tb_tc *s) 321be2cdc5eSEmilio G. Cota { 322be2cdc5eSEmilio G. Cota if (ptr >= s->ptr + s->size) { 323be2cdc5eSEmilio G. Cota return 1; 324be2cdc5eSEmilio G. Cota } else if (ptr < s->ptr) { 325be2cdc5eSEmilio G. Cota return -1; 326be2cdc5eSEmilio G. Cota } 327be2cdc5eSEmilio G. Cota return 0; 328be2cdc5eSEmilio G. Cota } 329be2cdc5eSEmilio G. Cota 330be2cdc5eSEmilio G. Cota static gint tb_tc_cmp(gconstpointer ap, gconstpointer bp) 331be2cdc5eSEmilio G. Cota { 332be2cdc5eSEmilio G. Cota const struct tb_tc *a = ap; 333be2cdc5eSEmilio G. Cota const struct tb_tc *b = bp; 334be2cdc5eSEmilio G. Cota 335be2cdc5eSEmilio G. Cota /* 336be2cdc5eSEmilio G. Cota * When both sizes are set, we know this isn't a lookup. 337be2cdc5eSEmilio G. Cota * This is the most likely case: every TB must be inserted; lookups 338be2cdc5eSEmilio G. Cota * are a lot less frequent. 339be2cdc5eSEmilio G. Cota */ 340be2cdc5eSEmilio G. Cota if (likely(a->size && b->size)) { 341be2cdc5eSEmilio G. Cota if (a->ptr > b->ptr) { 342be2cdc5eSEmilio G. Cota return 1; 343be2cdc5eSEmilio G. Cota } else if (a->ptr < b->ptr) { 344be2cdc5eSEmilio G. Cota return -1; 345be2cdc5eSEmilio G. Cota } 346be2cdc5eSEmilio G. Cota /* a->ptr == b->ptr should happen only on deletions */ 347be2cdc5eSEmilio G. Cota g_assert(a->size == b->size); 348be2cdc5eSEmilio G. Cota return 0; 349be2cdc5eSEmilio G. Cota } 350be2cdc5eSEmilio G. Cota /* 351be2cdc5eSEmilio G. Cota * All lookups have either .size field set to 0. 352be2cdc5eSEmilio G. Cota * From the glib sources we see that @ap is always the lookup key. However 353be2cdc5eSEmilio G. 
Cota * the docs provide no guarantee, so we just mark this case as likely. 354be2cdc5eSEmilio G. Cota */ 355be2cdc5eSEmilio G. Cota if (likely(a->size == 0)) { 356be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(a->ptr, b); 357be2cdc5eSEmilio G. Cota } 358be2cdc5eSEmilio G. Cota return ptr_cmp_tb_tc(b->ptr, a); 359be2cdc5eSEmilio G. Cota } 360be2cdc5eSEmilio G. Cota 361be2cdc5eSEmilio G. Cota static void tcg_region_trees_init(void) 362be2cdc5eSEmilio G. Cota { 363be2cdc5eSEmilio G. Cota size_t i; 364be2cdc5eSEmilio G. Cota 365be2cdc5eSEmilio G. Cota tree_size = ROUND_UP(sizeof(struct tcg_region_tree), qemu_dcache_linesize); 366be2cdc5eSEmilio G. Cota region_trees = qemu_memalign(qemu_dcache_linesize, region.n * tree_size); 367be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 368be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 369be2cdc5eSEmilio G. Cota 370be2cdc5eSEmilio G. Cota qemu_mutex_init(&rt->lock); 371be2cdc5eSEmilio G. Cota rt->tree = g_tree_new(tb_tc_cmp); 372be2cdc5eSEmilio G. Cota } 373be2cdc5eSEmilio G. Cota } 374be2cdc5eSEmilio G. Cota 375be2cdc5eSEmilio G. Cota static struct tcg_region_tree *tc_ptr_to_region_tree(void *p) 376be2cdc5eSEmilio G. Cota { 377be2cdc5eSEmilio G. Cota size_t region_idx; 378be2cdc5eSEmilio G. Cota 379be2cdc5eSEmilio G. Cota if (p < region.start_aligned) { 380be2cdc5eSEmilio G. Cota region_idx = 0; 381be2cdc5eSEmilio G. Cota } else { 382be2cdc5eSEmilio G. Cota ptrdiff_t offset = p - region.start_aligned; 383be2cdc5eSEmilio G. Cota 384be2cdc5eSEmilio G. Cota if (offset > region.stride * (region.n - 1)) { 385be2cdc5eSEmilio G. Cota region_idx = region.n - 1; 386be2cdc5eSEmilio G. Cota } else { 387be2cdc5eSEmilio G. Cota region_idx = offset / region.stride; 388be2cdc5eSEmilio G. Cota } 389be2cdc5eSEmilio G. Cota } 390be2cdc5eSEmilio G. Cota return region_trees + region_idx * tree_size; 391be2cdc5eSEmilio G. Cota } 392be2cdc5eSEmilio G. Cota 393be2cdc5eSEmilio G. 
Cota void tcg_tb_insert(TranslationBlock *tb) 394be2cdc5eSEmilio G. Cota { 395be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 396be2cdc5eSEmilio G. Cota 397be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 398be2cdc5eSEmilio G. Cota g_tree_insert(rt->tree, &tb->tc, tb); 399be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 400be2cdc5eSEmilio G. Cota } 401be2cdc5eSEmilio G. Cota 402be2cdc5eSEmilio G. Cota void tcg_tb_remove(TranslationBlock *tb) 403be2cdc5eSEmilio G. Cota { 404be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree(tb->tc.ptr); 405be2cdc5eSEmilio G. Cota 406be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 407be2cdc5eSEmilio G. Cota g_tree_remove(rt->tree, &tb->tc); 408be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 409be2cdc5eSEmilio G. Cota } 410be2cdc5eSEmilio G. Cota 411be2cdc5eSEmilio G. Cota /* 412be2cdc5eSEmilio G. Cota * Find the TB 'tb' such that 413be2cdc5eSEmilio G. Cota * tb->tc.ptr <= tc_ptr < tb->tc.ptr + tb->tc.size 414be2cdc5eSEmilio G. Cota * Return NULL if not found. 415be2cdc5eSEmilio G. Cota */ 416be2cdc5eSEmilio G. Cota TranslationBlock *tcg_tb_lookup(uintptr_t tc_ptr) 417be2cdc5eSEmilio G. Cota { 418be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = tc_ptr_to_region_tree((void *)tc_ptr); 419be2cdc5eSEmilio G. Cota TranslationBlock *tb; 420be2cdc5eSEmilio G. Cota struct tb_tc s = { .ptr = (void *)tc_ptr }; 421be2cdc5eSEmilio G. Cota 422be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 423be2cdc5eSEmilio G. Cota tb = g_tree_lookup(rt->tree, &s); 424be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 425be2cdc5eSEmilio G. Cota return tb; 426be2cdc5eSEmilio G. Cota } 427be2cdc5eSEmilio G. Cota 428be2cdc5eSEmilio G. Cota static void tcg_region_tree_lock_all(void) 429be2cdc5eSEmilio G. Cota { 430be2cdc5eSEmilio G. Cota size_t i; 431be2cdc5eSEmilio G. Cota 432be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 433be2cdc5eSEmilio G. 
Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 434be2cdc5eSEmilio G. Cota 435be2cdc5eSEmilio G. Cota qemu_mutex_lock(&rt->lock); 436be2cdc5eSEmilio G. Cota } 437be2cdc5eSEmilio G. Cota } 438be2cdc5eSEmilio G. Cota 439be2cdc5eSEmilio G. Cota static void tcg_region_tree_unlock_all(void) 440be2cdc5eSEmilio G. Cota { 441be2cdc5eSEmilio G. Cota size_t i; 442be2cdc5eSEmilio G. Cota 443be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 444be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 445be2cdc5eSEmilio G. Cota 446be2cdc5eSEmilio G. Cota qemu_mutex_unlock(&rt->lock); 447be2cdc5eSEmilio G. Cota } 448be2cdc5eSEmilio G. Cota } 449be2cdc5eSEmilio G. Cota 450be2cdc5eSEmilio G. Cota void tcg_tb_foreach(GTraverseFunc func, gpointer user_data) 451be2cdc5eSEmilio G. Cota { 452be2cdc5eSEmilio G. Cota size_t i; 453be2cdc5eSEmilio G. Cota 454be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 455be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 456be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 457be2cdc5eSEmilio G. Cota 458be2cdc5eSEmilio G. Cota g_tree_foreach(rt->tree, func, user_data); 459be2cdc5eSEmilio G. Cota } 460be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 461be2cdc5eSEmilio G. Cota } 462be2cdc5eSEmilio G. Cota 463be2cdc5eSEmilio G. Cota size_t tcg_nb_tbs(void) 464be2cdc5eSEmilio G. Cota { 465be2cdc5eSEmilio G. Cota size_t nb_tbs = 0; 466be2cdc5eSEmilio G. Cota size_t i; 467be2cdc5eSEmilio G. Cota 468be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 469be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 470be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 471be2cdc5eSEmilio G. Cota 472be2cdc5eSEmilio G. Cota nb_tbs += g_tree_nnodes(rt->tree); 473be2cdc5eSEmilio G. Cota } 474be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 475be2cdc5eSEmilio G. Cota return nb_tbs; 476be2cdc5eSEmilio G. Cota } 477be2cdc5eSEmilio G. 
Cota 478be2cdc5eSEmilio G. Cota static void tcg_region_tree_reset_all(void) 479be2cdc5eSEmilio G. Cota { 480be2cdc5eSEmilio G. Cota size_t i; 481be2cdc5eSEmilio G. Cota 482be2cdc5eSEmilio G. Cota tcg_region_tree_lock_all(); 483be2cdc5eSEmilio G. Cota for (i = 0; i < region.n; i++) { 484be2cdc5eSEmilio G. Cota struct tcg_region_tree *rt = region_trees + i * tree_size; 485be2cdc5eSEmilio G. Cota 486be2cdc5eSEmilio G. Cota /* Increment the refcount first so that destroy acts as a reset */ 487be2cdc5eSEmilio G. Cota g_tree_ref(rt->tree); 488be2cdc5eSEmilio G. Cota g_tree_destroy(rt->tree); 489be2cdc5eSEmilio G. Cota } 490be2cdc5eSEmilio G. Cota tcg_region_tree_unlock_all(); 491be2cdc5eSEmilio G. Cota } 492be2cdc5eSEmilio G. Cota 493e8feb96fSEmilio G. Cota static void tcg_region_bounds(size_t curr_region, void **pstart, void **pend) 494e8feb96fSEmilio G. Cota { 495e8feb96fSEmilio G. Cota void *start, *end; 496e8feb96fSEmilio G. Cota 497e8feb96fSEmilio G. Cota start = region.start_aligned + curr_region * region.stride; 498e8feb96fSEmilio G. Cota end = start + region.size; 499e8feb96fSEmilio G. Cota 500e8feb96fSEmilio G. Cota if (curr_region == 0) { 501e8feb96fSEmilio G. Cota start = region.start; 502e8feb96fSEmilio G. Cota } 503e8feb96fSEmilio G. Cota if (curr_region == region.n - 1) { 504e8feb96fSEmilio G. Cota end = region.end; 505e8feb96fSEmilio G. Cota } 506e8feb96fSEmilio G. Cota 507e8feb96fSEmilio G. Cota *pstart = start; 508e8feb96fSEmilio G. Cota *pend = end; 509e8feb96fSEmilio G. Cota } 510e8feb96fSEmilio G. Cota 511e8feb96fSEmilio G. Cota static void tcg_region_assign(TCGContext *s, size_t curr_region) 512e8feb96fSEmilio G. Cota { 513e8feb96fSEmilio G. Cota void *start, *end; 514e8feb96fSEmilio G. Cota 515e8feb96fSEmilio G. Cota tcg_region_bounds(curr_region, &start, &end); 516e8feb96fSEmilio G. Cota 517e8feb96fSEmilio G. Cota s->code_gen_buffer = start; 518e8feb96fSEmilio G. Cota s->code_gen_ptr = start; 519e8feb96fSEmilio G. 
Cota s->code_gen_buffer_size = end - start; 520e8feb96fSEmilio G. Cota s->code_gen_highwater = end - TCG_HIGHWATER; 521e8feb96fSEmilio G. Cota } 522e8feb96fSEmilio G. Cota 523e8feb96fSEmilio G. Cota static bool tcg_region_alloc__locked(TCGContext *s) 524e8feb96fSEmilio G. Cota { 525e8feb96fSEmilio G. Cota if (region.current == region.n) { 526e8feb96fSEmilio G. Cota return true; 527e8feb96fSEmilio G. Cota } 528e8feb96fSEmilio G. Cota tcg_region_assign(s, region.current); 529e8feb96fSEmilio G. Cota region.current++; 530e8feb96fSEmilio G. Cota return false; 531e8feb96fSEmilio G. Cota } 532e8feb96fSEmilio G. Cota 533e8feb96fSEmilio G. Cota /* 534e8feb96fSEmilio G. Cota * Request a new region once the one in use has filled up. 535e8feb96fSEmilio G. Cota * Returns true on error. 536e8feb96fSEmilio G. Cota */ 537e8feb96fSEmilio G. Cota static bool tcg_region_alloc(TCGContext *s) 538e8feb96fSEmilio G. Cota { 539e8feb96fSEmilio G. Cota bool err; 540e8feb96fSEmilio G. Cota /* read the region size now; alloc__locked will overwrite it on success */ 541e8feb96fSEmilio G. Cota size_t size_full = s->code_gen_buffer_size; 542e8feb96fSEmilio G. Cota 543e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 544e8feb96fSEmilio G. Cota err = tcg_region_alloc__locked(s); 545e8feb96fSEmilio G. Cota if (!err) { 546e8feb96fSEmilio G. Cota region.agg_size_full += size_full - TCG_HIGHWATER; 547e8feb96fSEmilio G. Cota } 548e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 549e8feb96fSEmilio G. Cota return err; 550e8feb96fSEmilio G. Cota } 551e8feb96fSEmilio G. Cota 552e8feb96fSEmilio G. Cota /* 553e8feb96fSEmilio G. Cota * Perform a context's first region allocation. 554e8feb96fSEmilio G. Cota * This function does _not_ increment region.agg_size_full. 555e8feb96fSEmilio G. Cota */ 556e8feb96fSEmilio G. Cota static inline bool tcg_region_initial_alloc__locked(TCGContext *s) 557e8feb96fSEmilio G. Cota { 558e8feb96fSEmilio G. Cota return tcg_region_alloc__locked(s); 559e8feb96fSEmilio G. 
Cota } 560e8feb96fSEmilio G. Cota 561e8feb96fSEmilio G. Cota /* Call from a safe-work context */ 562e8feb96fSEmilio G. Cota void tcg_region_reset_all(void) 563e8feb96fSEmilio G. Cota { 5643468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 565e8feb96fSEmilio G. Cota unsigned int i; 566e8feb96fSEmilio G. Cota 567e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 568e8feb96fSEmilio G. Cota region.current = 0; 569e8feb96fSEmilio G. Cota region.agg_size_full = 0; 570e8feb96fSEmilio G. Cota 5713468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 5723468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 5733468b59eSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(s); 574e8feb96fSEmilio G. Cota 575e8feb96fSEmilio G. Cota g_assert(!err); 576e8feb96fSEmilio G. Cota } 577e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 578be2cdc5eSEmilio G. Cota 579be2cdc5eSEmilio G. Cota tcg_region_tree_reset_all(); 580e8feb96fSEmilio G. Cota } 581e8feb96fSEmilio G. Cota 5823468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 5833468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5843468b59eSEmilio G. Cota { 5853468b59eSEmilio G. Cota return 1; 5863468b59eSEmilio G. Cota } 5873468b59eSEmilio G. Cota #else 5883468b59eSEmilio G. Cota /* 5893468b59eSEmilio G. Cota * It is likely that some vCPUs will translate more code than others, so we 5903468b59eSEmilio G. Cota * first try to set more regions than max_cpus, with those regions being of 5913468b59eSEmilio G. Cota * reasonable size. If that's not possible we make do by evenly dividing 5923468b59eSEmilio G. Cota * the code_gen_buffer among the vCPUs. 5933468b59eSEmilio G. Cota */ 5943468b59eSEmilio G. Cota static size_t tcg_n_regions(void) 5953468b59eSEmilio G. Cota { 5963468b59eSEmilio G. Cota size_t i; 5973468b59eSEmilio G. Cota 5983468b59eSEmilio G. Cota /* Use a single region if all we have is one vCPU thread */ 5993468b59eSEmilio G. 
Cota if (max_cpus == 1 || !qemu_tcg_mttcg_enabled()) { 6003468b59eSEmilio G. Cota return 1; 6013468b59eSEmilio G. Cota } 6023468b59eSEmilio G. Cota 6033468b59eSEmilio G. Cota /* Try to have more regions than max_cpus, with each region being >= 2 MB */ 6043468b59eSEmilio G. Cota for (i = 8; i > 0; i--) { 6053468b59eSEmilio G. Cota size_t regions_per_thread = i; 6063468b59eSEmilio G. Cota size_t region_size; 6073468b59eSEmilio G. Cota 6083468b59eSEmilio G. Cota region_size = tcg_init_ctx.code_gen_buffer_size; 6093468b59eSEmilio G. Cota region_size /= max_cpus * regions_per_thread; 6103468b59eSEmilio G. Cota 6113468b59eSEmilio G. Cota if (region_size >= 2 * 1024u * 1024) { 6123468b59eSEmilio G. Cota return max_cpus * regions_per_thread; 6133468b59eSEmilio G. Cota } 6143468b59eSEmilio G. Cota } 6153468b59eSEmilio G. Cota /* If we can't, then just allocate one region per vCPU thread */ 6163468b59eSEmilio G. Cota return max_cpus; 6173468b59eSEmilio G. Cota } 6183468b59eSEmilio G. Cota #endif 6193468b59eSEmilio G. Cota 620e8feb96fSEmilio G. Cota /* 621e8feb96fSEmilio G. Cota * Initializes region partitioning. 622e8feb96fSEmilio G. Cota * 623e8feb96fSEmilio G. Cota * Called at init time from the parent thread (i.e. the one calling 624e8feb96fSEmilio G. Cota * tcg_context_init), after the target's TCG globals have been set. 6253468b59eSEmilio G. Cota * 6263468b59eSEmilio G. Cota * Region partitioning works by splitting code_gen_buffer into separate regions, 6273468b59eSEmilio G. Cota * and then assigning regions to TCG threads so that the threads can translate 6283468b59eSEmilio G. Cota * code in parallel without synchronization. 6293468b59eSEmilio G. Cota * 6303468b59eSEmilio G. Cota * In softmmu the number of TCG threads is bounded by max_cpus, so we use at 6313468b59eSEmilio G. Cota * least max_cpus regions in MTTCG. In !MTTCG we use a single region. 6323468b59eSEmilio G. Cota * Note that the TCG options from the command-line (i.e. 
-accel accel=tcg,[...]) 6333468b59eSEmilio G. Cota * must have been parsed before calling this function, since it calls 6343468b59eSEmilio G. Cota * qemu_tcg_mttcg_enabled(). 6353468b59eSEmilio G. Cota * 6363468b59eSEmilio G. Cota * In user-mode we use a single region. Having multiple regions in user-mode 6373468b59eSEmilio G. Cota * is not supported, because the number of vCPU threads (recall that each thread 6383468b59eSEmilio G. Cota * spawned by the guest corresponds to a vCPU thread) is only bounded by the 6393468b59eSEmilio G. Cota * OS, and usually this number is huge (tens of thousands is not uncommon). 6403468b59eSEmilio G. Cota * Thus, given this large bound on the number of vCPU threads and the fact 6413468b59eSEmilio G. Cota * that code_gen_buffer is allocated at compile-time, we cannot guarantee 6423468b59eSEmilio G. Cota * that the availability of at least one region per vCPU thread. 6433468b59eSEmilio G. Cota * 6443468b59eSEmilio G. Cota * However, this user-mode limitation is unlikely to be a significant problem 6453468b59eSEmilio G. Cota * in practice. Multi-threaded guests share most if not all of their translated 6463468b59eSEmilio G. Cota * code, which makes parallel code generation less appealing than in softmmu. 647e8feb96fSEmilio G. Cota */ 648e8feb96fSEmilio G. Cota void tcg_region_init(void) 649e8feb96fSEmilio G. Cota { 650e8feb96fSEmilio G. Cota void *buf = tcg_init_ctx.code_gen_buffer; 651e8feb96fSEmilio G. Cota void *aligned; 652e8feb96fSEmilio G. Cota size_t size = tcg_init_ctx.code_gen_buffer_size; 653e8feb96fSEmilio G. Cota size_t page_size = qemu_real_host_page_size; 654e8feb96fSEmilio G. Cota size_t region_size; 655e8feb96fSEmilio G. Cota size_t n_regions; 656e8feb96fSEmilio G. Cota size_t i; 657e8feb96fSEmilio G. Cota 6583468b59eSEmilio G. Cota n_regions = tcg_n_regions(); 659e8feb96fSEmilio G. Cota 660e8feb96fSEmilio G. Cota /* The first region will be 'aligned - buf' bytes larger than the others */ 661e8feb96fSEmilio G. 
Cota aligned = QEMU_ALIGN_PTR_UP(buf, page_size); 662e8feb96fSEmilio G. Cota g_assert(aligned < tcg_init_ctx.code_gen_buffer + size); 663e8feb96fSEmilio G. Cota /* 664e8feb96fSEmilio G. Cota * Make region_size a multiple of page_size, using aligned as the start. 665e8feb96fSEmilio G. Cota * As a result of this we might end up with a few extra pages at the end of 666e8feb96fSEmilio G. Cota * the buffer; we will assign those to the last region. 667e8feb96fSEmilio G. Cota */ 668e8feb96fSEmilio G. Cota region_size = (size - (aligned - buf)) / n_regions; 669e8feb96fSEmilio G. Cota region_size = QEMU_ALIGN_DOWN(region_size, page_size); 670e8feb96fSEmilio G. Cota 671e8feb96fSEmilio G. Cota /* A region must have at least 2 pages; one code, one guard */ 672e8feb96fSEmilio G. Cota g_assert(region_size >= 2 * page_size); 673e8feb96fSEmilio G. Cota 674e8feb96fSEmilio G. Cota /* init the region struct */ 675e8feb96fSEmilio G. Cota qemu_mutex_init(®ion.lock); 676e8feb96fSEmilio G. Cota region.n = n_regions; 677e8feb96fSEmilio G. Cota region.size = region_size - page_size; 678e8feb96fSEmilio G. Cota region.stride = region_size; 679e8feb96fSEmilio G. Cota region.start = buf; 680e8feb96fSEmilio G. Cota region.start_aligned = aligned; 681e8feb96fSEmilio G. Cota /* page-align the end, since its last page will be a guard page */ 682e8feb96fSEmilio G. Cota region.end = QEMU_ALIGN_PTR_DOWN(buf + size, page_size); 683e8feb96fSEmilio G. Cota /* account for that last guard page */ 684e8feb96fSEmilio G. Cota region.end -= page_size; 685e8feb96fSEmilio G. Cota 686e8feb96fSEmilio G. Cota /* set guard pages */ 687e8feb96fSEmilio G. Cota for (i = 0; i < region.n; i++) { 688e8feb96fSEmilio G. Cota void *start, *end; 689e8feb96fSEmilio G. Cota int rc; 690e8feb96fSEmilio G. Cota 691e8feb96fSEmilio G. Cota tcg_region_bounds(i, &start, &end); 692e8feb96fSEmilio G. Cota rc = qemu_mprotect_none(end, page_size); 693e8feb96fSEmilio G. Cota g_assert(!rc); 694e8feb96fSEmilio G. 
Cota } 695e8feb96fSEmilio G. Cota 696be2cdc5eSEmilio G. Cota tcg_region_trees_init(); 697be2cdc5eSEmilio G. Cota 6983468b59eSEmilio G. Cota /* In user-mode we support only one ctx, so do the initial allocation now */ 6993468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 700e8feb96fSEmilio G. Cota { 701e8feb96fSEmilio G. Cota bool err = tcg_region_initial_alloc__locked(tcg_ctx); 702e8feb96fSEmilio G. Cota 703e8feb96fSEmilio G. Cota g_assert(!err); 704e8feb96fSEmilio G. Cota } 7053468b59eSEmilio G. Cota #endif 706e8feb96fSEmilio G. Cota } 707e8feb96fSEmilio G. Cota 708e8feb96fSEmilio G. Cota /* 7093468b59eSEmilio G. Cota * All TCG threads except the parent (i.e. the one that called tcg_context_init 7103468b59eSEmilio G. Cota * and registered the target's TCG globals) must register with this function 7113468b59eSEmilio G. Cota * before initiating translation. 7123468b59eSEmilio G. Cota * 7133468b59eSEmilio G. Cota * In user-mode we just point tcg_ctx to tcg_init_ctx. See the documentation 7143468b59eSEmilio G. Cota * of tcg_region_init() for the reasoning behind this. 7153468b59eSEmilio G. Cota * 7163468b59eSEmilio G. Cota * In softmmu each caller registers its context in tcg_ctxs[]. Note that in 7173468b59eSEmilio G. Cota * softmmu tcg_ctxs[] does not track tcg_ctx_init, since the initial context 7183468b59eSEmilio G. Cota * is not used anymore for translation once this function is called. 7193468b59eSEmilio G. Cota * 7203468b59eSEmilio G. Cota * Not tracking tcg_init_ctx in tcg_ctxs[] in softmmu keeps code that iterates 7213468b59eSEmilio G. Cota * over the array (e.g. tcg_code_size() the same for both softmmu and user-mode. 7223468b59eSEmilio G. Cota */ 7233468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 7243468b59eSEmilio G. Cota void tcg_register_thread(void) 7253468b59eSEmilio G. Cota { 7263468b59eSEmilio G. Cota tcg_ctx = &tcg_init_ctx; 7273468b59eSEmilio G. Cota } 7283468b59eSEmilio G. Cota #else 7293468b59eSEmilio G. 
Cota void tcg_register_thread(void) 7303468b59eSEmilio G. Cota { 7313468b59eSEmilio G. Cota TCGContext *s = g_malloc(sizeof(*s)); 7323468b59eSEmilio G. Cota unsigned int i, n; 7333468b59eSEmilio G. Cota bool err; 7343468b59eSEmilio G. Cota 7353468b59eSEmilio G. Cota *s = tcg_init_ctx; 7363468b59eSEmilio G. Cota 7373468b59eSEmilio G. Cota /* Relink mem_base. */ 7383468b59eSEmilio G. Cota for (i = 0, n = tcg_init_ctx.nb_globals; i < n; ++i) { 7393468b59eSEmilio G. Cota if (tcg_init_ctx.temps[i].mem_base) { 7403468b59eSEmilio G. Cota ptrdiff_t b = tcg_init_ctx.temps[i].mem_base - tcg_init_ctx.temps; 7413468b59eSEmilio G. Cota tcg_debug_assert(b >= 0 && b < n); 7423468b59eSEmilio G. Cota s->temps[i].mem_base = &s->temps[b]; 7433468b59eSEmilio G. Cota } 7443468b59eSEmilio G. Cota } 7453468b59eSEmilio G. Cota 7463468b59eSEmilio G. Cota /* Claim an entry in tcg_ctxs */ 7473468b59eSEmilio G. Cota n = atomic_fetch_inc(&n_tcg_ctxs); 7483468b59eSEmilio G. Cota g_assert(n < max_cpus); 7493468b59eSEmilio G. Cota atomic_set(&tcg_ctxs[n], s); 7503468b59eSEmilio G. Cota 7513468b59eSEmilio G. Cota tcg_ctx = s; 7523468b59eSEmilio G. Cota qemu_mutex_lock(®ion.lock); 7533468b59eSEmilio G. Cota err = tcg_region_initial_alloc__locked(tcg_ctx); 7543468b59eSEmilio G. Cota g_assert(!err); 7553468b59eSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 7563468b59eSEmilio G. Cota } 7573468b59eSEmilio G. Cota #endif /* !CONFIG_USER_ONLY */ 7583468b59eSEmilio G. Cota 7593468b59eSEmilio G. Cota /* 760e8feb96fSEmilio G. Cota * Returns the size (in bytes) of all translated code (i.e. from all regions) 761e8feb96fSEmilio G. Cota * currently in the cache. 762e8feb96fSEmilio G. Cota * See also: tcg_code_capacity() 763e8feb96fSEmilio G. Cota * Do not confuse with tcg_current_code_size(); that one applies to a single 764e8feb96fSEmilio G. Cota * TCG context. 765e8feb96fSEmilio G. Cota */ 766e8feb96fSEmilio G. Cota size_t tcg_code_size(void) 767e8feb96fSEmilio G. Cota { 7683468b59eSEmilio G. 
Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 769e8feb96fSEmilio G. Cota unsigned int i; 770e8feb96fSEmilio G. Cota size_t total; 771e8feb96fSEmilio G. Cota 772e8feb96fSEmilio G. Cota qemu_mutex_lock(®ion.lock); 773e8feb96fSEmilio G. Cota total = region.agg_size_full; 7743468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 7753468b59eSEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 776e8feb96fSEmilio G. Cota size_t size; 777e8feb96fSEmilio G. Cota 778e8feb96fSEmilio G. Cota size = atomic_read(&s->code_gen_ptr) - s->code_gen_buffer; 779e8feb96fSEmilio G. Cota g_assert(size <= s->code_gen_buffer_size); 780e8feb96fSEmilio G. Cota total += size; 781e8feb96fSEmilio G. Cota } 782e8feb96fSEmilio G. Cota qemu_mutex_unlock(®ion.lock); 783e8feb96fSEmilio G. Cota return total; 784e8feb96fSEmilio G. Cota } 785e8feb96fSEmilio G. Cota 786e8feb96fSEmilio G. Cota /* 787e8feb96fSEmilio G. Cota * Returns the code capacity (in bytes) of the entire cache, i.e. including all 788e8feb96fSEmilio G. Cota * regions. 789e8feb96fSEmilio G. Cota * See also: tcg_code_size() 790e8feb96fSEmilio G. Cota */ 791e8feb96fSEmilio G. Cota size_t tcg_code_capacity(void) 792e8feb96fSEmilio G. Cota { 793e8feb96fSEmilio G. Cota size_t guard_size, capacity; 794e8feb96fSEmilio G. Cota 795e8feb96fSEmilio G. Cota /* no need for synchronization; these variables are set at init time */ 796e8feb96fSEmilio G. Cota guard_size = region.stride - region.size; 797e8feb96fSEmilio G. Cota capacity = region.end + guard_size - region.start; 798e8feb96fSEmilio G. Cota capacity -= region.n * (guard_size + TCG_HIGHWATER); 799e8feb96fSEmilio G. Cota return capacity; 800e8feb96fSEmilio G. Cota } 801e8feb96fSEmilio G. Cota 802128ed227SEmilio G. Cota size_t tcg_tb_phys_invalidate_count(void) 803128ed227SEmilio G. Cota { 804128ed227SEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 805128ed227SEmilio G. Cota unsigned int i; 806128ed227SEmilio G. Cota size_t total = 0; 807128ed227SEmilio G. 
Cota 808128ed227SEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 809128ed227SEmilio G. Cota const TCGContext *s = atomic_read(&tcg_ctxs[i]); 810128ed227SEmilio G. Cota 811128ed227SEmilio G. Cota total += atomic_read(&s->tb_phys_invalidate_count); 812128ed227SEmilio G. Cota } 813128ed227SEmilio G. Cota return total; 814128ed227SEmilio G. Cota } 815128ed227SEmilio G. Cota 816c896fe29Sbellard /* pool based memory allocation */ 817c896fe29Sbellard void *tcg_malloc_internal(TCGContext *s, int size) 818c896fe29Sbellard { 819c896fe29Sbellard TCGPool *p; 820c896fe29Sbellard int pool_size; 821c896fe29Sbellard 822c896fe29Sbellard if (size > TCG_POOL_CHUNK_SIZE) { 823c896fe29Sbellard /* big malloc: insert a new pool (XXX: could optimize) */ 8247267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + size); 825c896fe29Sbellard p->size = size; 8264055299eSKirill Batuzov p->next = s->pool_first_large; 8274055299eSKirill Batuzov s->pool_first_large = p; 8284055299eSKirill Batuzov return p->data; 829c896fe29Sbellard } else { 830c896fe29Sbellard p = s->pool_current; 831c896fe29Sbellard if (!p) { 832c896fe29Sbellard p = s->pool_first; 833c896fe29Sbellard if (!p) 834c896fe29Sbellard goto new_pool; 835c896fe29Sbellard } else { 836c896fe29Sbellard if (!p->next) { 837c896fe29Sbellard new_pool: 838c896fe29Sbellard pool_size = TCG_POOL_CHUNK_SIZE; 8397267c094SAnthony Liguori p = g_malloc(sizeof(TCGPool) + pool_size); 840c896fe29Sbellard p->size = pool_size; 841c896fe29Sbellard p->next = NULL; 842c896fe29Sbellard if (s->pool_current) 843c896fe29Sbellard s->pool_current->next = p; 844c896fe29Sbellard else 845c896fe29Sbellard s->pool_first = p; 846c896fe29Sbellard } else { 847c896fe29Sbellard p = p->next; 848c896fe29Sbellard } 849c896fe29Sbellard } 850c896fe29Sbellard } 851c896fe29Sbellard s->pool_current = p; 852c896fe29Sbellard s->pool_cur = p->data + size; 853c896fe29Sbellard s->pool_end = p->data + p->size; 854c896fe29Sbellard return p->data; 855c896fe29Sbellard } 856c896fe29Sbellard 
857c896fe29Sbellard void tcg_pool_reset(TCGContext *s) 858c896fe29Sbellard { 8594055299eSKirill Batuzov TCGPool *p, *t; 8604055299eSKirill Batuzov for (p = s->pool_first_large; p; p = t) { 8614055299eSKirill Batuzov t = p->next; 8624055299eSKirill Batuzov g_free(p); 8634055299eSKirill Batuzov } 8644055299eSKirill Batuzov s->pool_first_large = NULL; 865c896fe29Sbellard s->pool_cur = s->pool_end = NULL; 866c896fe29Sbellard s->pool_current = NULL; 867c896fe29Sbellard } 868c896fe29Sbellard 869100b5e01SRichard Henderson typedef struct TCGHelperInfo { 870100b5e01SRichard Henderson void *func; 871100b5e01SRichard Henderson const char *name; 872afb49896SRichard Henderson unsigned flags; 873afb49896SRichard Henderson unsigned sizemask; 874100b5e01SRichard Henderson } TCGHelperInfo; 875100b5e01SRichard Henderson 8762ef6175aSRichard Henderson #include "exec/helper-proto.h" 8772ef6175aSRichard Henderson 878100b5e01SRichard Henderson static const TCGHelperInfo all_helpers[] = { 8792ef6175aSRichard Henderson #include "exec/helper-tcg.h" 880100b5e01SRichard Henderson }; 881619205fdSEmilio G. 
Cota static GHashTable *helper_table; 882100b5e01SRichard Henderson 88391478cefSRichard Henderson static int indirect_reg_alloc_order[ARRAY_SIZE(tcg_target_reg_alloc_order)]; 884f69d277eSRichard Henderson static void process_op_defs(TCGContext *s); 8851c2adb95SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 8861c2adb95SRichard Henderson TCGReg reg, const char *name); 88791478cefSRichard Henderson 888c896fe29Sbellard void tcg_context_init(TCGContext *s) 889c896fe29Sbellard { 890100b5e01SRichard Henderson int op, total_args, n, i; 891c896fe29Sbellard TCGOpDef *def; 892c896fe29Sbellard TCGArgConstraint *args_ct; 893c896fe29Sbellard int *sorted_args; 8941c2adb95SRichard Henderson TCGTemp *ts; 895c896fe29Sbellard 896c896fe29Sbellard memset(s, 0, sizeof(*s)); 897c896fe29Sbellard s->nb_globals = 0; 898c896fe29Sbellard 899c896fe29Sbellard /* Count total number of arguments and allocate the corresponding 900c896fe29Sbellard space */ 901c896fe29Sbellard total_args = 0; 902c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 903c896fe29Sbellard def = &tcg_op_defs[op]; 904c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 905c896fe29Sbellard total_args += n; 906c896fe29Sbellard } 907c896fe29Sbellard 9087267c094SAnthony Liguori args_ct = g_malloc(sizeof(TCGArgConstraint) * total_args); 9097267c094SAnthony Liguori sorted_args = g_malloc(sizeof(int) * total_args); 910c896fe29Sbellard 911c896fe29Sbellard for(op = 0; op < NB_OPS; op++) { 912c896fe29Sbellard def = &tcg_op_defs[op]; 913c896fe29Sbellard def->args_ct = args_ct; 914c896fe29Sbellard def->sorted_args = sorted_args; 915c896fe29Sbellard n = def->nb_iargs + def->nb_oargs; 916c896fe29Sbellard sorted_args += n; 917c896fe29Sbellard args_ct += n; 918c896fe29Sbellard } 919c896fe29Sbellard 9205cd8f621SRichard Henderson /* Register helpers. */ 92184fd9dd3SRichard Henderson /* Use g_direct_hash/equal for direct pointer comparisons on func. */ 922619205fdSEmilio G. 
Cota helper_table = g_hash_table_new(NULL, NULL); 92384fd9dd3SRichard Henderson 924100b5e01SRichard Henderson for (i = 0; i < ARRAY_SIZE(all_helpers); ++i) { 92584fd9dd3SRichard Henderson g_hash_table_insert(helper_table, (gpointer)all_helpers[i].func, 92672866e82SRichard Henderson (gpointer)&all_helpers[i]); 927100b5e01SRichard Henderson } 9285cd8f621SRichard Henderson 929c896fe29Sbellard tcg_target_init(s); 930f69d277eSRichard Henderson process_op_defs(s); 93191478cefSRichard Henderson 93291478cefSRichard Henderson /* Reverse the order of the saved registers, assuming they're all at 93391478cefSRichard Henderson the start of tcg_target_reg_alloc_order. */ 93491478cefSRichard Henderson for (n = 0; n < ARRAY_SIZE(tcg_target_reg_alloc_order); ++n) { 93591478cefSRichard Henderson int r = tcg_target_reg_alloc_order[n]; 93691478cefSRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, r)) { 93791478cefSRichard Henderson break; 93891478cefSRichard Henderson } 93991478cefSRichard Henderson } 94091478cefSRichard Henderson for (i = 0; i < n; ++i) { 94191478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[n - 1 - i]; 94291478cefSRichard Henderson } 94391478cefSRichard Henderson for (; i < ARRAY_SIZE(tcg_target_reg_alloc_order); ++i) { 94491478cefSRichard Henderson indirect_reg_alloc_order[i] = tcg_target_reg_alloc_order[i]; 94591478cefSRichard Henderson } 946b1311c4aSEmilio G. Cota 947b1311c4aSEmilio G. Cota tcg_ctx = s; 9483468b59eSEmilio G. Cota /* 9493468b59eSEmilio G. Cota * In user-mode we simply share the init context among threads, since we 9503468b59eSEmilio G. Cota * use a single region. See the documentation tcg_region_init() for the 9513468b59eSEmilio G. Cota * reasoning behind this. 9523468b59eSEmilio G. Cota * In softmmu we will have at most max_cpus TCG threads. 9533468b59eSEmilio G. Cota */ 9543468b59eSEmilio G. Cota #ifdef CONFIG_USER_ONLY 955df2cce29SEmilio G. Cota tcg_ctxs = &tcg_ctx; 956df2cce29SEmilio G. 
Cota n_tcg_ctxs = 1; 9573468b59eSEmilio G. Cota #else 9583468b59eSEmilio G. Cota tcg_ctxs = g_new(TCGContext *, max_cpus); 9593468b59eSEmilio G. Cota #endif 9601c2adb95SRichard Henderson 9611c2adb95SRichard Henderson tcg_debug_assert(!tcg_regset_test_reg(s->reserved_regs, TCG_AREG0)); 9621c2adb95SRichard Henderson ts = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, TCG_AREG0, "env"); 9631c2adb95SRichard Henderson cpu_env = temp_tcgv_ptr(ts); 9649002ec79SRichard Henderson } 965b03cce8eSbellard 9666e3b2bfdSEmilio G. Cota /* 9676e3b2bfdSEmilio G. Cota * Allocate TBs right before their corresponding translated code, making 9686e3b2bfdSEmilio G. Cota * sure that TBs and code are on different cache lines. 9696e3b2bfdSEmilio G. Cota */ 9706e3b2bfdSEmilio G. Cota TranslationBlock *tcg_tb_alloc(TCGContext *s) 9716e3b2bfdSEmilio G. Cota { 9726e3b2bfdSEmilio G. Cota uintptr_t align = qemu_icache_linesize; 9736e3b2bfdSEmilio G. Cota TranslationBlock *tb; 9746e3b2bfdSEmilio G. Cota void *next; 9756e3b2bfdSEmilio G. Cota 976e8feb96fSEmilio G. Cota retry: 9776e3b2bfdSEmilio G. Cota tb = (void *)ROUND_UP((uintptr_t)s->code_gen_ptr, align); 9786e3b2bfdSEmilio G. Cota next = (void *)ROUND_UP((uintptr_t)(tb + 1), align); 9796e3b2bfdSEmilio G. Cota 9806e3b2bfdSEmilio G. Cota if (unlikely(next > s->code_gen_highwater)) { 981e8feb96fSEmilio G. Cota if (tcg_region_alloc(s)) { 9826e3b2bfdSEmilio G. Cota return NULL; 9836e3b2bfdSEmilio G. Cota } 984e8feb96fSEmilio G. Cota goto retry; 985e8feb96fSEmilio G. Cota } 986e8feb96fSEmilio G. Cota atomic_set(&s->code_gen_ptr, next); 98757a26946SRichard Henderson s->data_gen_ptr = NULL; 9886e3b2bfdSEmilio G. Cota return tb; 9896e3b2bfdSEmilio G. Cota } 9906e3b2bfdSEmilio G. 
Cota 9919002ec79SRichard Henderson void tcg_prologue_init(TCGContext *s) 9929002ec79SRichard Henderson { 9938163b749SRichard Henderson size_t prologue_size, total_size; 9948163b749SRichard Henderson void *buf0, *buf1; 9958163b749SRichard Henderson 9968163b749SRichard Henderson /* Put the prologue at the beginning of code_gen_buffer. */ 9978163b749SRichard Henderson buf0 = s->code_gen_buffer; 9985b38ee31SRichard Henderson total_size = s->code_gen_buffer_size; 9998163b749SRichard Henderson s->code_ptr = buf0; 10008163b749SRichard Henderson s->code_buf = buf0; 10015b38ee31SRichard Henderson s->data_gen_ptr = NULL; 10028163b749SRichard Henderson s->code_gen_prologue = buf0; 10038163b749SRichard Henderson 10045b38ee31SRichard Henderson /* Compute a high-water mark, at which we voluntarily flush the buffer 10055b38ee31SRichard Henderson and start over. The size here is arbitrary, significantly larger 10065b38ee31SRichard Henderson than we expect the code generation for any one opcode to require. */ 10075b38ee31SRichard Henderson s->code_gen_highwater = s->code_gen_buffer + (total_size - TCG_HIGHWATER); 10085b38ee31SRichard Henderson 10095b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 10105b38ee31SRichard Henderson s->pool_labels = NULL; 10115b38ee31SRichard Henderson #endif 10125b38ee31SRichard Henderson 10138163b749SRichard Henderson /* Generate the prologue. */ 1014b03cce8eSbellard tcg_target_qemu_prologue(s); 10155b38ee31SRichard Henderson 10165b38ee31SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 10175b38ee31SRichard Henderson /* Allow the prologue to put e.g. guest_base into a pool entry. 
*/ 10185b38ee31SRichard Henderson { 10195b38ee31SRichard Henderson bool ok = tcg_out_pool_finalize(s); 10205b38ee31SRichard Henderson tcg_debug_assert(ok); 10215b38ee31SRichard Henderson } 10225b38ee31SRichard Henderson #endif 10235b38ee31SRichard Henderson 10248163b749SRichard Henderson buf1 = s->code_ptr; 10258163b749SRichard Henderson flush_icache_range((uintptr_t)buf0, (uintptr_t)buf1); 10268163b749SRichard Henderson 10278163b749SRichard Henderson /* Deduct the prologue from the buffer. */ 10288163b749SRichard Henderson prologue_size = tcg_current_code_size(s); 10298163b749SRichard Henderson s->code_gen_ptr = buf1; 10308163b749SRichard Henderson s->code_gen_buffer = buf1; 10318163b749SRichard Henderson s->code_buf = buf1; 10325b38ee31SRichard Henderson total_size -= prologue_size; 10338163b749SRichard Henderson s->code_gen_buffer_size = total_size; 10348163b749SRichard Henderson 10358163b749SRichard Henderson tcg_register_jit(s->code_gen_buffer, total_size); 1036d6b64b2bSRichard Henderson 1037d6b64b2bSRichard Henderson #ifdef DEBUG_DISAS 1038d6b64b2bSRichard Henderson if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM)) { 10391ee73216SRichard Henderson qemu_log_lock(); 10408163b749SRichard Henderson qemu_log("PROLOGUE: [size=%zu]\n", prologue_size); 10415b38ee31SRichard Henderson if (s->data_gen_ptr) { 10425b38ee31SRichard Henderson size_t code_size = s->data_gen_ptr - buf0; 10435b38ee31SRichard Henderson size_t data_size = prologue_size - code_size; 10445b38ee31SRichard Henderson size_t i; 10455b38ee31SRichard Henderson 10465b38ee31SRichard Henderson log_disas(buf0, code_size); 10475b38ee31SRichard Henderson 10485b38ee31SRichard Henderson for (i = 0; i < data_size; i += sizeof(tcg_target_ulong)) { 10495b38ee31SRichard Henderson if (sizeof(tcg_target_ulong) == 8) { 10505b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .quad 0x%016" PRIx64 "\n", 10515b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 10525b38ee31SRichard Henderson *(uint64_t 
*)(s->data_gen_ptr + i)); 10535b38ee31SRichard Henderson } else { 10545b38ee31SRichard Henderson qemu_log("0x%08" PRIxPTR ": .long 0x%08x\n", 10555b38ee31SRichard Henderson (uintptr_t)s->data_gen_ptr + i, 10565b38ee31SRichard Henderson *(uint32_t *)(s->data_gen_ptr + i)); 10575b38ee31SRichard Henderson } 10585b38ee31SRichard Henderson } 10595b38ee31SRichard Henderson } else { 10608163b749SRichard Henderson log_disas(buf0, prologue_size); 10615b38ee31SRichard Henderson } 1062d6b64b2bSRichard Henderson qemu_log("\n"); 1063d6b64b2bSRichard Henderson qemu_log_flush(); 10641ee73216SRichard Henderson qemu_log_unlock(); 1065d6b64b2bSRichard Henderson } 1066d6b64b2bSRichard Henderson #endif 1067cedbcb01SEmilio G. Cota 1068cedbcb01SEmilio G. Cota /* Assert that goto_ptr is implemented completely. */ 1069cedbcb01SEmilio G. Cota if (TCG_TARGET_HAS_goto_ptr) { 1070cedbcb01SEmilio G. Cota tcg_debug_assert(s->code_gen_epilogue != NULL); 1071cedbcb01SEmilio G. Cota } 1072c896fe29Sbellard } 1073c896fe29Sbellard 1074c896fe29Sbellard void tcg_func_start(TCGContext *s) 1075c896fe29Sbellard { 1076c896fe29Sbellard tcg_pool_reset(s); 1077c896fe29Sbellard s->nb_temps = s->nb_globals; 10780ec9eabcSRichard Henderson 10790ec9eabcSRichard Henderson /* No temps have been previously allocated for size or locality. 
*/ 10800ec9eabcSRichard Henderson memset(s->free_temps, 0, sizeof(s->free_temps)); 10810ec9eabcSRichard Henderson 1082abebf925SRichard Henderson s->nb_ops = 0; 1083c896fe29Sbellard s->nb_labels = 0; 1084c896fe29Sbellard s->current_frame_offset = s->frame_start; 1085c896fe29Sbellard 10860a209d4bSRichard Henderson #ifdef CONFIG_DEBUG_TCG 10870a209d4bSRichard Henderson s->goto_tb_issue_mask = 0; 10880a209d4bSRichard Henderson #endif 10890a209d4bSRichard Henderson 109015fa08f8SRichard Henderson QTAILQ_INIT(&s->ops); 109115fa08f8SRichard Henderson QTAILQ_INIT(&s->free_ops); 1092c896fe29Sbellard } 1093c896fe29Sbellard 10947ca4b752SRichard Henderson static inline TCGTemp *tcg_temp_alloc(TCGContext *s) 10957ca4b752SRichard Henderson { 10967ca4b752SRichard Henderson int n = s->nb_temps++; 10977ca4b752SRichard Henderson tcg_debug_assert(n < TCG_MAX_TEMPS); 10987ca4b752SRichard Henderson return memset(&s->temps[n], 0, sizeof(TCGTemp)); 10997ca4b752SRichard Henderson } 11007ca4b752SRichard Henderson 11017ca4b752SRichard Henderson static inline TCGTemp *tcg_global_alloc(TCGContext *s) 11027ca4b752SRichard Henderson { 1103fa477d25SRichard Henderson TCGTemp *ts; 1104fa477d25SRichard Henderson 11057ca4b752SRichard Henderson tcg_debug_assert(s->nb_globals == s->nb_temps); 11067ca4b752SRichard Henderson s->nb_globals++; 1107fa477d25SRichard Henderson ts = tcg_temp_alloc(s); 1108fa477d25SRichard Henderson ts->temp_global = 1; 1109fa477d25SRichard Henderson 1110fa477d25SRichard Henderson return ts; 1111c896fe29Sbellard } 1112c896fe29Sbellard 1113085272b3SRichard Henderson static TCGTemp *tcg_global_reg_new_internal(TCGContext *s, TCGType type, 1114b6638662SRichard Henderson TCGReg reg, const char *name) 1115c896fe29Sbellard { 1116c896fe29Sbellard TCGTemp *ts; 1117c896fe29Sbellard 1118b3a62939SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type != TCG_TYPE_I32) { 1119c896fe29Sbellard tcg_abort(); 1120b3a62939SRichard Henderson } 11217ca4b752SRichard Henderson 11227ca4b752SRichard 
Henderson ts = tcg_global_alloc(s); 1123c896fe29Sbellard ts->base_type = type; 1124c896fe29Sbellard ts->type = type; 1125c896fe29Sbellard ts->fixed_reg = 1; 1126c896fe29Sbellard ts->reg = reg; 1127c896fe29Sbellard ts->name = name; 1128c896fe29Sbellard tcg_regset_set_reg(s->reserved_regs, reg); 11297ca4b752SRichard Henderson 1130085272b3SRichard Henderson return ts; 1131a7812ae4Spbrook } 1132a7812ae4Spbrook 1133b6638662SRichard Henderson void tcg_set_frame(TCGContext *s, TCGReg reg, intptr_t start, intptr_t size) 1134a7812ae4Spbrook { 1135b3a62939SRichard Henderson s->frame_start = start; 1136b3a62939SRichard Henderson s->frame_end = start + size; 1137085272b3SRichard Henderson s->frame_temp 1138085272b3SRichard Henderson = tcg_global_reg_new_internal(s, TCG_TYPE_PTR, reg, "_frame"); 1139b3a62939SRichard Henderson } 1140a7812ae4Spbrook 1141085272b3SRichard Henderson TCGTemp *tcg_global_mem_new_internal(TCGType type, TCGv_ptr base, 1142e1ccc054SRichard Henderson intptr_t offset, const char *name) 1143c896fe29Sbellard { 1144b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 1145dc41aa7dSRichard Henderson TCGTemp *base_ts = tcgv_ptr_temp(base); 11467ca4b752SRichard Henderson TCGTemp *ts = tcg_global_alloc(s); 1147b3915dbbSRichard Henderson int indirect_reg = 0, bigendian = 0; 11487ca4b752SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 11497ca4b752SRichard Henderson bigendian = 1; 11507ca4b752SRichard Henderson #endif 1151c896fe29Sbellard 1152b3915dbbSRichard Henderson if (!base_ts->fixed_reg) { 11535a18407fSRichard Henderson /* We do not support double-indirect registers. */ 11545a18407fSRichard Henderson tcg_debug_assert(!base_ts->indirect_reg); 1155b3915dbbSRichard Henderson base_ts->indirect_base = 1; 11565a18407fSRichard Henderson s->nb_indirects += (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64 11575a18407fSRichard Henderson ? 
2 : 1); 11585a18407fSRichard Henderson indirect_reg = 1; 1159b3915dbbSRichard Henderson } 1160b3915dbbSRichard Henderson 11617ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 11627ca4b752SRichard Henderson TCGTemp *ts2 = tcg_global_alloc(s); 1163c896fe29Sbellard char buf[64]; 11647ca4b752SRichard Henderson 11657ca4b752SRichard Henderson ts->base_type = TCG_TYPE_I64; 1166c896fe29Sbellard ts->type = TCG_TYPE_I32; 1167b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 1168c896fe29Sbellard ts->mem_allocated = 1; 1169b3a62939SRichard Henderson ts->mem_base = base_ts; 11707ca4b752SRichard Henderson ts->mem_offset = offset + bigendian * 4; 1171c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 1172c896fe29Sbellard pstrcat(buf, sizeof(buf), "_0"); 1173c896fe29Sbellard ts->name = strdup(buf); 1174c896fe29Sbellard 11757ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 11767ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 11777ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 1178b3915dbbSRichard Henderson ts2->indirect_reg = indirect_reg; 11797ca4b752SRichard Henderson ts2->mem_allocated = 1; 11807ca4b752SRichard Henderson ts2->mem_base = base_ts; 11817ca4b752SRichard Henderson ts2->mem_offset = offset + (1 - bigendian) * 4; 1182c896fe29Sbellard pstrcpy(buf, sizeof(buf), name); 1183c896fe29Sbellard pstrcat(buf, sizeof(buf), "_1"); 1184120c1084SRichard Henderson ts2->name = strdup(buf); 11857ca4b752SRichard Henderson } else { 1186c896fe29Sbellard ts->base_type = type; 1187c896fe29Sbellard ts->type = type; 1188b3915dbbSRichard Henderson ts->indirect_reg = indirect_reg; 1189c896fe29Sbellard ts->mem_allocated = 1; 1190b3a62939SRichard Henderson ts->mem_base = base_ts; 1191c896fe29Sbellard ts->mem_offset = offset; 1192c896fe29Sbellard ts->name = name; 1193c896fe29Sbellard } 1194085272b3SRichard Henderson return ts; 1195c896fe29Sbellard } 1196c896fe29Sbellard 11975bfa8034SRichard Henderson TCGTemp 
*tcg_temp_new_internal(TCGType type, bool temp_local) 1198c896fe29Sbellard { 1199b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 1200c896fe29Sbellard TCGTemp *ts; 1201641d5fbeSbellard int idx, k; 1202c896fe29Sbellard 12030ec9eabcSRichard Henderson k = type + (temp_local ? TCG_TYPE_COUNT : 0); 12040ec9eabcSRichard Henderson idx = find_first_bit(s->free_temps[k].l, TCG_MAX_TEMPS); 12050ec9eabcSRichard Henderson if (idx < TCG_MAX_TEMPS) { 12060ec9eabcSRichard Henderson /* There is already an available temp with the right type. */ 12070ec9eabcSRichard Henderson clear_bit(idx, s->free_temps[k].l); 12080ec9eabcSRichard Henderson 1209e8996ee0Sbellard ts = &s->temps[idx]; 1210e8996ee0Sbellard ts->temp_allocated = 1; 12117ca4b752SRichard Henderson tcg_debug_assert(ts->base_type == type); 12127ca4b752SRichard Henderson tcg_debug_assert(ts->temp_local == temp_local); 1213e8996ee0Sbellard } else { 12147ca4b752SRichard Henderson ts = tcg_temp_alloc(s); 12157ca4b752SRichard Henderson if (TCG_TARGET_REG_BITS == 32 && type == TCG_TYPE_I64) { 12167ca4b752SRichard Henderson TCGTemp *ts2 = tcg_temp_alloc(s); 12177ca4b752SRichard Henderson 1218c896fe29Sbellard ts->base_type = type; 1219c896fe29Sbellard ts->type = TCG_TYPE_I32; 1220e8996ee0Sbellard ts->temp_allocated = 1; 1221641d5fbeSbellard ts->temp_local = temp_local; 12227ca4b752SRichard Henderson 12237ca4b752SRichard Henderson tcg_debug_assert(ts2 == ts + 1); 12247ca4b752SRichard Henderson ts2->base_type = TCG_TYPE_I64; 12257ca4b752SRichard Henderson ts2->type = TCG_TYPE_I32; 12267ca4b752SRichard Henderson ts2->temp_allocated = 1; 12277ca4b752SRichard Henderson ts2->temp_local = temp_local; 12287ca4b752SRichard Henderson } else { 1229c896fe29Sbellard ts->base_type = type; 1230c896fe29Sbellard ts->type = type; 1231e8996ee0Sbellard ts->temp_allocated = 1; 1232641d5fbeSbellard ts->temp_local = temp_local; 1233c896fe29Sbellard } 1234e8996ee0Sbellard } 123527bfd83cSPeter Maydell 123627bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 
123727bfd83cSPeter Maydell s->temps_in_use++; 123827bfd83cSPeter Maydell #endif 1239085272b3SRichard Henderson return ts; 1240c896fe29Sbellard } 1241c896fe29Sbellard 1242d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec(TCGType type) 1243d2fd745fSRichard Henderson { 1244d2fd745fSRichard Henderson TCGTemp *t; 1245d2fd745fSRichard Henderson 1246d2fd745fSRichard Henderson #ifdef CONFIG_DEBUG_TCG 1247d2fd745fSRichard Henderson switch (type) { 1248d2fd745fSRichard Henderson case TCG_TYPE_V64: 1249d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v64); 1250d2fd745fSRichard Henderson break; 1251d2fd745fSRichard Henderson case TCG_TYPE_V128: 1252d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v128); 1253d2fd745fSRichard Henderson break; 1254d2fd745fSRichard Henderson case TCG_TYPE_V256: 1255d2fd745fSRichard Henderson assert(TCG_TARGET_HAS_v256); 1256d2fd745fSRichard Henderson break; 1257d2fd745fSRichard Henderson default: 1258d2fd745fSRichard Henderson g_assert_not_reached(); 1259d2fd745fSRichard Henderson } 1260d2fd745fSRichard Henderson #endif 1261d2fd745fSRichard Henderson 1262d2fd745fSRichard Henderson t = tcg_temp_new_internal(type, 0); 1263d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1264d2fd745fSRichard Henderson } 1265d2fd745fSRichard Henderson 1266d2fd745fSRichard Henderson /* Create a new temp of the same type as an existing temp. */ 1267d2fd745fSRichard Henderson TCGv_vec tcg_temp_new_vec_matching(TCGv_vec match) 1268d2fd745fSRichard Henderson { 1269d2fd745fSRichard Henderson TCGTemp *t = tcgv_vec_temp(match); 1270d2fd745fSRichard Henderson 1271d2fd745fSRichard Henderson tcg_debug_assert(t->temp_allocated != 0); 1272d2fd745fSRichard Henderson 1273d2fd745fSRichard Henderson t = tcg_temp_new_internal(t->base_type, 0); 1274d2fd745fSRichard Henderson return temp_tcgv_vec(t); 1275d2fd745fSRichard Henderson } 1276d2fd745fSRichard Henderson 12775bfa8034SRichard Henderson void tcg_temp_free_internal(TCGTemp *ts) 1278c896fe29Sbellard { 1279b1311c4aSEmilio G. 
Cota TCGContext *s = tcg_ctx; 1280085272b3SRichard Henderson int k, idx; 1281c896fe29Sbellard 128227bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 128327bfd83cSPeter Maydell s->temps_in_use--; 128427bfd83cSPeter Maydell if (s->temps_in_use < 0) { 128527bfd83cSPeter Maydell fprintf(stderr, "More temporaries freed than allocated!\n"); 128627bfd83cSPeter Maydell } 128727bfd83cSPeter Maydell #endif 128827bfd83cSPeter Maydell 1289085272b3SRichard Henderson tcg_debug_assert(ts->temp_global == 0); 1290eabb7b91SAurelien Jarno tcg_debug_assert(ts->temp_allocated != 0); 1291e8996ee0Sbellard ts->temp_allocated = 0; 12920ec9eabcSRichard Henderson 1293085272b3SRichard Henderson idx = temp_idx(ts); 129418d13fa2SAlexander Graf k = ts->base_type + (ts->temp_local ? TCG_TYPE_COUNT : 0); 12950ec9eabcSRichard Henderson set_bit(idx, s->free_temps[k].l); 1296e8996ee0Sbellard } 1297e8996ee0Sbellard 1298a7812ae4Spbrook TCGv_i32 tcg_const_i32(int32_t val) 1299a7812ae4Spbrook { 1300a7812ae4Spbrook TCGv_i32 t0; 1301a7812ae4Spbrook t0 = tcg_temp_new_i32(); 1302e8996ee0Sbellard tcg_gen_movi_i32(t0, val); 1303e8996ee0Sbellard return t0; 1304c896fe29Sbellard } 1305c896fe29Sbellard 1306a7812ae4Spbrook TCGv_i64 tcg_const_i64(int64_t val) 1307c896fe29Sbellard { 1308a7812ae4Spbrook TCGv_i64 t0; 1309a7812ae4Spbrook t0 = tcg_temp_new_i64(); 1310e8996ee0Sbellard tcg_gen_movi_i64(t0, val); 1311e8996ee0Sbellard return t0; 1312c896fe29Sbellard } 1313c896fe29Sbellard 1314a7812ae4Spbrook TCGv_i32 tcg_const_local_i32(int32_t val) 1315bdffd4a9Saurel32 { 1316a7812ae4Spbrook TCGv_i32 t0; 1317a7812ae4Spbrook t0 = tcg_temp_local_new_i32(); 1318bdffd4a9Saurel32 tcg_gen_movi_i32(t0, val); 1319bdffd4a9Saurel32 return t0; 1320bdffd4a9Saurel32 } 1321bdffd4a9Saurel32 1322a7812ae4Spbrook TCGv_i64 tcg_const_local_i64(int64_t val) 1323bdffd4a9Saurel32 { 1324a7812ae4Spbrook TCGv_i64 t0; 1325a7812ae4Spbrook t0 = tcg_temp_local_new_i64(); 1326bdffd4a9Saurel32 tcg_gen_movi_i64(t0, val); 1327bdffd4a9Saurel32 return t0; 
1328bdffd4a9Saurel32 } 1329bdffd4a9Saurel32 133027bfd83cSPeter Maydell #if defined(CONFIG_DEBUG_TCG) 133127bfd83cSPeter Maydell void tcg_clear_temp_count(void) 133227bfd83cSPeter Maydell { 1333b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 133427bfd83cSPeter Maydell s->temps_in_use = 0; 133527bfd83cSPeter Maydell } 133627bfd83cSPeter Maydell 133727bfd83cSPeter Maydell int tcg_check_temp_count(void) 133827bfd83cSPeter Maydell { 1339b1311c4aSEmilio G. Cota TCGContext *s = tcg_ctx; 134027bfd83cSPeter Maydell if (s->temps_in_use) { 134127bfd83cSPeter Maydell /* Clear the count so that we don't give another 134227bfd83cSPeter Maydell * warning immediately next time around. 134327bfd83cSPeter Maydell */ 134427bfd83cSPeter Maydell s->temps_in_use = 0; 134527bfd83cSPeter Maydell return 1; 134627bfd83cSPeter Maydell } 134727bfd83cSPeter Maydell return 0; 134827bfd83cSPeter Maydell } 134927bfd83cSPeter Maydell #endif 135027bfd83cSPeter Maydell 1351be0f34b5SRichard Henderson /* Return true if OP may appear in the opcode stream. 1352be0f34b5SRichard Henderson Test the runtime variable that controls each opcode. 
*/ 1353be0f34b5SRichard Henderson bool tcg_op_supported(TCGOpcode op) 1354be0f34b5SRichard Henderson { 1355d2fd745fSRichard Henderson const bool have_vec 1356d2fd745fSRichard Henderson = TCG_TARGET_HAS_v64 | TCG_TARGET_HAS_v128 | TCG_TARGET_HAS_v256; 1357d2fd745fSRichard Henderson 1358be0f34b5SRichard Henderson switch (op) { 1359be0f34b5SRichard Henderson case INDEX_op_discard: 1360be0f34b5SRichard Henderson case INDEX_op_set_label: 1361be0f34b5SRichard Henderson case INDEX_op_call: 1362be0f34b5SRichard Henderson case INDEX_op_br: 1363be0f34b5SRichard Henderson case INDEX_op_mb: 1364be0f34b5SRichard Henderson case INDEX_op_insn_start: 1365be0f34b5SRichard Henderson case INDEX_op_exit_tb: 1366be0f34b5SRichard Henderson case INDEX_op_goto_tb: 1367be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i32: 1368be0f34b5SRichard Henderson case INDEX_op_qemu_st_i32: 1369be0f34b5SRichard Henderson case INDEX_op_qemu_ld_i64: 1370be0f34b5SRichard Henderson case INDEX_op_qemu_st_i64: 1371be0f34b5SRichard Henderson return true; 1372be0f34b5SRichard Henderson 1373be0f34b5SRichard Henderson case INDEX_op_goto_ptr: 1374be0f34b5SRichard Henderson return TCG_TARGET_HAS_goto_ptr; 1375be0f34b5SRichard Henderson 1376be0f34b5SRichard Henderson case INDEX_op_mov_i32: 1377be0f34b5SRichard Henderson case INDEX_op_movi_i32: 1378be0f34b5SRichard Henderson case INDEX_op_setcond_i32: 1379be0f34b5SRichard Henderson case INDEX_op_brcond_i32: 1380be0f34b5SRichard Henderson case INDEX_op_ld8u_i32: 1381be0f34b5SRichard Henderson case INDEX_op_ld8s_i32: 1382be0f34b5SRichard Henderson case INDEX_op_ld16u_i32: 1383be0f34b5SRichard Henderson case INDEX_op_ld16s_i32: 1384be0f34b5SRichard Henderson case INDEX_op_ld_i32: 1385be0f34b5SRichard Henderson case INDEX_op_st8_i32: 1386be0f34b5SRichard Henderson case INDEX_op_st16_i32: 1387be0f34b5SRichard Henderson case INDEX_op_st_i32: 1388be0f34b5SRichard Henderson case INDEX_op_add_i32: 1389be0f34b5SRichard Henderson case INDEX_op_sub_i32: 1390be0f34b5SRichard 
Henderson case INDEX_op_mul_i32: 1391be0f34b5SRichard Henderson case INDEX_op_and_i32: 1392be0f34b5SRichard Henderson case INDEX_op_or_i32: 1393be0f34b5SRichard Henderson case INDEX_op_xor_i32: 1394be0f34b5SRichard Henderson case INDEX_op_shl_i32: 1395be0f34b5SRichard Henderson case INDEX_op_shr_i32: 1396be0f34b5SRichard Henderson case INDEX_op_sar_i32: 1397be0f34b5SRichard Henderson return true; 1398be0f34b5SRichard Henderson 1399be0f34b5SRichard Henderson case INDEX_op_movcond_i32: 1400be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i32; 1401be0f34b5SRichard Henderson case INDEX_op_div_i32: 1402be0f34b5SRichard Henderson case INDEX_op_divu_i32: 1403be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i32; 1404be0f34b5SRichard Henderson case INDEX_op_rem_i32: 1405be0f34b5SRichard Henderson case INDEX_op_remu_i32: 1406be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i32; 1407be0f34b5SRichard Henderson case INDEX_op_div2_i32: 1408be0f34b5SRichard Henderson case INDEX_op_divu2_i32: 1409be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i32; 1410be0f34b5SRichard Henderson case INDEX_op_rotl_i32: 1411be0f34b5SRichard Henderson case INDEX_op_rotr_i32: 1412be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i32; 1413be0f34b5SRichard Henderson case INDEX_op_deposit_i32: 1414be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i32; 1415be0f34b5SRichard Henderson case INDEX_op_extract_i32: 1416be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i32; 1417be0f34b5SRichard Henderson case INDEX_op_sextract_i32: 1418be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i32; 1419be0f34b5SRichard Henderson case INDEX_op_add2_i32: 1420be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i32; 1421be0f34b5SRichard Henderson case INDEX_op_sub2_i32: 1422be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i32; 1423be0f34b5SRichard Henderson case INDEX_op_mulu2_i32: 1424be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i32; 1425be0f34b5SRichard 
Henderson case INDEX_op_muls2_i32: 1426be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i32; 1427be0f34b5SRichard Henderson case INDEX_op_muluh_i32: 1428be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i32; 1429be0f34b5SRichard Henderson case INDEX_op_mulsh_i32: 1430be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i32; 1431be0f34b5SRichard Henderson case INDEX_op_ext8s_i32: 1432be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i32; 1433be0f34b5SRichard Henderson case INDEX_op_ext16s_i32: 1434be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i32; 1435be0f34b5SRichard Henderson case INDEX_op_ext8u_i32: 1436be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i32; 1437be0f34b5SRichard Henderson case INDEX_op_ext16u_i32: 1438be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i32; 1439be0f34b5SRichard Henderson case INDEX_op_bswap16_i32: 1440be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i32; 1441be0f34b5SRichard Henderson case INDEX_op_bswap32_i32: 1442be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i32; 1443be0f34b5SRichard Henderson case INDEX_op_not_i32: 1444be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i32; 1445be0f34b5SRichard Henderson case INDEX_op_neg_i32: 1446be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i32; 1447be0f34b5SRichard Henderson case INDEX_op_andc_i32: 1448be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i32; 1449be0f34b5SRichard Henderson case INDEX_op_orc_i32: 1450be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i32; 1451be0f34b5SRichard Henderson case INDEX_op_eqv_i32: 1452be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i32; 1453be0f34b5SRichard Henderson case INDEX_op_nand_i32: 1454be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i32; 1455be0f34b5SRichard Henderson case INDEX_op_nor_i32: 1456be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i32; 1457be0f34b5SRichard Henderson case INDEX_op_clz_i32: 1458be0f34b5SRichard Henderson return 
TCG_TARGET_HAS_clz_i32; 1459be0f34b5SRichard Henderson case INDEX_op_ctz_i32: 1460be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i32; 1461be0f34b5SRichard Henderson case INDEX_op_ctpop_i32: 1462be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i32; 1463be0f34b5SRichard Henderson 1464be0f34b5SRichard Henderson case INDEX_op_brcond2_i32: 1465be0f34b5SRichard Henderson case INDEX_op_setcond2_i32: 1466be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 32; 1467be0f34b5SRichard Henderson 1468be0f34b5SRichard Henderson case INDEX_op_mov_i64: 1469be0f34b5SRichard Henderson case INDEX_op_movi_i64: 1470be0f34b5SRichard Henderson case INDEX_op_setcond_i64: 1471be0f34b5SRichard Henderson case INDEX_op_brcond_i64: 1472be0f34b5SRichard Henderson case INDEX_op_ld8u_i64: 1473be0f34b5SRichard Henderson case INDEX_op_ld8s_i64: 1474be0f34b5SRichard Henderson case INDEX_op_ld16u_i64: 1475be0f34b5SRichard Henderson case INDEX_op_ld16s_i64: 1476be0f34b5SRichard Henderson case INDEX_op_ld32u_i64: 1477be0f34b5SRichard Henderson case INDEX_op_ld32s_i64: 1478be0f34b5SRichard Henderson case INDEX_op_ld_i64: 1479be0f34b5SRichard Henderson case INDEX_op_st8_i64: 1480be0f34b5SRichard Henderson case INDEX_op_st16_i64: 1481be0f34b5SRichard Henderson case INDEX_op_st32_i64: 1482be0f34b5SRichard Henderson case INDEX_op_st_i64: 1483be0f34b5SRichard Henderson case INDEX_op_add_i64: 1484be0f34b5SRichard Henderson case INDEX_op_sub_i64: 1485be0f34b5SRichard Henderson case INDEX_op_mul_i64: 1486be0f34b5SRichard Henderson case INDEX_op_and_i64: 1487be0f34b5SRichard Henderson case INDEX_op_or_i64: 1488be0f34b5SRichard Henderson case INDEX_op_xor_i64: 1489be0f34b5SRichard Henderson case INDEX_op_shl_i64: 1490be0f34b5SRichard Henderson case INDEX_op_shr_i64: 1491be0f34b5SRichard Henderson case INDEX_op_sar_i64: 1492be0f34b5SRichard Henderson case INDEX_op_ext_i32_i64: 1493be0f34b5SRichard Henderson case INDEX_op_extu_i32_i64: 1494be0f34b5SRichard Henderson return TCG_TARGET_REG_BITS == 64; 
1495be0f34b5SRichard Henderson 1496be0f34b5SRichard Henderson case INDEX_op_movcond_i64: 1497be0f34b5SRichard Henderson return TCG_TARGET_HAS_movcond_i64; 1498be0f34b5SRichard Henderson case INDEX_op_div_i64: 1499be0f34b5SRichard Henderson case INDEX_op_divu_i64: 1500be0f34b5SRichard Henderson return TCG_TARGET_HAS_div_i64; 1501be0f34b5SRichard Henderson case INDEX_op_rem_i64: 1502be0f34b5SRichard Henderson case INDEX_op_remu_i64: 1503be0f34b5SRichard Henderson return TCG_TARGET_HAS_rem_i64; 1504be0f34b5SRichard Henderson case INDEX_op_div2_i64: 1505be0f34b5SRichard Henderson case INDEX_op_divu2_i64: 1506be0f34b5SRichard Henderson return TCG_TARGET_HAS_div2_i64; 1507be0f34b5SRichard Henderson case INDEX_op_rotl_i64: 1508be0f34b5SRichard Henderson case INDEX_op_rotr_i64: 1509be0f34b5SRichard Henderson return TCG_TARGET_HAS_rot_i64; 1510be0f34b5SRichard Henderson case INDEX_op_deposit_i64: 1511be0f34b5SRichard Henderson return TCG_TARGET_HAS_deposit_i64; 1512be0f34b5SRichard Henderson case INDEX_op_extract_i64: 1513be0f34b5SRichard Henderson return TCG_TARGET_HAS_extract_i64; 1514be0f34b5SRichard Henderson case INDEX_op_sextract_i64: 1515be0f34b5SRichard Henderson return TCG_TARGET_HAS_sextract_i64; 1516be0f34b5SRichard Henderson case INDEX_op_extrl_i64_i32: 1517be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrl_i64_i32; 1518be0f34b5SRichard Henderson case INDEX_op_extrh_i64_i32: 1519be0f34b5SRichard Henderson return TCG_TARGET_HAS_extrh_i64_i32; 1520be0f34b5SRichard Henderson case INDEX_op_ext8s_i64: 1521be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8s_i64; 1522be0f34b5SRichard Henderson case INDEX_op_ext16s_i64: 1523be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16s_i64; 1524be0f34b5SRichard Henderson case INDEX_op_ext32s_i64: 1525be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32s_i64; 1526be0f34b5SRichard Henderson case INDEX_op_ext8u_i64: 1527be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext8u_i64; 1528be0f34b5SRichard Henderson case 
INDEX_op_ext16u_i64: 1529be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext16u_i64; 1530be0f34b5SRichard Henderson case INDEX_op_ext32u_i64: 1531be0f34b5SRichard Henderson return TCG_TARGET_HAS_ext32u_i64; 1532be0f34b5SRichard Henderson case INDEX_op_bswap16_i64: 1533be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap16_i64; 1534be0f34b5SRichard Henderson case INDEX_op_bswap32_i64: 1535be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap32_i64; 1536be0f34b5SRichard Henderson case INDEX_op_bswap64_i64: 1537be0f34b5SRichard Henderson return TCG_TARGET_HAS_bswap64_i64; 1538be0f34b5SRichard Henderson case INDEX_op_not_i64: 1539be0f34b5SRichard Henderson return TCG_TARGET_HAS_not_i64; 1540be0f34b5SRichard Henderson case INDEX_op_neg_i64: 1541be0f34b5SRichard Henderson return TCG_TARGET_HAS_neg_i64; 1542be0f34b5SRichard Henderson case INDEX_op_andc_i64: 1543be0f34b5SRichard Henderson return TCG_TARGET_HAS_andc_i64; 1544be0f34b5SRichard Henderson case INDEX_op_orc_i64: 1545be0f34b5SRichard Henderson return TCG_TARGET_HAS_orc_i64; 1546be0f34b5SRichard Henderson case INDEX_op_eqv_i64: 1547be0f34b5SRichard Henderson return TCG_TARGET_HAS_eqv_i64; 1548be0f34b5SRichard Henderson case INDEX_op_nand_i64: 1549be0f34b5SRichard Henderson return TCG_TARGET_HAS_nand_i64; 1550be0f34b5SRichard Henderson case INDEX_op_nor_i64: 1551be0f34b5SRichard Henderson return TCG_TARGET_HAS_nor_i64; 1552be0f34b5SRichard Henderson case INDEX_op_clz_i64: 1553be0f34b5SRichard Henderson return TCG_TARGET_HAS_clz_i64; 1554be0f34b5SRichard Henderson case INDEX_op_ctz_i64: 1555be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctz_i64; 1556be0f34b5SRichard Henderson case INDEX_op_ctpop_i64: 1557be0f34b5SRichard Henderson return TCG_TARGET_HAS_ctpop_i64; 1558be0f34b5SRichard Henderson case INDEX_op_add2_i64: 1559be0f34b5SRichard Henderson return TCG_TARGET_HAS_add2_i64; 1560be0f34b5SRichard Henderson case INDEX_op_sub2_i64: 1561be0f34b5SRichard Henderson return TCG_TARGET_HAS_sub2_i64; 
1562be0f34b5SRichard Henderson case INDEX_op_mulu2_i64: 1563be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulu2_i64; 1564be0f34b5SRichard Henderson case INDEX_op_muls2_i64: 1565be0f34b5SRichard Henderson return TCG_TARGET_HAS_muls2_i64; 1566be0f34b5SRichard Henderson case INDEX_op_muluh_i64: 1567be0f34b5SRichard Henderson return TCG_TARGET_HAS_muluh_i64; 1568be0f34b5SRichard Henderson case INDEX_op_mulsh_i64: 1569be0f34b5SRichard Henderson return TCG_TARGET_HAS_mulsh_i64; 1570be0f34b5SRichard Henderson 1571d2fd745fSRichard Henderson case INDEX_op_mov_vec: 1572d2fd745fSRichard Henderson case INDEX_op_dup_vec: 1573d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 1574d2fd745fSRichard Henderson case INDEX_op_ld_vec: 1575d2fd745fSRichard Henderson case INDEX_op_st_vec: 1576d2fd745fSRichard Henderson case INDEX_op_add_vec: 1577d2fd745fSRichard Henderson case INDEX_op_sub_vec: 1578d2fd745fSRichard Henderson case INDEX_op_and_vec: 1579d2fd745fSRichard Henderson case INDEX_op_or_vec: 1580d2fd745fSRichard Henderson case INDEX_op_xor_vec: 1581212be173SRichard Henderson case INDEX_op_cmp_vec: 1582d2fd745fSRichard Henderson return have_vec; 1583d2fd745fSRichard Henderson case INDEX_op_dup2_vec: 1584d2fd745fSRichard Henderson return have_vec && TCG_TARGET_REG_BITS == 32; 1585d2fd745fSRichard Henderson case INDEX_op_not_vec: 1586d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_not_vec; 1587d2fd745fSRichard Henderson case INDEX_op_neg_vec: 1588d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_neg_vec; 1589d2fd745fSRichard Henderson case INDEX_op_andc_vec: 1590d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_andc_vec; 1591d2fd745fSRichard Henderson case INDEX_op_orc_vec: 1592d2fd745fSRichard Henderson return have_vec && TCG_TARGET_HAS_orc_vec; 15933774030aSRichard Henderson case INDEX_op_mul_vec: 15943774030aSRichard Henderson return have_vec && TCG_TARGET_HAS_mul_vec; 1595d0ec9796SRichard Henderson case INDEX_op_shli_vec: 
1596d0ec9796SRichard Henderson case INDEX_op_shri_vec: 1597d0ec9796SRichard Henderson case INDEX_op_sari_vec: 1598d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shi_vec; 1599d0ec9796SRichard Henderson case INDEX_op_shls_vec: 1600d0ec9796SRichard Henderson case INDEX_op_shrs_vec: 1601d0ec9796SRichard Henderson case INDEX_op_sars_vec: 1602d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shs_vec; 1603d0ec9796SRichard Henderson case INDEX_op_shlv_vec: 1604d0ec9796SRichard Henderson case INDEX_op_shrv_vec: 1605d0ec9796SRichard Henderson case INDEX_op_sarv_vec: 1606d0ec9796SRichard Henderson return have_vec && TCG_TARGET_HAS_shv_vec; 1607d2fd745fSRichard Henderson 1608db432672SRichard Henderson default: 1609db432672SRichard Henderson tcg_debug_assert(op > INDEX_op_last_generic && op < NB_OPS); 1610db432672SRichard Henderson return true; 1611be0f34b5SRichard Henderson } 1612be0f34b5SRichard Henderson } 1613be0f34b5SRichard Henderson 161439cf05d3Sbellard /* Note: we convert the 64 bit args to 32 bit and do some alignment 161539cf05d3Sbellard and endian swap. Maybe it would be better to do the alignment 161639cf05d3Sbellard and endian swap in tcg_reg_alloc_call(). */ 1617ae8b75dcSRichard Henderson void tcg_gen_callN(void *func, TCGTemp *ret, int nargs, TCGTemp **args) 1618c896fe29Sbellard { 161975e8b9b7SRichard Henderson int i, real_args, nb_rets, pi; 1620bbb8a1b4SRichard Henderson unsigned sizemask, flags; 1621afb49896SRichard Henderson TCGHelperInfo *info; 162275e8b9b7SRichard Henderson TCGOp *op; 1623afb49896SRichard Henderson 1624619205fdSEmilio G. 
Cota info = g_hash_table_lookup(helper_table, (gpointer)func); 1625bbb8a1b4SRichard Henderson flags = info->flags; 1626bbb8a1b4SRichard Henderson sizemask = info->sizemask; 16272bece2c8SRichard Henderson 162834b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 162934b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 163034b1a49cSRichard Henderson /* We have 64-bit values in one register, but need to pass as two 163134b1a49cSRichard Henderson separate parameters. Split them. */ 163234b1a49cSRichard Henderson int orig_sizemask = sizemask; 163334b1a49cSRichard Henderson int orig_nargs = nargs; 163434b1a49cSRichard Henderson TCGv_i64 retl, reth; 1635ae8b75dcSRichard Henderson TCGTemp *split_args[MAX_OPC_PARAM]; 163634b1a49cSRichard Henderson 1637f764718dSRichard Henderson retl = NULL; 1638f764718dSRichard Henderson reth = NULL; 163934b1a49cSRichard Henderson if (sizemask != 0) { 164034b1a49cSRichard Henderson for (i = real_args = 0; i < nargs; ++i) { 164134b1a49cSRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 164234b1a49cSRichard Henderson if (is_64bit) { 1643085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 164434b1a49cSRichard Henderson TCGv_i32 h = tcg_temp_new_i32(); 164534b1a49cSRichard Henderson TCGv_i32 l = tcg_temp_new_i32(); 164634b1a49cSRichard Henderson tcg_gen_extr_i64_i32(l, h, orig); 1647ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(h); 1648ae8b75dcSRichard Henderson split_args[real_args++] = tcgv_i32_temp(l); 164934b1a49cSRichard Henderson } else { 165034b1a49cSRichard Henderson split_args[real_args++] = args[i]; 165134b1a49cSRichard Henderson } 165234b1a49cSRichard Henderson } 165334b1a49cSRichard Henderson nargs = real_args; 165434b1a49cSRichard Henderson args = split_args; 165534b1a49cSRichard Henderson sizemask = 0; 165634b1a49cSRichard Henderson } 165734b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 16582bece2c8SRichard 
Henderson for (i = 0; i < nargs; ++i) { 16592bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 16602bece2c8SRichard Henderson int is_signed = sizemask & (2 << (i+1)*2); 16612bece2c8SRichard Henderson if (!is_64bit) { 16622bece2c8SRichard Henderson TCGv_i64 temp = tcg_temp_new_i64(); 1663085272b3SRichard Henderson TCGv_i64 orig = temp_tcgv_i64(args[i]); 16642bece2c8SRichard Henderson if (is_signed) { 16652bece2c8SRichard Henderson tcg_gen_ext32s_i64(temp, orig); 16662bece2c8SRichard Henderson } else { 16672bece2c8SRichard Henderson tcg_gen_ext32u_i64(temp, orig); 16682bece2c8SRichard Henderson } 1669ae8b75dcSRichard Henderson args[i] = tcgv_i64_temp(temp); 16702bece2c8SRichard Henderson } 16712bece2c8SRichard Henderson } 16722bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 16732bece2c8SRichard Henderson 167415fa08f8SRichard Henderson op = tcg_emit_op(INDEX_op_call); 167575e8b9b7SRichard Henderson 167675e8b9b7SRichard Henderson pi = 0; 1677ae8b75dcSRichard Henderson if (ret != NULL) { 167834b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 167934b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 168034b1a49cSRichard Henderson if (orig_sizemask & 1) { 168134b1a49cSRichard Henderson /* The 32-bit ABI is going to return the 64-bit value in 168234b1a49cSRichard Henderson the %o0/%o1 register pair. Prepare for this by using 168334b1a49cSRichard Henderson two return temporaries, and reassemble below. 
*/ 168434b1a49cSRichard Henderson retl = tcg_temp_new_i64(); 168534b1a49cSRichard Henderson reth = tcg_temp_new_i64(); 1686ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(reth); 1687ae8b75dcSRichard Henderson op->args[pi++] = tcgv_i64_arg(retl); 168834b1a49cSRichard Henderson nb_rets = 2; 168934b1a49cSRichard Henderson } else { 1690ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 169134b1a49cSRichard Henderson nb_rets = 1; 169234b1a49cSRichard Henderson } 169334b1a49cSRichard Henderson #else 169434b1a49cSRichard Henderson if (TCG_TARGET_REG_BITS < 64 && (sizemask & 1)) { 169502eb19d0SRichard Henderson #ifdef HOST_WORDS_BIGENDIAN 1696ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1697ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1698a7812ae4Spbrook #else 1699ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1700ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret + 1); 1701a7812ae4Spbrook #endif 1702a7812ae4Spbrook nb_rets = 2; 170334b1a49cSRichard Henderson } else { 1704ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(ret); 1705a7812ae4Spbrook nb_rets = 1; 1706a7812ae4Spbrook } 170734b1a49cSRichard Henderson #endif 1708a7812ae4Spbrook } else { 1709a7812ae4Spbrook nb_rets = 0; 1710a7812ae4Spbrook } 1711cd9090aaSRichard Henderson TCGOP_CALLO(op) = nb_rets; 171275e8b9b7SRichard Henderson 1713a7812ae4Spbrook real_args = 0; 1714a7812ae4Spbrook for (i = 0; i < nargs; i++) { 17152bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 1716bbb8a1b4SRichard Henderson if (TCG_TARGET_REG_BITS < 64 && is_64bit) { 171739cf05d3Sbellard #ifdef TCG_TARGET_CALL_ALIGN_ARGS 171839cf05d3Sbellard /* some targets want aligned 64 bit args */ 1719ebd486d5Smalc if (real_args & 1) { 172075e8b9b7SRichard Henderson op->args[pi++] = TCG_CALL_DUMMY_ARG; 1721ebd486d5Smalc real_args++; 172239cf05d3Sbellard } 172339cf05d3Sbellard #endif 17243f90f252SRichard Henderson /* If stack grows up, then we will be placing 
successive 17253f90f252SRichard Henderson arguments at lower addresses, which means we need to 17263f90f252SRichard Henderson reverse the order compared to how we would normally 17273f90f252SRichard Henderson treat either big or little-endian. For those arguments 17283f90f252SRichard Henderson that will wind up in registers, this still works for 17293f90f252SRichard Henderson HPPA (the only current STACK_GROWSUP target) since the 17303f90f252SRichard Henderson argument registers are *also* allocated in decreasing 17313f90f252SRichard Henderson order. If another such target is added, this logic may 17323f90f252SRichard Henderson have to get more complicated to differentiate between 17333f90f252SRichard Henderson stack arguments and register arguments. */ 173402eb19d0SRichard Henderson #if defined(HOST_WORDS_BIGENDIAN) != defined(TCG_TARGET_STACK_GROWSUP) 1735ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1736ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1737c896fe29Sbellard #else 1738ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1739ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i] + 1); 1740c896fe29Sbellard #endif 1741a7812ae4Spbrook real_args += 2; 17422bece2c8SRichard Henderson continue; 17432bece2c8SRichard Henderson } 17442bece2c8SRichard Henderson 1745ae8b75dcSRichard Henderson op->args[pi++] = temp_arg(args[i]); 1746a7812ae4Spbrook real_args++; 1747c896fe29Sbellard } 174875e8b9b7SRichard Henderson op->args[pi++] = (uintptr_t)func; 174975e8b9b7SRichard Henderson op->args[pi++] = flags; 1750cd9090aaSRichard Henderson TCGOP_CALLI(op) = real_args; 1751a7812ae4Spbrook 175275e8b9b7SRichard Henderson /* Make sure the fields didn't overflow. 
*/ 1753cd9090aaSRichard Henderson tcg_debug_assert(TCGOP_CALLI(op) == real_args); 175475e8b9b7SRichard Henderson tcg_debug_assert(pi <= ARRAY_SIZE(op->args)); 17552bece2c8SRichard Henderson 175634b1a49cSRichard Henderson #if defined(__sparc__) && !defined(__arch64__) \ 175734b1a49cSRichard Henderson && !defined(CONFIG_TCG_INTERPRETER) 175834b1a49cSRichard Henderson /* Free all of the parts we allocated above. */ 175934b1a49cSRichard Henderson for (i = real_args = 0; i < orig_nargs; ++i) { 176034b1a49cSRichard Henderson int is_64bit = orig_sizemask & (1 << (i+1)*2); 176134b1a49cSRichard Henderson if (is_64bit) { 1762085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 1763085272b3SRichard Henderson tcg_temp_free_internal(args[real_args++]); 176434b1a49cSRichard Henderson } else { 176534b1a49cSRichard Henderson real_args++; 176634b1a49cSRichard Henderson } 176734b1a49cSRichard Henderson } 176834b1a49cSRichard Henderson if (orig_sizemask & 1) { 176934b1a49cSRichard Henderson /* The 32-bit ABI returned two 32-bit pieces. Re-assemble them. 177034b1a49cSRichard Henderson Note that describing these as TCGv_i64 eliminates an unnecessary 177134b1a49cSRichard Henderson zero-extension that tcg_gen_concat_i32_i64 would create. 
*/ 1772085272b3SRichard Henderson tcg_gen_concat32_i64(temp_tcgv_i64(ret), retl, reth); 177334b1a49cSRichard Henderson tcg_temp_free_i64(retl); 177434b1a49cSRichard Henderson tcg_temp_free_i64(reth); 177534b1a49cSRichard Henderson } 177634b1a49cSRichard Henderson #elif defined(TCG_TARGET_EXTEND_ARGS) && TCG_TARGET_REG_BITS == 64 17772bece2c8SRichard Henderson for (i = 0; i < nargs; ++i) { 17782bece2c8SRichard Henderson int is_64bit = sizemask & (1 << (i+1)*2); 17792bece2c8SRichard Henderson if (!is_64bit) { 1780085272b3SRichard Henderson tcg_temp_free_internal(args[i]); 17812bece2c8SRichard Henderson } 17822bece2c8SRichard Henderson } 17832bece2c8SRichard Henderson #endif /* TCG_TARGET_EXTEND_ARGS */ 1784a7812ae4Spbrook } 1785c896fe29Sbellard 17868fcd3692Sblueswir1 static void tcg_reg_alloc_start(TCGContext *s) 1787c896fe29Sbellard { 1788ac3b8891SRichard Henderson int i, n; 1789c896fe29Sbellard TCGTemp *ts; 1790ac3b8891SRichard Henderson 1791ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 1792c896fe29Sbellard ts = &s->temps[i]; 1793ac3b8891SRichard Henderson ts->val_type = (ts->fixed_reg ? TEMP_VAL_REG : TEMP_VAL_MEM); 1794c896fe29Sbellard } 1795ac3b8891SRichard Henderson for (n = s->nb_temps; i < n; i++) { 1796e8996ee0Sbellard ts = &s->temps[i]; 1797ac3b8891SRichard Henderson ts->val_type = (ts->temp_local ? 
TEMP_VAL_MEM : TEMP_VAL_DEAD); 1798e8996ee0Sbellard ts->mem_allocated = 0; 1799e8996ee0Sbellard ts->fixed_reg = 0; 1800e8996ee0Sbellard } 1801f8b2f202SRichard Henderson 1802f8b2f202SRichard Henderson memset(s->reg_to_temp, 0, sizeof(s->reg_to_temp)); 1803c896fe29Sbellard } 1804c896fe29Sbellard 1805f8b2f202SRichard Henderson static char *tcg_get_arg_str_ptr(TCGContext *s, char *buf, int buf_size, 1806f8b2f202SRichard Henderson TCGTemp *ts) 1807c896fe29Sbellard { 18081807f4c4SRichard Henderson int idx = temp_idx(ts); 1809ac56dd48Spbrook 1810fa477d25SRichard Henderson if (ts->temp_global) { 1811ac56dd48Spbrook pstrcpy(buf, buf_size, ts->name); 1812f8b2f202SRichard Henderson } else if (ts->temp_local) { 1813641d5fbeSbellard snprintf(buf, buf_size, "loc%d", idx - s->nb_globals); 1814f8b2f202SRichard Henderson } else { 1815ac56dd48Spbrook snprintf(buf, buf_size, "tmp%d", idx - s->nb_globals); 1816c896fe29Sbellard } 1817c896fe29Sbellard return buf; 1818c896fe29Sbellard } 1819c896fe29Sbellard 182043439139SRichard Henderson static char *tcg_get_arg_str(TCGContext *s, char *buf, 182143439139SRichard Henderson int buf_size, TCGArg arg) 1822f8b2f202SRichard Henderson { 182343439139SRichard Henderson return tcg_get_arg_str_ptr(s, buf, buf_size, arg_temp(arg)); 1824f8b2f202SRichard Henderson } 1825f8b2f202SRichard Henderson 18266e085f72SRichard Henderson /* Find helper name. */ 18276e085f72SRichard Henderson static inline const char *tcg_find_helper(TCGContext *s, uintptr_t val) 1828e8996ee0Sbellard { 18296e085f72SRichard Henderson const char *ret = NULL; 1830619205fdSEmilio G. Cota if (helper_table) { 1831619205fdSEmilio G. 
Cota TCGHelperInfo *info = g_hash_table_lookup(helper_table, (gpointer)val); 183272866e82SRichard Henderson if (info) { 183372866e82SRichard Henderson ret = info->name; 183472866e82SRichard Henderson } 1835e8996ee0Sbellard } 18366e085f72SRichard Henderson return ret; 18374dc81f28Sbellard } 18384dc81f28Sbellard 1839f48f3edeSblueswir1 static const char * const cond_name[] = 1840f48f3edeSblueswir1 { 18410aed257fSRichard Henderson [TCG_COND_NEVER] = "never", 18420aed257fSRichard Henderson [TCG_COND_ALWAYS] = "always", 1843f48f3edeSblueswir1 [TCG_COND_EQ] = "eq", 1844f48f3edeSblueswir1 [TCG_COND_NE] = "ne", 1845f48f3edeSblueswir1 [TCG_COND_LT] = "lt", 1846f48f3edeSblueswir1 [TCG_COND_GE] = "ge", 1847f48f3edeSblueswir1 [TCG_COND_LE] = "le", 1848f48f3edeSblueswir1 [TCG_COND_GT] = "gt", 1849f48f3edeSblueswir1 [TCG_COND_LTU] = "ltu", 1850f48f3edeSblueswir1 [TCG_COND_GEU] = "geu", 1851f48f3edeSblueswir1 [TCG_COND_LEU] = "leu", 1852f48f3edeSblueswir1 [TCG_COND_GTU] = "gtu" 1853f48f3edeSblueswir1 }; 1854f48f3edeSblueswir1 1855f713d6adSRichard Henderson static const char * const ldst_name[] = 1856f713d6adSRichard Henderson { 1857f713d6adSRichard Henderson [MO_UB] = "ub", 1858f713d6adSRichard Henderson [MO_SB] = "sb", 1859f713d6adSRichard Henderson [MO_LEUW] = "leuw", 1860f713d6adSRichard Henderson [MO_LESW] = "lesw", 1861f713d6adSRichard Henderson [MO_LEUL] = "leul", 1862f713d6adSRichard Henderson [MO_LESL] = "lesl", 1863f713d6adSRichard Henderson [MO_LEQ] = "leq", 1864f713d6adSRichard Henderson [MO_BEUW] = "beuw", 1865f713d6adSRichard Henderson [MO_BESW] = "besw", 1866f713d6adSRichard Henderson [MO_BEUL] = "beul", 1867f713d6adSRichard Henderson [MO_BESL] = "besl", 1868f713d6adSRichard Henderson [MO_BEQ] = "beq", 1869f713d6adSRichard Henderson }; 1870f713d6adSRichard Henderson 18711f00b27fSSergey Sorokin static const char * const alignment_name[(MO_AMASK >> MO_ASHIFT) + 1] = { 18721f00b27fSSergey Sorokin #ifdef ALIGNED_ONLY 18731f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = 
"un+", 18741f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "", 18751f00b27fSSergey Sorokin #else 18761f00b27fSSergey Sorokin [MO_UNALN >> MO_ASHIFT] = "", 18771f00b27fSSergey Sorokin [MO_ALIGN >> MO_ASHIFT] = "al+", 18781f00b27fSSergey Sorokin #endif 18791f00b27fSSergey Sorokin [MO_ALIGN_2 >> MO_ASHIFT] = "al2+", 18801f00b27fSSergey Sorokin [MO_ALIGN_4 >> MO_ASHIFT] = "al4+", 18811f00b27fSSergey Sorokin [MO_ALIGN_8 >> MO_ASHIFT] = "al8+", 18821f00b27fSSergey Sorokin [MO_ALIGN_16 >> MO_ASHIFT] = "al16+", 18831f00b27fSSergey Sorokin [MO_ALIGN_32 >> MO_ASHIFT] = "al32+", 18841f00b27fSSergey Sorokin [MO_ALIGN_64 >> MO_ASHIFT] = "al64+", 18851f00b27fSSergey Sorokin }; 18861f00b27fSSergey Sorokin 1887eeacee4dSBlue Swirl void tcg_dump_ops(TCGContext *s) 1888c896fe29Sbellard { 1889c896fe29Sbellard char buf[128]; 1890c45cb8bbSRichard Henderson TCGOp *op; 1891c896fe29Sbellard 189215fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 1893c45cb8bbSRichard Henderson int i, k, nb_oargs, nb_iargs, nb_cargs; 1894c45cb8bbSRichard Henderson const TCGOpDef *def; 1895c45cb8bbSRichard Henderson TCGOpcode c; 1896bdfb460eSRichard Henderson int col = 0; 1897c45cb8bbSRichard Henderson 1898c45cb8bbSRichard Henderson c = op->opc; 1899c896fe29Sbellard def = &tcg_op_defs[c]; 1900c45cb8bbSRichard Henderson 1901765b842aSRichard Henderson if (c == INDEX_op_insn_start) { 190215fa08f8SRichard Henderson col += qemu_log("\n ----"); 19039aef40edSRichard Henderson 19049aef40edSRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 19059aef40edSRichard Henderson target_ulong a; 19067e4597d7Sbellard #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 1907efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 19087e4597d7Sbellard #else 1909efee3746SRichard Henderson a = op->args[i]; 19107e4597d7Sbellard #endif 1911bdfb460eSRichard Henderson col += qemu_log(" " TARGET_FMT_lx, a); 1912eeacee4dSBlue Swirl } 19137e4597d7Sbellard } else if (c == INDEX_op_call) { 
1914c896fe29Sbellard /* variable number of arguments */ 1915cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 1916cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 1917c896fe29Sbellard nb_cargs = def->nb_cargs; 1918b03cce8eSbellard 1919cf066674SRichard Henderson /* function name, flags, out args */ 1920bdfb460eSRichard Henderson col += qemu_log(" %s %s,$0x%" TCG_PRIlx ",$%d", def->name, 1921efee3746SRichard Henderson tcg_find_helper(s, op->args[nb_oargs + nb_iargs]), 1922efee3746SRichard Henderson op->args[nb_oargs + nb_iargs + 1], nb_oargs); 1923b03cce8eSbellard for (i = 0; i < nb_oargs; i++) { 192443439139SRichard Henderson col += qemu_log(",%s", tcg_get_arg_str(s, buf, sizeof(buf), 1925efee3746SRichard Henderson op->args[i])); 1926b03cce8eSbellard } 1927cf066674SRichard Henderson for (i = 0; i < nb_iargs; i++) { 1928efee3746SRichard Henderson TCGArg arg = op->args[nb_oargs + i]; 1929cf066674SRichard Henderson const char *t = "<dummy>"; 1930cf066674SRichard Henderson if (arg != TCG_CALL_DUMMY_ARG) { 193143439139SRichard Henderson t = tcg_get_arg_str(s, buf, sizeof(buf), arg); 1932b03cce8eSbellard } 1933bdfb460eSRichard Henderson col += qemu_log(",%s", t); 1934e8996ee0Sbellard } 1935b03cce8eSbellard } else { 1936bdfb460eSRichard Henderson col += qemu_log(" %s ", def->name); 1937c45cb8bbSRichard Henderson 1938c896fe29Sbellard nb_oargs = def->nb_oargs; 1939c896fe29Sbellard nb_iargs = def->nb_iargs; 1940c896fe29Sbellard nb_cargs = def->nb_cargs; 1941c896fe29Sbellard 1942d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 1943d2fd745fSRichard Henderson col += qemu_log("v%d,e%d,", 64 << TCGOP_VECL(op), 1944d2fd745fSRichard Henderson 8 << TCGOP_VECE(op)); 1945d2fd745fSRichard Henderson } 1946d2fd745fSRichard Henderson 1947c896fe29Sbellard k = 0; 1948c896fe29Sbellard for (i = 0; i < nb_oargs; i++) { 1949eeacee4dSBlue Swirl if (k != 0) { 1950bdfb460eSRichard Henderson col += qemu_log(","); 1951eeacee4dSBlue Swirl } 195243439139SRichard Henderson col += 
qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1953efee3746SRichard Henderson op->args[k++])); 1954c896fe29Sbellard } 1955c896fe29Sbellard for (i = 0; i < nb_iargs; i++) { 1956eeacee4dSBlue Swirl if (k != 0) { 1957bdfb460eSRichard Henderson col += qemu_log(","); 1958eeacee4dSBlue Swirl } 195943439139SRichard Henderson col += qemu_log("%s", tcg_get_arg_str(s, buf, sizeof(buf), 1960efee3746SRichard Henderson op->args[k++])); 1961c896fe29Sbellard } 1962be210acbSRichard Henderson switch (c) { 1963be210acbSRichard Henderson case INDEX_op_brcond_i32: 1964ffc5ea09SRichard Henderson case INDEX_op_setcond_i32: 1965ffc5ea09SRichard Henderson case INDEX_op_movcond_i32: 1966be210acbSRichard Henderson case INDEX_op_brcond2_i32: 1967be210acbSRichard Henderson case INDEX_op_setcond2_i32: 1968ffc5ea09SRichard Henderson case INDEX_op_brcond_i64: 1969be210acbSRichard Henderson case INDEX_op_setcond_i64: 1970ffc5ea09SRichard Henderson case INDEX_op_movcond_i64: 1971212be173SRichard Henderson case INDEX_op_cmp_vec: 1972efee3746SRichard Henderson if (op->args[k] < ARRAY_SIZE(cond_name) 1973efee3746SRichard Henderson && cond_name[op->args[k]]) { 1974efee3746SRichard Henderson col += qemu_log(",%s", cond_name[op->args[k++]]); 1975eeacee4dSBlue Swirl } else { 1976efee3746SRichard Henderson col += qemu_log(",$0x%" TCG_PRIlx, op->args[k++]); 1977eeacee4dSBlue Swirl } 1978f48f3edeSblueswir1 i = 1; 1979be210acbSRichard Henderson break; 1980f713d6adSRichard Henderson case INDEX_op_qemu_ld_i32: 1981f713d6adSRichard Henderson case INDEX_op_qemu_st_i32: 1982f713d6adSRichard Henderson case INDEX_op_qemu_ld_i64: 1983f713d6adSRichard Henderson case INDEX_op_qemu_st_i64: 198459227d5dSRichard Henderson { 1985efee3746SRichard Henderson TCGMemOpIdx oi = op->args[k++]; 198659227d5dSRichard Henderson TCGMemOp op = get_memop(oi); 198759227d5dSRichard Henderson unsigned ix = get_mmuidx(oi); 198859227d5dSRichard Henderson 198959c4b7e8SRichard Henderson if (op & ~(MO_AMASK | MO_BSWAP | MO_SSIZE)) { 
1990bdfb460eSRichard Henderson col += qemu_log(",$0x%x,%u", op, ix); 199159c4b7e8SRichard Henderson } else { 19921f00b27fSSergey Sorokin const char *s_al, *s_op; 19931f00b27fSSergey Sorokin s_al = alignment_name[(op & MO_AMASK) >> MO_ASHIFT]; 199459c4b7e8SRichard Henderson s_op = ldst_name[op & (MO_BSWAP | MO_SSIZE)]; 1995bdfb460eSRichard Henderson col += qemu_log(",%s%s,%u", s_al, s_op, ix); 1996f713d6adSRichard Henderson } 1997f713d6adSRichard Henderson i = 1; 199859227d5dSRichard Henderson } 1999f713d6adSRichard Henderson break; 2000be210acbSRichard Henderson default: 2001f48f3edeSblueswir1 i = 0; 2002be210acbSRichard Henderson break; 2003be210acbSRichard Henderson } 200451e3972cSRichard Henderson switch (c) { 200551e3972cSRichard Henderson case INDEX_op_set_label: 200651e3972cSRichard Henderson case INDEX_op_br: 200751e3972cSRichard Henderson case INDEX_op_brcond_i32: 200851e3972cSRichard Henderson case INDEX_op_brcond_i64: 200951e3972cSRichard Henderson case INDEX_op_brcond2_i32: 2010efee3746SRichard Henderson col += qemu_log("%s$L%d", k ? "," : "", 2011efee3746SRichard Henderson arg_label(op->args[k])->id); 201251e3972cSRichard Henderson i++, k++; 201351e3972cSRichard Henderson break; 201451e3972cSRichard Henderson default: 201551e3972cSRichard Henderson break; 2016eeacee4dSBlue Swirl } 201751e3972cSRichard Henderson for (; i < nb_cargs; i++, k++) { 2018efee3746SRichard Henderson col += qemu_log("%s$0x%" TCG_PRIlx, k ? 
"," : "", op->args[k]); 2019bdfb460eSRichard Henderson } 2020bdfb460eSRichard Henderson } 2021bdfb460eSRichard Henderson if (op->life) { 2022bdfb460eSRichard Henderson unsigned life = op->life; 2023bdfb460eSRichard Henderson 2024bdfb460eSRichard Henderson for (; col < 48; ++col) { 2025bdfb460eSRichard Henderson putc(' ', qemu_logfile); 2026bdfb460eSRichard Henderson } 2027bdfb460eSRichard Henderson 2028bdfb460eSRichard Henderson if (life & (SYNC_ARG * 3)) { 2029bdfb460eSRichard Henderson qemu_log(" sync:"); 2030bdfb460eSRichard Henderson for (i = 0; i < 2; ++i) { 2031bdfb460eSRichard Henderson if (life & (SYNC_ARG << i)) { 2032bdfb460eSRichard Henderson qemu_log(" %d", i); 2033bdfb460eSRichard Henderson } 2034bdfb460eSRichard Henderson } 2035bdfb460eSRichard Henderson } 2036bdfb460eSRichard Henderson life /= DEAD_ARG; 2037bdfb460eSRichard Henderson if (life) { 2038bdfb460eSRichard Henderson qemu_log(" dead:"); 2039bdfb460eSRichard Henderson for (i = 0; life; ++i, life >>= 1) { 2040bdfb460eSRichard Henderson if (life & 1) { 2041bdfb460eSRichard Henderson qemu_log(" %d", i); 2042bdfb460eSRichard Henderson } 2043bdfb460eSRichard Henderson } 2044c896fe29Sbellard } 2045b03cce8eSbellard } 2046eeacee4dSBlue Swirl qemu_log("\n"); 2047c896fe29Sbellard } 2048c896fe29Sbellard } 2049c896fe29Sbellard 2050c896fe29Sbellard /* we give more priority to constraints with less registers */ 2051c896fe29Sbellard static int get_constraint_priority(const TCGOpDef *def, int k) 2052c896fe29Sbellard { 2053c896fe29Sbellard const TCGArgConstraint *arg_ct; 2054c896fe29Sbellard 2055c896fe29Sbellard int i, n; 2056c896fe29Sbellard arg_ct = &def->args_ct[k]; 2057c896fe29Sbellard if (arg_ct->ct & TCG_CT_ALIAS) { 2058c896fe29Sbellard /* an alias is equivalent to a single register */ 2059c896fe29Sbellard n = 1; 2060c896fe29Sbellard } else { 2061c896fe29Sbellard if (!(arg_ct->ct & TCG_CT_REG)) 2062c896fe29Sbellard return 0; 2063c896fe29Sbellard n = 0; 2064c896fe29Sbellard for(i = 0; i < 
TCG_TARGET_NB_REGS; i++) { 2065c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, i)) 2066c896fe29Sbellard n++; 2067c896fe29Sbellard } 2068c896fe29Sbellard } 2069c896fe29Sbellard return TCG_TARGET_NB_REGS - n + 1; 2070c896fe29Sbellard } 2071c896fe29Sbellard 2072c896fe29Sbellard /* sort from highest priority to lowest */ 2073c896fe29Sbellard static void sort_constraints(TCGOpDef *def, int start, int n) 2074c896fe29Sbellard { 2075c896fe29Sbellard int i, j, p1, p2, tmp; 2076c896fe29Sbellard 2077c896fe29Sbellard for(i = 0; i < n; i++) 2078c896fe29Sbellard def->sorted_args[start + i] = start + i; 2079c896fe29Sbellard if (n <= 1) 2080c896fe29Sbellard return; 2081c896fe29Sbellard for(i = 0; i < n - 1; i++) { 2082c896fe29Sbellard for(j = i + 1; j < n; j++) { 2083c896fe29Sbellard p1 = get_constraint_priority(def, def->sorted_args[start + i]); 2084c896fe29Sbellard p2 = get_constraint_priority(def, def->sorted_args[start + j]); 2085c896fe29Sbellard if (p1 < p2) { 2086c896fe29Sbellard tmp = def->sorted_args[start + i]; 2087c896fe29Sbellard def->sorted_args[start + i] = def->sorted_args[start + j]; 2088c896fe29Sbellard def->sorted_args[start + j] = tmp; 2089c896fe29Sbellard } 2090c896fe29Sbellard } 2091c896fe29Sbellard } 2092c896fe29Sbellard } 2093c896fe29Sbellard 2094f69d277eSRichard Henderson static void process_op_defs(TCGContext *s) 2095c896fe29Sbellard { 2096a9751609SRichard Henderson TCGOpcode op; 2097c896fe29Sbellard 2098f69d277eSRichard Henderson for (op = 0; op < NB_OPS; op++) { 2099f69d277eSRichard Henderson TCGOpDef *def = &tcg_op_defs[op]; 2100f69d277eSRichard Henderson const TCGTargetOpDef *tdefs; 2101069ea736SRichard Henderson TCGType type; 2102069ea736SRichard Henderson int i, nb_args; 2103f69d277eSRichard Henderson 2104f69d277eSRichard Henderson if (def->flags & TCG_OPF_NOT_PRESENT) { 2105f69d277eSRichard Henderson continue; 2106f69d277eSRichard Henderson } 2107f69d277eSRichard Henderson 2108c896fe29Sbellard nb_args = def->nb_iargs + def->nb_oargs; 
2109f69d277eSRichard Henderson if (nb_args == 0) { 2110f69d277eSRichard Henderson continue; 2111f69d277eSRichard Henderson } 2112f69d277eSRichard Henderson 2113f69d277eSRichard Henderson tdefs = tcg_target_op_def(op); 2114f69d277eSRichard Henderson /* Missing TCGTargetOpDef entry. */ 2115f69d277eSRichard Henderson tcg_debug_assert(tdefs != NULL); 2116f69d277eSRichard Henderson 2117069ea736SRichard Henderson type = (def->flags & TCG_OPF_64BIT ? TCG_TYPE_I64 : TCG_TYPE_I32); 2118c896fe29Sbellard for (i = 0; i < nb_args; i++) { 2119f69d277eSRichard Henderson const char *ct_str = tdefs->args_ct_str[i]; 2120f69d277eSRichard Henderson /* Incomplete TCGTargetOpDef entry. */ 2121eabb7b91SAurelien Jarno tcg_debug_assert(ct_str != NULL); 2122f69d277eSRichard Henderson 2123ccb1bb66SRichard Henderson def->args_ct[i].u.regs = 0; 2124c896fe29Sbellard def->args_ct[i].ct = 0; 212517280ff4SRichard Henderson while (*ct_str != '\0') { 212617280ff4SRichard Henderson switch(*ct_str) { 212717280ff4SRichard Henderson case '0' ... '9': 212817280ff4SRichard Henderson { 212917280ff4SRichard Henderson int oarg = *ct_str - '0'; 213017280ff4SRichard Henderson tcg_debug_assert(ct_str == tdefs->args_ct_str[i]); 2131eabb7b91SAurelien Jarno tcg_debug_assert(oarg < def->nb_oargs); 2132eabb7b91SAurelien Jarno tcg_debug_assert(def->args_ct[oarg].ct & TCG_CT_REG); 213317280ff4SRichard Henderson /* TCG_CT_ALIAS is for the output arguments. 213417280ff4SRichard Henderson The input is tagged with TCG_CT_IALIAS. 
*/ 2135c896fe29Sbellard def->args_ct[i] = def->args_ct[oarg]; 213617280ff4SRichard Henderson def->args_ct[oarg].ct |= TCG_CT_ALIAS; 21375ff9d6a4Sbellard def->args_ct[oarg].alias_index = i; 2138c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_IALIAS; 21395ff9d6a4Sbellard def->args_ct[i].alias_index = oarg; 214017280ff4SRichard Henderson } 214117280ff4SRichard Henderson ct_str++; 2142c896fe29Sbellard break; 214382790a87SRichard Henderson case '&': 214482790a87SRichard Henderson def->args_ct[i].ct |= TCG_CT_NEWREG; 214582790a87SRichard Henderson ct_str++; 214682790a87SRichard Henderson break; 2147c896fe29Sbellard case 'i': 2148c896fe29Sbellard def->args_ct[i].ct |= TCG_CT_CONST; 2149c896fe29Sbellard ct_str++; 2150c896fe29Sbellard break; 2151c896fe29Sbellard default: 2152069ea736SRichard Henderson ct_str = target_parse_constraint(&def->args_ct[i], 2153069ea736SRichard Henderson ct_str, type); 2154f69d277eSRichard Henderson /* Typo in TCGTargetOpDef constraint. */ 2155069ea736SRichard Henderson tcg_debug_assert(ct_str != NULL); 2156c896fe29Sbellard } 2157c896fe29Sbellard } 2158c896fe29Sbellard } 2159c896fe29Sbellard 2160c68aaa18SStefan Weil /* TCGTargetOpDef entry with too much information? 
*/ 2161eabb7b91SAurelien Jarno tcg_debug_assert(i == TCG_MAX_OP_ARGS || tdefs->args_ct_str[i] == NULL); 2162c68aaa18SStefan Weil 2163c896fe29Sbellard /* sort the constraints (XXX: this is just an heuristic) */ 2164c896fe29Sbellard sort_constraints(def, 0, def->nb_oargs); 2165c896fe29Sbellard sort_constraints(def, def->nb_oargs, def->nb_iargs); 2166c896fe29Sbellard } 2167c896fe29Sbellard } 2168c896fe29Sbellard 21690c627cdcSRichard Henderson void tcg_op_remove(TCGContext *s, TCGOp *op) 21700c627cdcSRichard Henderson { 217115fa08f8SRichard Henderson QTAILQ_REMOVE(&s->ops, op, link); 217215fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&s->free_ops, op, link); 2173abebf925SRichard Henderson s->nb_ops--; 21740c627cdcSRichard Henderson 21750c627cdcSRichard Henderson #ifdef CONFIG_PROFILER 2176c3fac113SEmilio G. Cota atomic_set(&s->prof.del_op_count, s->prof.del_op_count + 1); 21770c627cdcSRichard Henderson #endif 21780c627cdcSRichard Henderson } 21790c627cdcSRichard Henderson 218015fa08f8SRichard Henderson static TCGOp *tcg_op_alloc(TCGOpcode opc) 218115fa08f8SRichard Henderson { 218215fa08f8SRichard Henderson TCGContext *s = tcg_ctx; 218315fa08f8SRichard Henderson TCGOp *op; 218415fa08f8SRichard Henderson 218515fa08f8SRichard Henderson if (likely(QTAILQ_EMPTY(&s->free_ops))) { 218615fa08f8SRichard Henderson op = tcg_malloc(sizeof(TCGOp)); 218715fa08f8SRichard Henderson } else { 218815fa08f8SRichard Henderson op = QTAILQ_FIRST(&s->free_ops); 218915fa08f8SRichard Henderson QTAILQ_REMOVE(&s->free_ops, op, link); 219015fa08f8SRichard Henderson } 219115fa08f8SRichard Henderson memset(op, 0, offsetof(TCGOp, link)); 219215fa08f8SRichard Henderson op->opc = opc; 2193abebf925SRichard Henderson s->nb_ops++; 219415fa08f8SRichard Henderson 219515fa08f8SRichard Henderson return op; 219615fa08f8SRichard Henderson } 219715fa08f8SRichard Henderson 219815fa08f8SRichard Henderson TCGOp *tcg_emit_op(TCGOpcode opc) 219915fa08f8SRichard Henderson { 220015fa08f8SRichard Henderson TCGOp *op = 
tcg_op_alloc(opc); 220115fa08f8SRichard Henderson QTAILQ_INSERT_TAIL(&tcg_ctx->ops, op, link); 220215fa08f8SRichard Henderson return op; 220315fa08f8SRichard Henderson } 220415fa08f8SRichard Henderson 22055a18407fSRichard Henderson TCGOp *tcg_op_insert_before(TCGContext *s, TCGOp *old_op, 22065a18407fSRichard Henderson TCGOpcode opc, int nargs) 22075a18407fSRichard Henderson { 220815fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 220915fa08f8SRichard Henderson QTAILQ_INSERT_BEFORE(old_op, new_op, link); 22105a18407fSRichard Henderson return new_op; 22115a18407fSRichard Henderson } 22125a18407fSRichard Henderson 22135a18407fSRichard Henderson TCGOp *tcg_op_insert_after(TCGContext *s, TCGOp *old_op, 22145a18407fSRichard Henderson TCGOpcode opc, int nargs) 22155a18407fSRichard Henderson { 221615fa08f8SRichard Henderson TCGOp *new_op = tcg_op_alloc(opc); 221715fa08f8SRichard Henderson QTAILQ_INSERT_AFTER(&s->ops, old_op, new_op, link); 22185a18407fSRichard Henderson return new_op; 22195a18407fSRichard Henderson } 22205a18407fSRichard Henderson 2221c70fbf0aSRichard Henderson #define TS_DEAD 1 2222c70fbf0aSRichard Henderson #define TS_MEM 2 2223c70fbf0aSRichard Henderson 22245a18407fSRichard Henderson #define IS_DEAD_ARG(n) (arg_life & (DEAD_ARG << (n))) 22255a18407fSRichard Henderson #define NEED_SYNC_ARG(n) (arg_life & (SYNC_ARG << (n))) 22265a18407fSRichard Henderson 22279c43b68dSAurelien Jarno /* liveness analysis: end of function: all temps are dead, and globals 22289c43b68dSAurelien Jarno should be in memory. 
*/ 2229b83eabeaSRichard Henderson static void tcg_la_func_end(TCGContext *s) 2230c896fe29Sbellard { 2231b83eabeaSRichard Henderson int ng = s->nb_globals; 2232b83eabeaSRichard Henderson int nt = s->nb_temps; 2233b83eabeaSRichard Henderson int i; 2234b83eabeaSRichard Henderson 2235b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2236b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2237b83eabeaSRichard Henderson } 2238b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2239b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD; 2240b83eabeaSRichard Henderson } 2241c896fe29Sbellard } 2242c896fe29Sbellard 22439c43b68dSAurelien Jarno /* liveness analysis: end of basic block: all temps are dead, globals 22449c43b68dSAurelien Jarno and local temps should be in memory. */ 2245b83eabeaSRichard Henderson static void tcg_la_bb_end(TCGContext *s) 2246641d5fbeSbellard { 2247b83eabeaSRichard Henderson int ng = s->nb_globals; 2248b83eabeaSRichard Henderson int nt = s->nb_temps; 2249b83eabeaSRichard Henderson int i; 2250641d5fbeSbellard 2251b83eabeaSRichard Henderson for (i = 0; i < ng; ++i) { 2252b83eabeaSRichard Henderson s->temps[i].state = TS_DEAD | TS_MEM; 2253c70fbf0aSRichard Henderson } 2254b83eabeaSRichard Henderson for (i = ng; i < nt; ++i) { 2255b83eabeaSRichard Henderson s->temps[i].state = (s->temps[i].temp_local 2256b83eabeaSRichard Henderson ? TS_DEAD | TS_MEM 2257b83eabeaSRichard Henderson : TS_DEAD); 2258641d5fbeSbellard } 2259641d5fbeSbellard } 2260641d5fbeSbellard 2261a1b3c48dSRichard Henderson /* Liveness analysis : update the opc_arg_life array to tell if a 2262c896fe29Sbellard given input arguments is dead. Instructions updating dead 2263c896fe29Sbellard temporaries are removed. 
*/
/* The pass starts from the end-of-function state set by tcg_la_func_end
   and visits s->ops with QTAILQ_FOREACH_REVERSE_SAFE (presumably last op
   first, and safe against removal of the current op).  While visiting an
   op, each temp's state therefore describes how the ops after it use the
   temp: TS_DEAD means the value is not needed, TS_MEM means the value is
   wanted in memory.  */
static void liveness_pass_1(TCGContext *s)
{
    int nb_globals = s->nb_globals;
    TCGOp *op, *op_prev;

    tcg_la_func_end(s);

    QTAILQ_FOREACH_REVERSE_SAFE(op, &s->ops, TCGOpHead, link, op_prev) {
        int i, nb_iargs, nb_oargs;
        TCGOpcode opc_new, opc_new2;
        bool have_opc_new2;
        /* Life bits accumulated for this op; stored in op->life below. */
        TCGLifeData arg_life = 0;
        TCGTemp *arg_ts;
        TCGOpcode opc = op->opc;
        const TCGOpDef *def = &tcg_op_defs[opc];

        switch (opc) {
        case INDEX_op_call:
            {
                int call_flags;

                /* Calls carry their own argument counts; the flags follow
                   the function pointer after the in/out arguments. */
                nb_oargs = TCGOP_CALLO(op);
                nb_iargs = TCGOP_CALLI(op);
                call_flags = op->args[nb_oargs + nb_iargs + 1];

                /* pure functions can be removed if their result is unused */
                if (call_flags & TCG_CALL_NO_SIDE_EFFECTS) {
                    for (i = 0; i < nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        if (arg_ts->state != TS_DEAD) {
                            goto do_not_remove_call;
                        }
                    }
                    /* Shares the removal code in the default case. */
                    goto do_remove;
                } else {
                do_not_remove_call:

                    /* Outputs: record whether the result is dead and/or
                       must be synced, then mark the temp dead for the
                       preceding ops, since this op overwrites it. */
                    for (i = 0; i < nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        if (arg_ts->state & TS_DEAD) {
                            arg_life |= DEAD_ARG << i;
                        }
                        if (arg_ts->state & TS_MEM) {
                            arg_life |= SYNC_ARG << i;
                        }
                        arg_ts->state = TS_DEAD;
                    }

                    if (!(call_flags & (TCG_CALL_NO_WRITE_GLOBALS |
                                        TCG_CALL_NO_READ_GLOBALS))) {
                        /* globals should go back to memory */
                        for (i = 0; i < nb_globals; i++) {
                            s->temps[i].state = TS_DEAD | TS_MEM;
                        }
                    } else if (!(call_flags & TCG_CALL_NO_READ_GLOBALS)) {
                        /* globals should be synced to memory */
                        for (i = 0; i < nb_globals; i++) {
                            s->temps[i].state |= TS_MEM;
                        }
                    }

                    /* record arguments that die in this helper
                       (arg_temp() may yield NULL for a call input, hence
                       the check) */
                    for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        if (arg_ts && arg_ts->state & TS_DEAD) {
                            arg_life |= DEAD_ARG << i;
                        }
                    }
                    /* input arguments are live for preceding opcodes */
                    for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) {
                        arg_ts = arg_temp(op->args[i]);
                        if (arg_ts) {
                            arg_ts->state &= ~TS_DEAD;
                        }
                    }
                }
            }
            break;
        case INDEX_op_insn_start:
            /* No effect on liveness. */
            break;
        case INDEX_op_discard:
            /* mark the temporary as dead */
            arg_temp(op->args[0])->state = TS_DEAD;
            break;

        case INDEX_op_add2_i32:
            opc_new = INDEX_op_add_i32;
            goto do_addsub2;
        case INDEX_op_sub2_i32:
            opc_new = INDEX_op_sub_i32;
            goto do_addsub2;
        case INDEX_op_add2_i64:
            opc_new = INDEX_op_add_i64;
            goto do_addsub2;
        case INDEX_op_sub2_i64:
            opc_new = INDEX_op_sub_i64;
        do_addsub2:
            nb_iargs = 4;
            nb_oargs = 2;
            /* Test if the high part of the operation is dead, but not
               the low part.  The result can be optimized to a simple
               add or sub.  This happens often for x86_64 guest when the
               cpu mode is set to 32 bit.  */
            if (arg_temp(op->args[1])->state == TS_DEAD) {
                if (arg_temp(op->args[0])->state == TS_DEAD) {
                    goto do_remove;
                }
                /* Replace the opcode and adjust the args in place,
                   leaving 3 unused args at the end.  The new inputs are
                   the old args 2 and 4.  */
                op->opc = opc = opc_new;
                op->args[1] = op->args[2];
                op->args[2] = op->args[4];
                /* Fall through and mark the single-word operation live.  */
                nb_iargs = 2;
                nb_oargs = 1;
            }
            goto do_not_remove;

        case INDEX_op_mulu2_i32:
            opc_new = INDEX_op_mul_i32;
            opc_new2 = INDEX_op_muluh_i32;
            have_opc_new2 = TCG_TARGET_HAS_muluh_i32;
            goto do_mul2;
        case INDEX_op_muls2_i32:
            opc_new = INDEX_op_mul_i32;
            opc_new2 = INDEX_op_mulsh_i32;
            have_opc_new2 = TCG_TARGET_HAS_mulsh_i32;
            goto do_mul2;
        case INDEX_op_mulu2_i64:
            opc_new = INDEX_op_mul_i64;
            opc_new2 = INDEX_op_muluh_i64;
            have_opc_new2 = TCG_TARGET_HAS_muluh_i64;
            goto do_mul2;
        case INDEX_op_muls2_i64:
            opc_new = INDEX_op_mul_i64;
            opc_new2 = INDEX_op_mulsh_i64;
            have_opc_new2 = TCG_TARGET_HAS_mulsh_i64;
            goto do_mul2;
        do_mul2:
            nb_iargs = 2;
            nb_oargs = 2;
            if (arg_temp(op->args[1])->state == TS_DEAD) {
                if (arg_temp(op->args[0])->state == TS_DEAD) {
                    /* Both parts of the operation are dead.  */
                    goto do_remove;
                }
                /* The high part of the operation is dead; generate the low. */
                op->opc = opc = opc_new;
                op->args[1] = op->args[2];
                op->args[2] = op->args[3];
            } else if (arg_temp(op->args[0])->state == TS_DEAD && have_opc_new2) {
                /* The low part of the operation is dead; generate the high. */
                op->opc = opc = opc_new2;
                op->args[0] = op->args[1];
                op->args[1] = op->args[2];
                op->args[2] = op->args[3];
            } else {
                /* Both halves needed, or no high-part opcode available. */
                goto do_not_remove;
            }
            /* Mark the single-word operation live.  */
            nb_oargs = 1;
            goto do_not_remove;

        default:
            /* XXX: optimize by hardcoding common cases (e.g. triadic ops) */
            nb_iargs = def->nb_iargs;
            nb_oargs = def->nb_oargs;

            /* Test if the operation can be removed because all
               its outputs are dead. We assume that nb_oargs == 0
               implies side effects */
            if (!(def->flags & TCG_OPF_SIDE_EFFECTS) && nb_oargs != 0) {
                for (i = 0; i < nb_oargs; i++) {
                    if (arg_temp(op->args[i])->state != TS_DEAD) {
                        goto do_not_remove;
                    }
                }
            do_remove:
                /* Also reached by goto from the call, add2/sub2 and mul2
                   cases above. */
                tcg_op_remove(s, op);
            } else {
            do_not_remove:
                /* Also reached by goto from the add2/sub2 and mul2 cases,
                   with nb_iargs/nb_oargs already adjusted there.  Note
                   that def still refers to the opcode the op had on
                   entry to the switch. */
                /* Outputs: record dead/sync bits, then mark the temp
                   dead for the preceding ops. */
                for (i = 0; i < nb_oargs; i++) {
                    arg_ts = arg_temp(op->args[i]);
                    if (arg_ts->state & TS_DEAD) {
                        arg_life |= DEAD_ARG << i;
                    }
                    if (arg_ts->state & TS_MEM) {
                        arg_life |= SYNC_ARG << i;
                    }
                    arg_ts->state = TS_DEAD;
                }

                /* if end of basic block, update */
                if (def->flags & TCG_OPF_BB_END) {
                    tcg_la_bb_end(s);
                } else if (def->flags & TCG_OPF_SIDE_EFFECTS) {
                    /* globals should be synced to memory */
                    for (i = 0; i < nb_globals; i++) {
                        s->temps[i].state |= TS_MEM;
                    }
                }

                /* record arguments that die in this opcode */
                for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
                    arg_ts = arg_temp(op->args[i]);
                    if (arg_ts->state & TS_DEAD) {
                        arg_life |= DEAD_ARG << i;
                    }
                }
                /* input arguments are live for preceding opcodes */
                for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) {
                    arg_temp(op->args[i])->state &= ~TS_DEAD;
                }
            }
            break;
        }
        /* Written for every visited op, including one just removed. */
        op->life = arg_life;
    }
}

/* Liveness analysis: Convert indirect regs to direct temporaries.  */
static bool liveness_pass_2(TCGContext *s)
{
    int nb_globals = s->nb_globals;
    int nb_temps, i;
    bool changes = false;
    TCGOp *op, *op_next;

    /* Create a temporary for each indirect global.  */
    for (i = 0; i < nb_globals; ++i) {
        TCGTemp *its = &s->temps[i];
        if (its->indirect_reg) {
            TCGTemp *dts = tcg_temp_alloc(s);
            dts->type = its->type;
            dts->base_type = its->base_type;
            its->state_ptr = dts;
        } else {
            its->state_ptr = NULL;
        }
        /* All globals begin dead.
*/ 2506b83eabeaSRichard Henderson its->state = TS_DEAD; 25075a18407fSRichard Henderson } 2508b83eabeaSRichard Henderson for (nb_temps = s->nb_temps; i < nb_temps; ++i) { 2509b83eabeaSRichard Henderson TCGTemp *its = &s->temps[i]; 2510b83eabeaSRichard Henderson its->state_ptr = NULL; 2511b83eabeaSRichard Henderson its->state = TS_DEAD; 2512b83eabeaSRichard Henderson } 25135a18407fSRichard Henderson 251415fa08f8SRichard Henderson QTAILQ_FOREACH_SAFE(op, &s->ops, link, op_next) { 25155a18407fSRichard Henderson TCGOpcode opc = op->opc; 25165a18407fSRichard Henderson const TCGOpDef *def = &tcg_op_defs[opc]; 25175a18407fSRichard Henderson TCGLifeData arg_life = op->life; 25185a18407fSRichard Henderson int nb_iargs, nb_oargs, call_flags; 2519b83eabeaSRichard Henderson TCGTemp *arg_ts, *dir_ts; 25205a18407fSRichard Henderson 25215a18407fSRichard Henderson if (opc == INDEX_op_call) { 2522cd9090aaSRichard Henderson nb_oargs = TCGOP_CALLO(op); 2523cd9090aaSRichard Henderson nb_iargs = TCGOP_CALLI(op); 2524efee3746SRichard Henderson call_flags = op->args[nb_oargs + nb_iargs + 1]; 25255a18407fSRichard Henderson } else { 25265a18407fSRichard Henderson nb_iargs = def->nb_iargs; 25275a18407fSRichard Henderson nb_oargs = def->nb_oargs; 25285a18407fSRichard Henderson 25295a18407fSRichard Henderson /* Set flags similar to how calls require. */ 25305a18407fSRichard Henderson if (def->flags & TCG_OPF_BB_END) { 25315a18407fSRichard Henderson /* Like writing globals: save_globals */ 25325a18407fSRichard Henderson call_flags = 0; 25335a18407fSRichard Henderson } else if (def->flags & TCG_OPF_SIDE_EFFECTS) { 25345a18407fSRichard Henderson /* Like reading globals: sync_globals */ 25355a18407fSRichard Henderson call_flags = TCG_CALL_NO_WRITE_GLOBALS; 25365a18407fSRichard Henderson } else { 25375a18407fSRichard Henderson /* No effect on globals. 
*/ 25385a18407fSRichard Henderson call_flags = (TCG_CALL_NO_READ_GLOBALS | 25395a18407fSRichard Henderson TCG_CALL_NO_WRITE_GLOBALS); 25405a18407fSRichard Henderson } 25415a18407fSRichard Henderson } 25425a18407fSRichard Henderson 25435a18407fSRichard Henderson /* Make sure that input arguments are available. */ 25445a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2545b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2546b83eabeaSRichard Henderson if (arg_ts) { 2547b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2548b83eabeaSRichard Henderson if (dir_ts && arg_ts->state == TS_DEAD) { 2549b83eabeaSRichard Henderson TCGOpcode lopc = (arg_ts->type == TCG_TYPE_I32 25505a18407fSRichard Henderson ? INDEX_op_ld_i32 25515a18407fSRichard Henderson : INDEX_op_ld_i64); 25525a18407fSRichard Henderson TCGOp *lop = tcg_op_insert_before(s, op, lopc, 3); 25535a18407fSRichard Henderson 2554b83eabeaSRichard Henderson lop->args[0] = temp_arg(dir_ts); 2555b83eabeaSRichard Henderson lop->args[1] = temp_arg(arg_ts->mem_base); 2556b83eabeaSRichard Henderson lop->args[2] = arg_ts->mem_offset; 25575a18407fSRichard Henderson 25585a18407fSRichard Henderson /* Loaded, but synced with memory. */ 2559b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 25605a18407fSRichard Henderson } 25615a18407fSRichard Henderson } 25625a18407fSRichard Henderson } 25635a18407fSRichard Henderson 25645a18407fSRichard Henderson /* Perform input replacement, and mark inputs that became dead. 25655a18407fSRichard Henderson No action is required except keeping temp_state up to date 25665a18407fSRichard Henderson so that we reload when needed. 
*/ 25675a18407fSRichard Henderson for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 2568b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2569b83eabeaSRichard Henderson if (arg_ts) { 2570b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2571b83eabeaSRichard Henderson if (dir_ts) { 2572b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 25735a18407fSRichard Henderson changes = true; 25745a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2575b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 25765a18407fSRichard Henderson } 25775a18407fSRichard Henderson } 25785a18407fSRichard Henderson } 25795a18407fSRichard Henderson } 25805a18407fSRichard Henderson 25815a18407fSRichard Henderson /* Liveness analysis should ensure that the following are 25825a18407fSRichard Henderson all correct, for call sites and basic block end points. */ 25835a18407fSRichard Henderson if (call_flags & TCG_CALL_NO_READ_GLOBALS) { 25845a18407fSRichard Henderson /* Nothing to do */ 25855a18407fSRichard Henderson } else if (call_flags & TCG_CALL_NO_WRITE_GLOBALS) { 25865a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 25875a18407fSRichard Henderson /* Liveness should see that globals are synced back, 25885a18407fSRichard Henderson that is, either TS_DEAD or TS_MEM. */ 2589b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2590b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2591b83eabeaSRichard Henderson || arg_ts->state != 0); 25925a18407fSRichard Henderson } 25935a18407fSRichard Henderson } else { 25945a18407fSRichard Henderson for (i = 0; i < nb_globals; ++i) { 25955a18407fSRichard Henderson /* Liveness should see that globals are saved back, 25965a18407fSRichard Henderson that is, TS_DEAD, waiting to be reloaded. 
*/ 2597b83eabeaSRichard Henderson arg_ts = &s->temps[i]; 2598b83eabeaSRichard Henderson tcg_debug_assert(arg_ts->state_ptr == 0 2599b83eabeaSRichard Henderson || arg_ts->state == TS_DEAD); 26005a18407fSRichard Henderson } 26015a18407fSRichard Henderson } 26025a18407fSRichard Henderson 26035a18407fSRichard Henderson /* Outputs become available. */ 26045a18407fSRichard Henderson for (i = 0; i < nb_oargs; i++) { 2605b83eabeaSRichard Henderson arg_ts = arg_temp(op->args[i]); 2606b83eabeaSRichard Henderson dir_ts = arg_ts->state_ptr; 2607b83eabeaSRichard Henderson if (!dir_ts) { 26085a18407fSRichard Henderson continue; 26095a18407fSRichard Henderson } 2610b83eabeaSRichard Henderson op->args[i] = temp_arg(dir_ts); 26115a18407fSRichard Henderson changes = true; 26125a18407fSRichard Henderson 26135a18407fSRichard Henderson /* The output is now live and modified. */ 2614b83eabeaSRichard Henderson arg_ts->state = 0; 26155a18407fSRichard Henderson 26165a18407fSRichard Henderson /* Sync outputs upon their last write. */ 26175a18407fSRichard Henderson if (NEED_SYNC_ARG(i)) { 2618b83eabeaSRichard Henderson TCGOpcode sopc = (arg_ts->type == TCG_TYPE_I32 26195a18407fSRichard Henderson ? INDEX_op_st_i32 26205a18407fSRichard Henderson : INDEX_op_st_i64); 26215a18407fSRichard Henderson TCGOp *sop = tcg_op_insert_after(s, op, sopc, 3); 26225a18407fSRichard Henderson 2623b83eabeaSRichard Henderson sop->args[0] = temp_arg(dir_ts); 2624b83eabeaSRichard Henderson sop->args[1] = temp_arg(arg_ts->mem_base); 2625b83eabeaSRichard Henderson sop->args[2] = arg_ts->mem_offset; 26265a18407fSRichard Henderson 2627b83eabeaSRichard Henderson arg_ts->state = TS_MEM; 26285a18407fSRichard Henderson } 26295a18407fSRichard Henderson /* Drop outputs that are dead. 
*/ 26305a18407fSRichard Henderson if (IS_DEAD_ARG(i)) { 2631b83eabeaSRichard Henderson arg_ts->state = TS_DEAD; 26325a18407fSRichard Henderson } 26335a18407fSRichard Henderson } 26345a18407fSRichard Henderson } 26355a18407fSRichard Henderson 26365a18407fSRichard Henderson return changes; 26375a18407fSRichard Henderson } 26385a18407fSRichard Henderson 26398d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 2640c896fe29Sbellard static void dump_regs(TCGContext *s) 2641c896fe29Sbellard { 2642c896fe29Sbellard TCGTemp *ts; 2643c896fe29Sbellard int i; 2644c896fe29Sbellard char buf[64]; 2645c896fe29Sbellard 2646c896fe29Sbellard for(i = 0; i < s->nb_temps; i++) { 2647c896fe29Sbellard ts = &s->temps[i]; 264843439139SRichard Henderson printf(" %10s: ", tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2649c896fe29Sbellard switch(ts->val_type) { 2650c896fe29Sbellard case TEMP_VAL_REG: 2651c896fe29Sbellard printf("%s", tcg_target_reg_names[ts->reg]); 2652c896fe29Sbellard break; 2653c896fe29Sbellard case TEMP_VAL_MEM: 2654b3a62939SRichard Henderson printf("%d(%s)", (int)ts->mem_offset, 2655b3a62939SRichard Henderson tcg_target_reg_names[ts->mem_base->reg]); 2656c896fe29Sbellard break; 2657c896fe29Sbellard case TEMP_VAL_CONST: 2658c896fe29Sbellard printf("$0x%" TCG_PRIlx, ts->val); 2659c896fe29Sbellard break; 2660c896fe29Sbellard case TEMP_VAL_DEAD: 2661c896fe29Sbellard printf("D"); 2662c896fe29Sbellard break; 2663c896fe29Sbellard default: 2664c896fe29Sbellard printf("???"); 2665c896fe29Sbellard break; 2666c896fe29Sbellard } 2667c896fe29Sbellard printf("\n"); 2668c896fe29Sbellard } 2669c896fe29Sbellard 2670c896fe29Sbellard for(i = 0; i < TCG_TARGET_NB_REGS; i++) { 2671f8b2f202SRichard Henderson if (s->reg_to_temp[i] != NULL) { 2672c896fe29Sbellard printf("%s: %s\n", 2673c896fe29Sbellard tcg_target_reg_names[i], 2674f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), s->reg_to_temp[i])); 2675c896fe29Sbellard } 2676c896fe29Sbellard } 2677c896fe29Sbellard } 
2678c896fe29Sbellard 2679c896fe29Sbellard static void check_regs(TCGContext *s) 2680c896fe29Sbellard { 2681869938aeSRichard Henderson int reg; 2682b6638662SRichard Henderson int k; 2683c896fe29Sbellard TCGTemp *ts; 2684c896fe29Sbellard char buf[64]; 2685c896fe29Sbellard 2686c896fe29Sbellard for (reg = 0; reg < TCG_TARGET_NB_REGS; reg++) { 2687f8b2f202SRichard Henderson ts = s->reg_to_temp[reg]; 2688f8b2f202SRichard Henderson if (ts != NULL) { 2689f8b2f202SRichard Henderson if (ts->val_type != TEMP_VAL_REG || ts->reg != reg) { 2690c896fe29Sbellard printf("Inconsistency for register %s:\n", 2691c896fe29Sbellard tcg_target_reg_names[reg]); 2692b03cce8eSbellard goto fail; 2693c896fe29Sbellard } 2694c896fe29Sbellard } 2695c896fe29Sbellard } 2696c896fe29Sbellard for (k = 0; k < s->nb_temps; k++) { 2697c896fe29Sbellard ts = &s->temps[k]; 2698f8b2f202SRichard Henderson if (ts->val_type == TEMP_VAL_REG && !ts->fixed_reg 2699f8b2f202SRichard Henderson && s->reg_to_temp[ts->reg] != ts) { 2700c896fe29Sbellard printf("Inconsistency for temp %s:\n", 2701f8b2f202SRichard Henderson tcg_get_arg_str_ptr(s, buf, sizeof(buf), ts)); 2702b03cce8eSbellard fail: 2703c896fe29Sbellard printf("reg state:\n"); 2704c896fe29Sbellard dump_regs(s); 2705c896fe29Sbellard tcg_abort(); 2706c896fe29Sbellard } 2707c896fe29Sbellard } 2708c896fe29Sbellard } 2709c896fe29Sbellard #endif 2710c896fe29Sbellard 27112272e4a7SRichard Henderson static void temp_allocate_frame(TCGContext *s, TCGTemp *ts) 2712c896fe29Sbellard { 27139b9c37c3SRichard Henderson #if !(defined(__sparc__) && TCG_TARGET_REG_BITS == 64) 27149b9c37c3SRichard Henderson /* Sparc64 stack is accessed with offset of 2047 */ 2715b591dc59SBlue Swirl s->current_frame_offset = (s->current_frame_offset + 2716b591dc59SBlue Swirl (tcg_target_long)sizeof(tcg_target_long) - 1) & 2717b591dc59SBlue Swirl ~(sizeof(tcg_target_long) - 1); 2718f44c9960SBlue Swirl #endif 2719b591dc59SBlue Swirl if (s->current_frame_offset + 
(tcg_target_long)sizeof(tcg_target_long) > 2720b591dc59SBlue Swirl s->frame_end) { 27215ff9d6a4Sbellard tcg_abort(); 2722b591dc59SBlue Swirl } 2723c896fe29Sbellard ts->mem_offset = s->current_frame_offset; 2724b3a62939SRichard Henderson ts->mem_base = s->frame_temp; 2725c896fe29Sbellard ts->mem_allocated = 1; 2726e2c6d1b4SRichard Henderson s->current_frame_offset += sizeof(tcg_target_long); 2727c896fe29Sbellard } 2728c896fe29Sbellard 2729b3915dbbSRichard Henderson static void temp_load(TCGContext *, TCGTemp *, TCGRegSet, TCGRegSet); 2730b3915dbbSRichard Henderson 273159d7c14eSRichard Henderson /* Mark a temporary as free or dead. If 'free_or_dead' is negative, 273259d7c14eSRichard Henderson mark it free; otherwise mark it dead. */ 273359d7c14eSRichard Henderson static void temp_free_or_dead(TCGContext *s, TCGTemp *ts, int free_or_dead) 2734c896fe29Sbellard { 273559d7c14eSRichard Henderson if (ts->fixed_reg) { 273659d7c14eSRichard Henderson return; 273759d7c14eSRichard Henderson } 273859d7c14eSRichard Henderson if (ts->val_type == TEMP_VAL_REG) { 273959d7c14eSRichard Henderson s->reg_to_temp[ts->reg] = NULL; 274059d7c14eSRichard Henderson } 274159d7c14eSRichard Henderson ts->val_type = (free_or_dead < 0 274259d7c14eSRichard Henderson || ts->temp_local 2743fa477d25SRichard Henderson || ts->temp_global 274459d7c14eSRichard Henderson ? TEMP_VAL_MEM : TEMP_VAL_DEAD); 274559d7c14eSRichard Henderson } 2746c896fe29Sbellard 274759d7c14eSRichard Henderson /* Mark a temporary as dead. */ 274859d7c14eSRichard Henderson static inline void temp_dead(TCGContext *s, TCGTemp *ts) 274959d7c14eSRichard Henderson { 275059d7c14eSRichard Henderson temp_free_or_dead(s, ts, 1); 275159d7c14eSRichard Henderson } 275259d7c14eSRichard Henderson 275359d7c14eSRichard Henderson /* Sync a temporary to memory. 'allocated_regs' is used in case a temporary 275459d7c14eSRichard Henderson registers needs to be allocated to store a constant. 
If 'free_or_dead' 275559d7c14eSRichard Henderson is non-zero, subsequently release the temporary; if it is positive, the 275659d7c14eSRichard Henderson temp is dead; if it is negative, the temp is free. */ 275759d7c14eSRichard Henderson static void temp_sync(TCGContext *s, TCGTemp *ts, 275859d7c14eSRichard Henderson TCGRegSet allocated_regs, int free_or_dead) 275959d7c14eSRichard Henderson { 276059d7c14eSRichard Henderson if (ts->fixed_reg) { 276159d7c14eSRichard Henderson return; 276259d7c14eSRichard Henderson } 276359d7c14eSRichard Henderson if (!ts->mem_coherent) { 27647f6ceedfSAurelien Jarno if (!ts->mem_allocated) { 27652272e4a7SRichard Henderson temp_allocate_frame(s, ts); 276659d7c14eSRichard Henderson } 276759d7c14eSRichard Henderson switch (ts->val_type) { 276859d7c14eSRichard Henderson case TEMP_VAL_CONST: 276959d7c14eSRichard Henderson /* If we're going to free the temp immediately, then we won't 277059d7c14eSRichard Henderson require it later in a register, so attempt to store the 277159d7c14eSRichard Henderson constant to memory directly. 
*/ 277259d7c14eSRichard Henderson if (free_or_dead 277359d7c14eSRichard Henderson && tcg_out_sti(s, ts->type, ts->val, 277459d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset)) { 277559d7c14eSRichard Henderson break; 277659d7c14eSRichard Henderson } 277759d7c14eSRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 277859d7c14eSRichard Henderson allocated_regs); 277959d7c14eSRichard Henderson /* fallthrough */ 278059d7c14eSRichard Henderson 278159d7c14eSRichard Henderson case TEMP_VAL_REG: 278259d7c14eSRichard Henderson tcg_out_st(s, ts->type, ts->reg, 278359d7c14eSRichard Henderson ts->mem_base->reg, ts->mem_offset); 278459d7c14eSRichard Henderson break; 278559d7c14eSRichard Henderson 278659d7c14eSRichard Henderson case TEMP_VAL_MEM: 278759d7c14eSRichard Henderson break; 278859d7c14eSRichard Henderson 278959d7c14eSRichard Henderson case TEMP_VAL_DEAD: 279059d7c14eSRichard Henderson default: 279159d7c14eSRichard Henderson tcg_abort(); 2792c896fe29Sbellard } 27937f6ceedfSAurelien Jarno ts->mem_coherent = 1; 27947f6ceedfSAurelien Jarno } 279559d7c14eSRichard Henderson if (free_or_dead) { 279659d7c14eSRichard Henderson temp_free_or_dead(s, ts, free_or_dead); 279759d7c14eSRichard Henderson } 279859d7c14eSRichard Henderson } 27997f6ceedfSAurelien Jarno 28007f6ceedfSAurelien Jarno /* free register 'reg' by spilling the corresponding temporary if necessary */ 2801b3915dbbSRichard Henderson static void tcg_reg_free(TCGContext *s, TCGReg reg, TCGRegSet allocated_regs) 28027f6ceedfSAurelien Jarno { 2803f8b2f202SRichard Henderson TCGTemp *ts = s->reg_to_temp[reg]; 2804f8b2f202SRichard Henderson if (ts != NULL) { 280559d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, -1); 2806c896fe29Sbellard } 2807c896fe29Sbellard } 2808c896fe29Sbellard 2809c896fe29Sbellard /* Allocate a register belonging to reg1 & ~reg2 */ 2810b3915dbbSRichard Henderson static TCGReg tcg_reg_alloc(TCGContext *s, TCGRegSet desired_regs, 281191478cefSRichard Henderson 
TCGRegSet allocated_regs, bool rev) 2812c896fe29Sbellard { 281391478cefSRichard Henderson int i, n = ARRAY_SIZE(tcg_target_reg_alloc_order); 281491478cefSRichard Henderson const int *order; 2815b6638662SRichard Henderson TCGReg reg; 2816c896fe29Sbellard TCGRegSet reg_ct; 2817c896fe29Sbellard 281807ddf036SRichard Henderson reg_ct = desired_regs & ~allocated_regs; 281991478cefSRichard Henderson order = rev ? indirect_reg_alloc_order : tcg_target_reg_alloc_order; 2820c896fe29Sbellard 2821c896fe29Sbellard /* first try free registers */ 282291478cefSRichard Henderson for(i = 0; i < n; i++) { 282391478cefSRichard Henderson reg = order[i]; 2824f8b2f202SRichard Henderson if (tcg_regset_test_reg(reg_ct, reg) && s->reg_to_temp[reg] == NULL) 2825c896fe29Sbellard return reg; 2826c896fe29Sbellard } 2827c896fe29Sbellard 2828c896fe29Sbellard /* XXX: do better spill choice */ 282991478cefSRichard Henderson for(i = 0; i < n; i++) { 283091478cefSRichard Henderson reg = order[i]; 2831c896fe29Sbellard if (tcg_regset_test_reg(reg_ct, reg)) { 2832b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 2833c896fe29Sbellard return reg; 2834c896fe29Sbellard } 2835c896fe29Sbellard } 2836c896fe29Sbellard 2837c896fe29Sbellard tcg_abort(); 2838c896fe29Sbellard } 2839c896fe29Sbellard 284040ae5c62SRichard Henderson /* Make sure the temporary is in a register. If needed, allocate the register 284140ae5c62SRichard Henderson from DESIRED while avoiding ALLOCATED. 
*/ 284240ae5c62SRichard Henderson static void temp_load(TCGContext *s, TCGTemp *ts, TCGRegSet desired_regs, 284340ae5c62SRichard Henderson TCGRegSet allocated_regs) 284440ae5c62SRichard Henderson { 284540ae5c62SRichard Henderson TCGReg reg; 284640ae5c62SRichard Henderson 284740ae5c62SRichard Henderson switch (ts->val_type) { 284840ae5c62SRichard Henderson case TEMP_VAL_REG: 284940ae5c62SRichard Henderson return; 285040ae5c62SRichard Henderson case TEMP_VAL_CONST: 285191478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 285240ae5c62SRichard Henderson tcg_out_movi(s, ts->type, reg, ts->val); 285340ae5c62SRichard Henderson ts->mem_coherent = 0; 285440ae5c62SRichard Henderson break; 285540ae5c62SRichard Henderson case TEMP_VAL_MEM: 285691478cefSRichard Henderson reg = tcg_reg_alloc(s, desired_regs, allocated_regs, ts->indirect_base); 285740ae5c62SRichard Henderson tcg_out_ld(s, ts->type, reg, ts->mem_base->reg, ts->mem_offset); 285840ae5c62SRichard Henderson ts->mem_coherent = 1; 285940ae5c62SRichard Henderson break; 286040ae5c62SRichard Henderson case TEMP_VAL_DEAD: 286140ae5c62SRichard Henderson default: 286240ae5c62SRichard Henderson tcg_abort(); 286340ae5c62SRichard Henderson } 286440ae5c62SRichard Henderson ts->reg = reg; 286540ae5c62SRichard Henderson ts->val_type = TEMP_VAL_REG; 286640ae5c62SRichard Henderson s->reg_to_temp[reg] = ts; 286740ae5c62SRichard Henderson } 286840ae5c62SRichard Henderson 286959d7c14eSRichard Henderson /* Save a temporary to memory. 'allocated_regs' is used in case a 2870e8996ee0Sbellard temporary registers needs to be allocated to store a constant. */ 287159d7c14eSRichard Henderson static void temp_save(TCGContext *s, TCGTemp *ts, TCGRegSet allocated_regs) 28721ad80729SAurelien Jarno { 28732c0366f0SAurelien Jarno /* The liveness analysis already ensures that globals are back 2874eabb7b91SAurelien Jarno in memory. Keep an tcg_debug_assert for safety. 
*/ 2875f8bf00f1SRichard Henderson tcg_debug_assert(ts->val_type == TEMP_VAL_MEM || ts->fixed_reg); 28761ad80729SAurelien Jarno } 28771ad80729SAurelien Jarno 28789814dd27SDong Xu Wang /* save globals to their canonical location and assume they can be 2879641d5fbeSbellard modified be the following code. 'allocated_regs' is used in case a 2880641d5fbeSbellard temporary registers needs to be allocated to store a constant. */ 2881641d5fbeSbellard static void save_globals(TCGContext *s, TCGRegSet allocated_regs) 2882641d5fbeSbellard { 2883ac3b8891SRichard Henderson int i, n; 2884641d5fbeSbellard 2885ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 2886b13eb728SRichard Henderson temp_save(s, &s->temps[i], allocated_regs); 2887641d5fbeSbellard } 2888e5097dc8Sbellard } 2889e5097dc8Sbellard 28903d5c5f87SAurelien Jarno /* sync globals to their canonical location and assume they can be 28913d5c5f87SAurelien Jarno read by the following code. 'allocated_regs' is used in case a 28923d5c5f87SAurelien Jarno temporary registers needs to be allocated to store a constant. */ 28933d5c5f87SAurelien Jarno static void sync_globals(TCGContext *s, TCGRegSet allocated_regs) 28943d5c5f87SAurelien Jarno { 2895ac3b8891SRichard Henderson int i, n; 28963d5c5f87SAurelien Jarno 2897ac3b8891SRichard Henderson for (i = 0, n = s->nb_globals; i < n; i++) { 289812b9b11aSRichard Henderson TCGTemp *ts = &s->temps[i]; 289912b9b11aSRichard Henderson tcg_debug_assert(ts->val_type != TEMP_VAL_REG 290012b9b11aSRichard Henderson || ts->fixed_reg 290112b9b11aSRichard Henderson || ts->mem_coherent); 29023d5c5f87SAurelien Jarno } 29033d5c5f87SAurelien Jarno } 29043d5c5f87SAurelien Jarno 2905e5097dc8Sbellard /* at the end of a basic block, we assume all temporaries are dead and 2906e8996ee0Sbellard all globals are stored at their canonical location. 
*/ 2907e8996ee0Sbellard static void tcg_reg_alloc_bb_end(TCGContext *s, TCGRegSet allocated_regs) 2908e5097dc8Sbellard { 2909e5097dc8Sbellard int i; 2910e5097dc8Sbellard 2911c896fe29Sbellard for (i = s->nb_globals; i < s->nb_temps; i++) { 2912b13eb728SRichard Henderson TCGTemp *ts = &s->temps[i]; 2913641d5fbeSbellard if (ts->temp_local) { 2914b13eb728SRichard Henderson temp_save(s, ts, allocated_regs); 2915641d5fbeSbellard } else { 29162c0366f0SAurelien Jarno /* The liveness analysis already ensures that temps are dead. 2917eabb7b91SAurelien Jarno Keep an tcg_debug_assert for safety. */ 2918eabb7b91SAurelien Jarno tcg_debug_assert(ts->val_type == TEMP_VAL_DEAD); 2919c896fe29Sbellard } 2920641d5fbeSbellard } 2921e8996ee0Sbellard 2922e8996ee0Sbellard save_globals(s, allocated_regs); 2923c896fe29Sbellard } 2924c896fe29Sbellard 29250fe4fca4SPaolo Bonzini static void tcg_reg_alloc_do_movi(TCGContext *s, TCGTemp *ots, 29260fe4fca4SPaolo Bonzini tcg_target_ulong val, TCGLifeData arg_life) 2927e8996ee0Sbellard { 2928e8996ee0Sbellard if (ots->fixed_reg) { 292959d7c14eSRichard Henderson /* For fixed registers, we do not do any constant propagation. */ 2930e8996ee0Sbellard tcg_out_movi(s, ots->type, ots->reg, val); 293159d7c14eSRichard Henderson return; 293259d7c14eSRichard Henderson } 293359d7c14eSRichard Henderson 293459d7c14eSRichard Henderson /* The movi is not explicitly generated here. 
*/ 2935f8b2f202SRichard Henderson if (ots->val_type == TEMP_VAL_REG) { 2936f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 2937f8b2f202SRichard Henderson } 2938e8996ee0Sbellard ots->val_type = TEMP_VAL_CONST; 2939e8996ee0Sbellard ots->val = val; 294059d7c14eSRichard Henderson ots->mem_coherent = 0; 2941ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 294259d7c14eSRichard Henderson temp_sync(s, ots, s->reserved_regs, IS_DEAD_ARG(0)); 294359d7c14eSRichard Henderson } else if (IS_DEAD_ARG(0)) { 2944f8bf00f1SRichard Henderson temp_dead(s, ots); 29454c4e1ab2SAurelien Jarno } 2946e8996ee0Sbellard } 2947e8996ee0Sbellard 2948dd186292SRichard Henderson static void tcg_reg_alloc_movi(TCGContext *s, const TCGOp *op) 29490fe4fca4SPaolo Bonzini { 295043439139SRichard Henderson TCGTemp *ots = arg_temp(op->args[0]); 2951dd186292SRichard Henderson tcg_target_ulong val = op->args[1]; 29520fe4fca4SPaolo Bonzini 2953dd186292SRichard Henderson tcg_reg_alloc_do_movi(s, ots, val, op->life); 29540fe4fca4SPaolo Bonzini } 29550fe4fca4SPaolo Bonzini 2956dd186292SRichard Henderson static void tcg_reg_alloc_mov(TCGContext *s, const TCGOp *op) 2957c896fe29Sbellard { 2958dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 2959c29c1d7eSAurelien Jarno TCGRegSet allocated_regs; 2960c896fe29Sbellard TCGTemp *ts, *ots; 2961450445d5SRichard Henderson TCGType otype, itype; 2962c896fe29Sbellard 2963d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 296443439139SRichard Henderson ots = arg_temp(op->args[0]); 296543439139SRichard Henderson ts = arg_temp(op->args[1]); 2966450445d5SRichard Henderson 2967450445d5SRichard Henderson /* Note that otype != itype for no-op truncation. 
*/ 2968450445d5SRichard Henderson otype = ots->type; 2969450445d5SRichard Henderson itype = ts->type; 2970c896fe29Sbellard 29710fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_CONST) { 29720fe4fca4SPaolo Bonzini /* propagate constant or generate sti */ 29730fe4fca4SPaolo Bonzini tcg_target_ulong val = ts->val; 29740fe4fca4SPaolo Bonzini if (IS_DEAD_ARG(1)) { 29750fe4fca4SPaolo Bonzini temp_dead(s, ts); 29760fe4fca4SPaolo Bonzini } 29770fe4fca4SPaolo Bonzini tcg_reg_alloc_do_movi(s, ots, val, arg_life); 29780fe4fca4SPaolo Bonzini return; 29790fe4fca4SPaolo Bonzini } 29800fe4fca4SPaolo Bonzini 29810fe4fca4SPaolo Bonzini /* If the source value is in memory we're going to be forced 29820fe4fca4SPaolo Bonzini to have it in a register in order to perform the copy. Copy 29830fe4fca4SPaolo Bonzini the SOURCE value into its own register first, that way we 29840fe4fca4SPaolo Bonzini don't have to reload SOURCE the next time it is used. */ 29850fe4fca4SPaolo Bonzini if (ts->val_type == TEMP_VAL_MEM) { 298640ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[itype], allocated_regs); 2987c29c1d7eSAurelien Jarno } 2988c29c1d7eSAurelien Jarno 29890fe4fca4SPaolo Bonzini tcg_debug_assert(ts->val_type == TEMP_VAL_REG); 2990c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(0) && !ots->fixed_reg) { 2991c29c1d7eSAurelien Jarno /* mov to a non-saved dead register makes no sense (even with 2992c29c1d7eSAurelien Jarno liveness analysis disabled). 
*/ 2993eabb7b91SAurelien Jarno tcg_debug_assert(NEED_SYNC_ARG(0)); 2994c29c1d7eSAurelien Jarno if (!ots->mem_allocated) { 29952272e4a7SRichard Henderson temp_allocate_frame(s, ots); 2996c29c1d7eSAurelien Jarno } 2997b3a62939SRichard Henderson tcg_out_st(s, otype, ts->reg, ots->mem_base->reg, ots->mem_offset); 2998c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1)) { 2999f8bf00f1SRichard Henderson temp_dead(s, ts); 3000c29c1d7eSAurelien Jarno } 3001f8bf00f1SRichard Henderson temp_dead(s, ots); 3002e8996ee0Sbellard } else { 3003c29c1d7eSAurelien Jarno if (IS_DEAD_ARG(1) && !ts->fixed_reg && !ots->fixed_reg) { 3004c29c1d7eSAurelien Jarno /* the mov can be suppressed */ 3005c29c1d7eSAurelien Jarno if (ots->val_type == TEMP_VAL_REG) { 3006f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = NULL; 3007c896fe29Sbellard } 3008c29c1d7eSAurelien Jarno ots->reg = ts->reg; 3009f8bf00f1SRichard Henderson temp_dead(s, ts); 3010c29c1d7eSAurelien Jarno } else { 3011c29c1d7eSAurelien Jarno if (ots->val_type != TEMP_VAL_REG) { 3012c29c1d7eSAurelien Jarno /* When allocating a new register, make sure to not spill the 3013c29c1d7eSAurelien Jarno input one. 
*/ 3014c29c1d7eSAurelien Jarno tcg_regset_set_reg(allocated_regs, ts->reg); 3015450445d5SRichard Henderson ots->reg = tcg_reg_alloc(s, tcg_target_available_regs[otype], 301691478cefSRichard Henderson allocated_regs, ots->indirect_base); 3017c29c1d7eSAurelien Jarno } 3018450445d5SRichard Henderson tcg_out_mov(s, otype, ots->reg, ts->reg); 3019c29c1d7eSAurelien Jarno } 3020c896fe29Sbellard ots->val_type = TEMP_VAL_REG; 3021c896fe29Sbellard ots->mem_coherent = 0; 3022f8b2f202SRichard Henderson s->reg_to_temp[ots->reg] = ots; 3023ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(0)) { 302459d7c14eSRichard Henderson temp_sync(s, ots, allocated_regs, 0); 3025c29c1d7eSAurelien Jarno } 3026ec7a869dSAurelien Jarno } 3027c896fe29Sbellard } 3028c896fe29Sbellard 3029dd186292SRichard Henderson static void tcg_reg_alloc_op(TCGContext *s, const TCGOp *op) 3030c896fe29Sbellard { 3031dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3032dd186292SRichard Henderson const TCGOpDef * const def = &tcg_op_defs[op->opc]; 303382790a87SRichard Henderson TCGRegSet i_allocated_regs; 303482790a87SRichard Henderson TCGRegSet o_allocated_regs; 3035b6638662SRichard Henderson int i, k, nb_iargs, nb_oargs; 3036b6638662SRichard Henderson TCGReg reg; 3037c896fe29Sbellard TCGArg arg; 3038c896fe29Sbellard const TCGArgConstraint *arg_ct; 3039c896fe29Sbellard TCGTemp *ts; 3040c896fe29Sbellard TCGArg new_args[TCG_MAX_OP_ARGS]; 3041c896fe29Sbellard int const_args[TCG_MAX_OP_ARGS]; 3042c896fe29Sbellard 3043c896fe29Sbellard nb_oargs = def->nb_oargs; 3044c896fe29Sbellard nb_iargs = def->nb_iargs; 3045c896fe29Sbellard 3046c896fe29Sbellard /* copy constants */ 3047c896fe29Sbellard memcpy(new_args + nb_oargs + nb_iargs, 3048dd186292SRichard Henderson op->args + nb_oargs + nb_iargs, 3049c896fe29Sbellard sizeof(TCGArg) * def->nb_cargs); 3050c896fe29Sbellard 3051d21369f5SRichard Henderson i_allocated_regs = s->reserved_regs; 3052d21369f5SRichard Henderson o_allocated_regs = s->reserved_regs; 
305382790a87SRichard Henderson 3054c896fe29Sbellard /* satisfy input constraints */ 3055c896fe29Sbellard for (k = 0; k < nb_iargs; k++) { 3056c896fe29Sbellard i = def->sorted_args[nb_oargs + k]; 3057dd186292SRichard Henderson arg = op->args[i]; 3058c896fe29Sbellard arg_ct = &def->args_ct[i]; 305943439139SRichard Henderson ts = arg_temp(arg); 306040ae5c62SRichard Henderson 306140ae5c62SRichard Henderson if (ts->val_type == TEMP_VAL_CONST 306240ae5c62SRichard Henderson && tcg_target_const_match(ts->val, ts->type, arg_ct)) { 3063c896fe29Sbellard /* constant is OK for instruction */ 3064c896fe29Sbellard const_args[i] = 1; 3065c896fe29Sbellard new_args[i] = ts->val; 3066c896fe29Sbellard goto iarg_end; 3067c896fe29Sbellard } 306840ae5c62SRichard Henderson 306982790a87SRichard Henderson temp_load(s, ts, arg_ct->u.regs, i_allocated_regs); 307040ae5c62SRichard Henderson 30715ff9d6a4Sbellard if (arg_ct->ct & TCG_CT_IALIAS) { 30725ff9d6a4Sbellard if (ts->fixed_reg) { 30735ff9d6a4Sbellard /* if fixed register, we must allocate a new register 30745ff9d6a4Sbellard if the alias is not the same register */ 3075dd186292SRichard Henderson if (arg != op->args[arg_ct->alias_index]) 30765ff9d6a4Sbellard goto allocate_in_reg; 30775ff9d6a4Sbellard } else { 3078c896fe29Sbellard /* if the input is aliased to an output and if it is 3079c896fe29Sbellard not dead after the instruction, we must allocate 3080c896fe29Sbellard a new register and move it */ 3081866cb6cbSAurelien Jarno if (!IS_DEAD_ARG(i)) { 3082c896fe29Sbellard goto allocate_in_reg; 3083c896fe29Sbellard } 30847e1df267SAurelien Jarno /* check if the current register has already been allocated 30857e1df267SAurelien Jarno for another input aliased to an output */ 30867e1df267SAurelien Jarno int k2, i2; 30877e1df267SAurelien Jarno for (k2 = 0 ; k2 < k ; k2++) { 30887e1df267SAurelien Jarno i2 = def->sorted_args[nb_oargs + k2]; 30897e1df267SAurelien Jarno if ((def->args_ct[i2].ct & TCG_CT_IALIAS) && 30907e1df267SAurelien Jarno 
(new_args[i2] == ts->reg)) { 30917e1df267SAurelien Jarno goto allocate_in_reg; 30927e1df267SAurelien Jarno } 30937e1df267SAurelien Jarno } 30945ff9d6a4Sbellard } 3095866cb6cbSAurelien Jarno } 3096c896fe29Sbellard reg = ts->reg; 3097c896fe29Sbellard if (tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3098c896fe29Sbellard /* nothing to do : the constraint is satisfied */ 3099c896fe29Sbellard } else { 3100c896fe29Sbellard allocate_in_reg: 3101c896fe29Sbellard /* allocate a new register matching the constraint 3102c896fe29Sbellard and move the temporary register into it */ 310382790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, i_allocated_regs, 310491478cefSRichard Henderson ts->indirect_base); 31053b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3106c896fe29Sbellard } 3107c896fe29Sbellard new_args[i] = reg; 3108c896fe29Sbellard const_args[i] = 0; 310982790a87SRichard Henderson tcg_regset_set_reg(i_allocated_regs, reg); 3110c896fe29Sbellard iarg_end: ; 3111c896fe29Sbellard } 3112c896fe29Sbellard 3113c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 3114866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_oargs + nb_iargs; i++) { 3115866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 311643439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3117c896fe29Sbellard } 3118c896fe29Sbellard } 3119c896fe29Sbellard 3120a52ad07eSAurelien Jarno if (def->flags & TCG_OPF_BB_END) { 312182790a87SRichard Henderson tcg_reg_alloc_bb_end(s, i_allocated_regs); 3122a52ad07eSAurelien Jarno } else { 3123c896fe29Sbellard if (def->flags & TCG_OPF_CALL_CLOBBER) { 3124b03cce8eSbellard /* XXX: permit generic clobber register list ? 
*/ 3125c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3126c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 312782790a87SRichard Henderson tcg_reg_free(s, i, i_allocated_regs); 3128c896fe29Sbellard } 3129c896fe29Sbellard } 31303d5c5f87SAurelien Jarno } 31313d5c5f87SAurelien Jarno if (def->flags & TCG_OPF_SIDE_EFFECTS) { 31323d5c5f87SAurelien Jarno /* sync globals if the op has side effects and might trigger 31333d5c5f87SAurelien Jarno an exception. */ 313482790a87SRichard Henderson sync_globals(s, i_allocated_regs); 3135c896fe29Sbellard } 3136c896fe29Sbellard 3137c896fe29Sbellard /* satisfy the output constraints */ 3138c896fe29Sbellard for(k = 0; k < nb_oargs; k++) { 3139c896fe29Sbellard i = def->sorted_args[k]; 3140dd186292SRichard Henderson arg = op->args[i]; 3141c896fe29Sbellard arg_ct = &def->args_ct[i]; 314243439139SRichard Henderson ts = arg_temp(arg); 314317280ff4SRichard Henderson if ((arg_ct->ct & TCG_CT_ALIAS) 314417280ff4SRichard Henderson && !const_args[arg_ct->alias_index]) { 31455ff9d6a4Sbellard reg = new_args[arg_ct->alias_index]; 314682790a87SRichard Henderson } else if (arg_ct->ct & TCG_CT_NEWREG) { 314782790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, 314882790a87SRichard Henderson i_allocated_regs | o_allocated_regs, 314982790a87SRichard Henderson ts->indirect_base); 3150c896fe29Sbellard } else { 3151c896fe29Sbellard /* if fixed register, we try to use it */ 3152c896fe29Sbellard reg = ts->reg; 3153c896fe29Sbellard if (ts->fixed_reg && 3154c896fe29Sbellard tcg_regset_test_reg(arg_ct->u.regs, reg)) { 3155c896fe29Sbellard goto oarg_end; 3156c896fe29Sbellard } 315782790a87SRichard Henderson reg = tcg_reg_alloc(s, arg_ct->u.regs, o_allocated_regs, 315891478cefSRichard Henderson ts->indirect_base); 3159c896fe29Sbellard } 316082790a87SRichard Henderson tcg_regset_set_reg(o_allocated_regs, reg); 3161c896fe29Sbellard /* if a fixed register is used, then a move will be done 
afterwards */ 3162c896fe29Sbellard if (!ts->fixed_reg) { 3163639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3164f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3165639368ddSAurelien Jarno } 3166c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3167c896fe29Sbellard ts->reg = reg; 3168c896fe29Sbellard /* temp value is modified, so the value kept in memory is 3169c896fe29Sbellard potentially not the same */ 3170c896fe29Sbellard ts->mem_coherent = 0; 3171f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3172c896fe29Sbellard } 3173c896fe29Sbellard oarg_end: 3174c896fe29Sbellard new_args[i] = reg; 3175c896fe29Sbellard } 3176e8996ee0Sbellard } 3177c896fe29Sbellard 3178c896fe29Sbellard /* emit instruction */ 3179d2fd745fSRichard Henderson if (def->flags & TCG_OPF_VECTOR) { 3180d2fd745fSRichard Henderson tcg_out_vec_op(s, op->opc, TCGOP_VECL(op), TCGOP_VECE(op), 3181d2fd745fSRichard Henderson new_args, const_args); 3182d2fd745fSRichard Henderson } else { 3183dd186292SRichard Henderson tcg_out_op(s, op->opc, new_args, const_args); 3184d2fd745fSRichard Henderson } 3185c896fe29Sbellard 3186c896fe29Sbellard /* move the outputs in the correct register if needed */ 3187c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 318843439139SRichard Henderson ts = arg_temp(op->args[i]); 3189c896fe29Sbellard reg = new_args[i]; 3190c896fe29Sbellard if (ts->fixed_reg && ts->reg != reg) { 31913b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3192c896fe29Sbellard } 3193ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 319482790a87SRichard Henderson temp_sync(s, ts, o_allocated_regs, IS_DEAD_ARG(i)); 319559d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3196f8bf00f1SRichard Henderson temp_dead(s, ts); 3197ec7a869dSAurelien Jarno } 3198c896fe29Sbellard } 3199c896fe29Sbellard } 3200c896fe29Sbellard 3201b03cce8eSbellard #ifdef TCG_TARGET_STACK_GROWSUP 3202b03cce8eSbellard #define STACK_DIR(x) (-(x)) 3203b03cce8eSbellard #else 3204b03cce8eSbellard #define 
STACK_DIR(x) (x) 3205b03cce8eSbellard #endif 3206b03cce8eSbellard 3207dd186292SRichard Henderson static void tcg_reg_alloc_call(TCGContext *s, TCGOp *op) 3208c896fe29Sbellard { 3209cd9090aaSRichard Henderson const int nb_oargs = TCGOP_CALLO(op); 3210cd9090aaSRichard Henderson const int nb_iargs = TCGOP_CALLI(op); 3211dd186292SRichard Henderson const TCGLifeData arg_life = op->life; 3212b6638662SRichard Henderson int flags, nb_regs, i; 3213b6638662SRichard Henderson TCGReg reg; 3214cf066674SRichard Henderson TCGArg arg; 3215c896fe29Sbellard TCGTemp *ts; 3216d3452f1fSRichard Henderson intptr_t stack_offset; 3217d3452f1fSRichard Henderson size_t call_stack_size; 3218cf066674SRichard Henderson tcg_insn_unit *func_addr; 3219cf066674SRichard Henderson int allocate_args; 3220c896fe29Sbellard TCGRegSet allocated_regs; 3221c896fe29Sbellard 3222dd186292SRichard Henderson func_addr = (tcg_insn_unit *)(intptr_t)op->args[nb_oargs + nb_iargs]; 3223dd186292SRichard Henderson flags = op->args[nb_oargs + nb_iargs + 1]; 3224c896fe29Sbellard 32256e17d0c5SStefan Weil nb_regs = ARRAY_SIZE(tcg_target_call_iarg_regs); 3226c45cb8bbSRichard Henderson if (nb_regs > nb_iargs) { 3227c45cb8bbSRichard Henderson nb_regs = nb_iargs; 3228cf066674SRichard Henderson } 3229c896fe29Sbellard 3230c896fe29Sbellard /* assign stack slots first */ 3231c45cb8bbSRichard Henderson call_stack_size = (nb_iargs - nb_regs) * sizeof(tcg_target_long); 3232c896fe29Sbellard call_stack_size = (call_stack_size + TCG_TARGET_STACK_ALIGN - 1) & 3233c896fe29Sbellard ~(TCG_TARGET_STACK_ALIGN - 1); 3234b03cce8eSbellard allocate_args = (call_stack_size > TCG_STATIC_CALL_ARGS_SIZE); 3235b03cce8eSbellard if (allocate_args) { 3236345649c0SBlue Swirl /* XXX: if more than TCG_STATIC_CALL_ARGS_SIZE is needed, 3237345649c0SBlue Swirl preallocate call stack */ 3238345649c0SBlue Swirl tcg_abort(); 3239b03cce8eSbellard } 324039cf05d3Sbellard 324139cf05d3Sbellard stack_offset = TCG_TARGET_CALL_STACK_OFFSET; 3242c45cb8bbSRichard Henderson 
for (i = nb_regs; i < nb_iargs; i++) { 3243dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 324439cf05d3Sbellard #ifdef TCG_TARGET_STACK_GROWSUP 324539cf05d3Sbellard stack_offset -= sizeof(tcg_target_long); 324639cf05d3Sbellard #endif 324739cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 324843439139SRichard Henderson ts = arg_temp(arg); 324940ae5c62SRichard Henderson temp_load(s, ts, tcg_target_available_regs[ts->type], 325040ae5c62SRichard Henderson s->reserved_regs); 3251e4d5434cSblueswir1 tcg_out_st(s, ts->type, ts->reg, TCG_REG_CALL_STACK, stack_offset); 325239cf05d3Sbellard } 325339cf05d3Sbellard #ifndef TCG_TARGET_STACK_GROWSUP 325439cf05d3Sbellard stack_offset += sizeof(tcg_target_long); 325539cf05d3Sbellard #endif 3256c896fe29Sbellard } 3257c896fe29Sbellard 3258c896fe29Sbellard /* assign input registers */ 3259d21369f5SRichard Henderson allocated_regs = s->reserved_regs; 3260c896fe29Sbellard for (i = 0; i < nb_regs; i++) { 3261dd186292SRichard Henderson arg = op->args[nb_oargs + i]; 326239cf05d3Sbellard if (arg != TCG_CALL_DUMMY_ARG) { 326343439139SRichard Henderson ts = arg_temp(arg); 3264c896fe29Sbellard reg = tcg_target_call_iarg_regs[i]; 3265b3915dbbSRichard Henderson tcg_reg_free(s, reg, allocated_regs); 326640ae5c62SRichard Henderson 3267c896fe29Sbellard if (ts->val_type == TEMP_VAL_REG) { 3268c896fe29Sbellard if (ts->reg != reg) { 32693b6dac34SRichard Henderson tcg_out_mov(s, ts->type, reg, ts->reg); 3270c896fe29Sbellard } 3271c896fe29Sbellard } else { 3272ccb1bb66SRichard Henderson TCGRegSet arg_set = 0; 327340ae5c62SRichard Henderson 327440ae5c62SRichard Henderson tcg_regset_set_reg(arg_set, reg); 327540ae5c62SRichard Henderson temp_load(s, ts, arg_set, allocated_regs); 3276c896fe29Sbellard } 327740ae5c62SRichard Henderson 3278c896fe29Sbellard tcg_regset_set_reg(allocated_regs, reg); 3279c896fe29Sbellard } 328039cf05d3Sbellard } 3281c896fe29Sbellard 3282c896fe29Sbellard /* mark dead temporaries and free the associated registers */ 
3283866cb6cbSAurelien Jarno for (i = nb_oargs; i < nb_iargs + nb_oargs; i++) { 3284866cb6cbSAurelien Jarno if (IS_DEAD_ARG(i)) { 328543439139SRichard Henderson temp_dead(s, arg_temp(op->args[i])); 3286c896fe29Sbellard } 3287c896fe29Sbellard } 3288c896fe29Sbellard 3289c896fe29Sbellard /* clobber call registers */ 3290c8074023SRichard Henderson for (i = 0; i < TCG_TARGET_NB_REGS; i++) { 3291c8074023SRichard Henderson if (tcg_regset_test_reg(tcg_target_call_clobber_regs, i)) { 3292b3915dbbSRichard Henderson tcg_reg_free(s, i, allocated_regs); 3293c896fe29Sbellard } 3294c896fe29Sbellard } 3295c896fe29Sbellard 329678505279SAurelien Jarno /* Save globals if they might be written by the helper, sync them if 329778505279SAurelien Jarno they might be read. */ 329878505279SAurelien Jarno if (flags & TCG_CALL_NO_READ_GLOBALS) { 329978505279SAurelien Jarno /* Nothing to do */ 330078505279SAurelien Jarno } else if (flags & TCG_CALL_NO_WRITE_GLOBALS) { 330178505279SAurelien Jarno sync_globals(s, allocated_regs); 330278505279SAurelien Jarno } else { 3303e8996ee0Sbellard save_globals(s, allocated_regs); 3304b9c18f56Saurel32 } 3305c896fe29Sbellard 3306cf066674SRichard Henderson tcg_out_call(s, func_addr); 3307c896fe29Sbellard 3308c896fe29Sbellard /* assign output registers and emit moves if needed */ 3309c896fe29Sbellard for(i = 0; i < nb_oargs; i++) { 3310dd186292SRichard Henderson arg = op->args[i]; 331143439139SRichard Henderson ts = arg_temp(arg); 3312c896fe29Sbellard reg = tcg_target_call_oarg_regs[i]; 3313eabb7b91SAurelien Jarno tcg_debug_assert(s->reg_to_temp[reg] == NULL); 331434b1a49cSRichard Henderson 3315c896fe29Sbellard if (ts->fixed_reg) { 3316c896fe29Sbellard if (ts->reg != reg) { 33173b6dac34SRichard Henderson tcg_out_mov(s, ts->type, ts->reg, reg); 3318c896fe29Sbellard } 3319c896fe29Sbellard } else { 3320639368ddSAurelien Jarno if (ts->val_type == TEMP_VAL_REG) { 3321f8b2f202SRichard Henderson s->reg_to_temp[ts->reg] = NULL; 3322639368ddSAurelien Jarno } 
3323c896fe29Sbellard ts->val_type = TEMP_VAL_REG; 3324c896fe29Sbellard ts->reg = reg; 3325c896fe29Sbellard ts->mem_coherent = 0; 3326f8b2f202SRichard Henderson s->reg_to_temp[reg] = ts; 3327ec7a869dSAurelien Jarno if (NEED_SYNC_ARG(i)) { 332859d7c14eSRichard Henderson temp_sync(s, ts, allocated_regs, IS_DEAD_ARG(i)); 332959d7c14eSRichard Henderson } else if (IS_DEAD_ARG(i)) { 3330f8bf00f1SRichard Henderson temp_dead(s, ts); 3331c896fe29Sbellard } 3332c896fe29Sbellard } 33338c11ad25SAurelien Jarno } 3334c896fe29Sbellard } 3335c896fe29Sbellard 3336c896fe29Sbellard #ifdef CONFIG_PROFILER 3337c896fe29Sbellard 3338c3fac113SEmilio G. Cota /* avoid copy/paste errors */ 3339c3fac113SEmilio G. Cota #define PROF_ADD(to, from, field) \ 3340c3fac113SEmilio G. Cota do { \ 3341c3fac113SEmilio G. Cota (to)->field += atomic_read(&((from)->field)); \ 3342c3fac113SEmilio G. Cota } while (0) 3343c896fe29Sbellard 3344c3fac113SEmilio G. Cota #define PROF_MAX(to, from, field) \ 3345c3fac113SEmilio G. Cota do { \ 3346c3fac113SEmilio G. Cota typeof((from)->field) val__ = atomic_read(&((from)->field)); \ 3347c3fac113SEmilio G. Cota if (val__ > (to)->field) { \ 3348c3fac113SEmilio G. Cota (to)->field = val__; \ 3349c3fac113SEmilio G. Cota } \ 3350c3fac113SEmilio G. Cota } while (0) 3351c3fac113SEmilio G. Cota 3352c3fac113SEmilio G. Cota /* Pass in a zero'ed @prof */ 3353c3fac113SEmilio G. Cota static inline 3354c3fac113SEmilio G. Cota void tcg_profile_snapshot(TCGProfile *prof, bool counters, bool table) 3355c896fe29Sbellard { 33563468b59eSEmilio G. Cota unsigned int n_ctxs = atomic_read(&n_tcg_ctxs); 3357c3fac113SEmilio G. Cota unsigned int i; 3358c3fac113SEmilio G. Cota 33593468b59eSEmilio G. Cota for (i = 0; i < n_ctxs; i++) { 33603468b59eSEmilio G. Cota TCGContext *s = atomic_read(&tcg_ctxs[i]); 33613468b59eSEmilio G. Cota const TCGProfile *orig = &s->prof; 3362c3fac113SEmilio G. Cota 3363c3fac113SEmilio G. Cota if (counters) { 3364c3fac113SEmilio G. 
Cota PROF_ADD(prof, orig, tb_count1); 3365c3fac113SEmilio G. Cota PROF_ADD(prof, orig, tb_count); 3366c3fac113SEmilio G. Cota PROF_ADD(prof, orig, op_count); 3367c3fac113SEmilio G. Cota PROF_MAX(prof, orig, op_count_max); 3368c3fac113SEmilio G. Cota PROF_ADD(prof, orig, temp_count); 3369c3fac113SEmilio G. Cota PROF_MAX(prof, orig, temp_count_max); 3370c3fac113SEmilio G. Cota PROF_ADD(prof, orig, del_op_count); 3371c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_in_len); 3372c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_out_len); 3373c3fac113SEmilio G. Cota PROF_ADD(prof, orig, search_out_len); 3374c3fac113SEmilio G. Cota PROF_ADD(prof, orig, interm_time); 3375c3fac113SEmilio G. Cota PROF_ADD(prof, orig, code_time); 3376c3fac113SEmilio G. Cota PROF_ADD(prof, orig, la_time); 3377c3fac113SEmilio G. Cota PROF_ADD(prof, orig, opt_time); 3378c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_count); 3379c3fac113SEmilio G. Cota PROF_ADD(prof, orig, restore_time); 3380c3fac113SEmilio G. Cota } 3381c3fac113SEmilio G. Cota if (table) { 3382c896fe29Sbellard int i; 3383d70724ceSzhanghailiang 338415fc7daaSRichard Henderson for (i = 0; i < NB_OPS; i++) { 3385c3fac113SEmilio G. Cota PROF_ADD(prof, orig, table_op_count[i]); 3386c3fac113SEmilio G. Cota } 3387c3fac113SEmilio G. Cota } 3388c3fac113SEmilio G. Cota } 3389c3fac113SEmilio G. Cota } 3390c3fac113SEmilio G. Cota 3391c3fac113SEmilio G. Cota #undef PROF_ADD 3392c3fac113SEmilio G. Cota #undef PROF_MAX 3393c3fac113SEmilio G. Cota 3394c3fac113SEmilio G. Cota static void tcg_profile_snapshot_counters(TCGProfile *prof) 3395c3fac113SEmilio G. Cota { 3396c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, true, false); 3397c3fac113SEmilio G. Cota } 3398c3fac113SEmilio G. Cota 3399c3fac113SEmilio G. Cota static void tcg_profile_snapshot_table(TCGProfile *prof) 3400c3fac113SEmilio G. Cota { 3401c3fac113SEmilio G. Cota tcg_profile_snapshot(prof, false, true); 3402c3fac113SEmilio G. Cota } 3403c3fac113SEmilio G. 
Cota 3404c3fac113SEmilio G. Cota void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3405c3fac113SEmilio G. Cota { 3406c3fac113SEmilio G. Cota TCGProfile prof = {}; 3407c3fac113SEmilio G. Cota int i; 3408c3fac113SEmilio G. Cota 3409c3fac113SEmilio G. Cota tcg_profile_snapshot_table(&prof); 3410c3fac113SEmilio G. Cota for (i = 0; i < NB_OPS; i++) { 3411246ae24dSMax Filippov cpu_fprintf(f, "%s %" PRId64 "\n", tcg_op_defs[i].name, 3412c3fac113SEmilio G. Cota prof.table_op_count[i]); 3413c896fe29Sbellard } 3414c896fe29Sbellard } 3415246ae24dSMax Filippov #else 3416246ae24dSMax Filippov void tcg_dump_op_count(FILE *f, fprintf_function cpu_fprintf) 3417246ae24dSMax Filippov { 3418246ae24dSMax Filippov cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3419246ae24dSMax Filippov } 3420c896fe29Sbellard #endif 3421c896fe29Sbellard 3422c896fe29Sbellard 34235bd2ec3dSAlex Bennée int tcg_gen_code(TCGContext *s, TranslationBlock *tb) 3424c896fe29Sbellard { 3425c3fac113SEmilio G. Cota #ifdef CONFIG_PROFILER 3426c3fac113SEmilio G. Cota TCGProfile *prof = &s->prof; 3427c3fac113SEmilio G. Cota #endif 342815fa08f8SRichard Henderson int i, num_insns; 342915fa08f8SRichard Henderson TCGOp *op; 3430c896fe29Sbellard 343104fe6400SRichard Henderson #ifdef CONFIG_PROFILER 343204fe6400SRichard Henderson { 3433*c1f543b7SEmilio G. Cota int n = 0; 343404fe6400SRichard Henderson 343515fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 343615fa08f8SRichard Henderson n++; 343715fa08f8SRichard Henderson } 3438c3fac113SEmilio G. Cota atomic_set(&prof->op_count, prof->op_count + n); 3439c3fac113SEmilio G. Cota if (n > prof->op_count_max) { 3440c3fac113SEmilio G. Cota atomic_set(&prof->op_count_max, n); 344104fe6400SRichard Henderson } 344204fe6400SRichard Henderson 344304fe6400SRichard Henderson n = s->nb_temps; 3444c3fac113SEmilio G. Cota atomic_set(&prof->temp_count, prof->temp_count + n); 3445c3fac113SEmilio G. Cota if (n > prof->temp_count_max) { 3446c3fac113SEmilio G. 
Cota atomic_set(&prof->temp_count_max, n); 344704fe6400SRichard Henderson } 344804fe6400SRichard Henderson } 344904fe6400SRichard Henderson #endif 345004fe6400SRichard Henderson 3451c896fe29Sbellard #ifdef DEBUG_DISAS 3452d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP) 3453d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 34541ee73216SRichard Henderson qemu_log_lock(); 345593fcfe39Saliguori qemu_log("OP:\n"); 3456eeacee4dSBlue Swirl tcg_dump_ops(s); 345793fcfe39Saliguori qemu_log("\n"); 34581ee73216SRichard Henderson qemu_log_unlock(); 3459c896fe29Sbellard } 3460c896fe29Sbellard #endif 3461c896fe29Sbellard 3462c5cc28ffSAurelien Jarno #ifdef CONFIG_PROFILER 3463c3fac113SEmilio G. Cota atomic_set(&prof->opt_time, prof->opt_time - profile_getclock()); 3464c5cc28ffSAurelien Jarno #endif 3465c5cc28ffSAurelien Jarno 34668f2e8c07SKirill Batuzov #ifdef USE_TCG_OPTIMIZATIONS 3467c45cb8bbSRichard Henderson tcg_optimize(s); 34688f2e8c07SKirill Batuzov #endif 34698f2e8c07SKirill Batuzov 3470a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3471c3fac113SEmilio G. Cota atomic_set(&prof->opt_time, prof->opt_time + profile_getclock()); 3472c3fac113SEmilio G. 
Cota atomic_set(&prof->la_time, prof->la_time - profile_getclock()); 3473a23a9ec6Sbellard #endif 3474c5cc28ffSAurelien Jarno 3475b83eabeaSRichard Henderson liveness_pass_1(s); 34765a18407fSRichard Henderson 34775a18407fSRichard Henderson if (s->nb_indirects > 0) { 34785a18407fSRichard Henderson #ifdef DEBUG_DISAS 34795a18407fSRichard Henderson if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_IND) 34805a18407fSRichard Henderson && qemu_log_in_addr_range(tb->pc))) { 34811ee73216SRichard Henderson qemu_log_lock(); 34825a18407fSRichard Henderson qemu_log("OP before indirect lowering:\n"); 34835a18407fSRichard Henderson tcg_dump_ops(s); 34845a18407fSRichard Henderson qemu_log("\n"); 34851ee73216SRichard Henderson qemu_log_unlock(); 34865a18407fSRichard Henderson } 34875a18407fSRichard Henderson #endif 34885a18407fSRichard Henderson /* Replace indirect temps with direct temps. */ 3489b83eabeaSRichard Henderson if (liveness_pass_2(s)) { 34905a18407fSRichard Henderson /* If changes were made, re-run liveness. */ 3491b83eabeaSRichard Henderson liveness_pass_1(s); 34925a18407fSRichard Henderson } 34935a18407fSRichard Henderson } 3494c5cc28ffSAurelien Jarno 3495a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3496c3fac113SEmilio G. Cota atomic_set(&prof->la_time, prof->la_time + profile_getclock()); 3497a23a9ec6Sbellard #endif 3498c896fe29Sbellard 3499c896fe29Sbellard #ifdef DEBUG_DISAS 3500d977e1c2SAlex Bennée if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP_OPT) 3501d977e1c2SAlex Bennée && qemu_log_in_addr_range(tb->pc))) { 35021ee73216SRichard Henderson qemu_log_lock(); 3503c5cc28ffSAurelien Jarno qemu_log("OP after optimization and liveness analysis:\n"); 3504eeacee4dSBlue Swirl tcg_dump_ops(s); 350593fcfe39Saliguori qemu_log("\n"); 35061ee73216SRichard Henderson qemu_log_unlock(); 3507c896fe29Sbellard } 3508c896fe29Sbellard #endif 3509c896fe29Sbellard 3510c896fe29Sbellard tcg_reg_alloc_start(s); 3511c896fe29Sbellard 3512e7e168f4SEmilio G. 
Cota s->code_buf = tb->tc.ptr; 3513e7e168f4SEmilio G. Cota s->code_ptr = tb->tc.ptr; 3514c896fe29Sbellard 3515659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 35166001f772SLaurent Vivier QSIMPLEQ_INIT(&s->ldst_labels); 3517659ef5cbSRichard Henderson #endif 351857a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 351957a26946SRichard Henderson s->pool_labels = NULL; 352057a26946SRichard Henderson #endif 35219ecefc84SRichard Henderson 3522fca8a500SRichard Henderson num_insns = -1; 352315fa08f8SRichard Henderson QTAILQ_FOREACH(op, &s->ops, link) { 3524c45cb8bbSRichard Henderson TCGOpcode opc = op->opc; 3525b3db8758Sblueswir1 3526c896fe29Sbellard #ifdef CONFIG_PROFILER 3527c3fac113SEmilio G. Cota atomic_set(&prof->table_op_count[opc], prof->table_op_count[opc] + 1); 3528c896fe29Sbellard #endif 3529c45cb8bbSRichard Henderson 3530c896fe29Sbellard switch (opc) { 3531c896fe29Sbellard case INDEX_op_mov_i32: 3532c896fe29Sbellard case INDEX_op_mov_i64: 3533d2fd745fSRichard Henderson case INDEX_op_mov_vec: 3534dd186292SRichard Henderson tcg_reg_alloc_mov(s, op); 3535c896fe29Sbellard break; 3536e8996ee0Sbellard case INDEX_op_movi_i32: 3537e8996ee0Sbellard case INDEX_op_movi_i64: 3538d2fd745fSRichard Henderson case INDEX_op_dupi_vec: 3539dd186292SRichard Henderson tcg_reg_alloc_movi(s, op); 3540e8996ee0Sbellard break; 3541765b842aSRichard Henderson case INDEX_op_insn_start: 3542fca8a500SRichard Henderson if (num_insns >= 0) { 35439f754620SRichard Henderson size_t off = tcg_current_code_size(s); 35449f754620SRichard Henderson s->gen_insn_end_off[num_insns] = off; 35459f754620SRichard Henderson /* Assert that we do not overflow our stored offset. 
*/ 35469f754620SRichard Henderson assert(s->gen_insn_end_off[num_insns] == off); 3547fca8a500SRichard Henderson } 3548fca8a500SRichard Henderson num_insns++; 3549bad729e2SRichard Henderson for (i = 0; i < TARGET_INSN_START_WORDS; ++i) { 3550bad729e2SRichard Henderson target_ulong a; 3551bad729e2SRichard Henderson #if TARGET_LONG_BITS > TCG_TARGET_REG_BITS 3552efee3746SRichard Henderson a = deposit64(op->args[i * 2], 32, 32, op->args[i * 2 + 1]); 3553bad729e2SRichard Henderson #else 3554efee3746SRichard Henderson a = op->args[i]; 3555bad729e2SRichard Henderson #endif 3556fca8a500SRichard Henderson s->gen_insn_data[num_insns][i] = a; 3557bad729e2SRichard Henderson } 3558c896fe29Sbellard break; 35595ff9d6a4Sbellard case INDEX_op_discard: 356043439139SRichard Henderson temp_dead(s, arg_temp(op->args[0])); 35615ff9d6a4Sbellard break; 3562c896fe29Sbellard case INDEX_op_set_label: 3563e8996ee0Sbellard tcg_reg_alloc_bb_end(s, s->reserved_regs); 3564efee3746SRichard Henderson tcg_out_label(s, arg_label(op->args[0]), s->code_ptr); 3565c896fe29Sbellard break; 3566c896fe29Sbellard case INDEX_op_call: 3567dd186292SRichard Henderson tcg_reg_alloc_call(s, op); 3568c45cb8bbSRichard Henderson break; 3569c896fe29Sbellard default: 357025c4d9ccSRichard Henderson /* Sanity check that we've not introduced any unhandled opcodes. */ 3571be0f34b5SRichard Henderson tcg_debug_assert(tcg_op_supported(opc)); 3572c896fe29Sbellard /* Note: in order to speed up the code, it would be much 3573c896fe29Sbellard faster to have specialized register allocator functions for 3574c896fe29Sbellard some common argument patterns */ 3575dd186292SRichard Henderson tcg_reg_alloc_op(s, op); 3576c896fe29Sbellard break; 3577c896fe29Sbellard } 35788d8fdbaeSAurelien Jarno #ifdef CONFIG_DEBUG_TCG 3579c896fe29Sbellard check_regs(s); 3580c896fe29Sbellard #endif 3581b125f9dcSRichard Henderson /* Test for (pending) buffer overflow. 
The assumption is that any 3582b125f9dcSRichard Henderson one operation beginning below the high water mark cannot overrun 3583b125f9dcSRichard Henderson the buffer completely. Thus we can test for overflow after 3584b125f9dcSRichard Henderson generating code without having to check during generation. */ 3585644da9b3SJohn Clarke if (unlikely((void *)s->code_ptr > s->code_gen_highwater)) { 3586b125f9dcSRichard Henderson return -1; 3587b125f9dcSRichard Henderson } 3588c896fe29Sbellard } 3589fca8a500SRichard Henderson tcg_debug_assert(num_insns >= 0); 3590fca8a500SRichard Henderson s->gen_insn_end_off[num_insns] = tcg_current_code_size(s); 3591c45cb8bbSRichard Henderson 3592b76f0d8cSYeongkyoon Lee /* Generate TB finalization at the end of block */ 3593659ef5cbSRichard Henderson #ifdef TCG_TARGET_NEED_LDST_LABELS 3594659ef5cbSRichard Henderson if (!tcg_out_ldst_finalize(s)) { 359523dceda6SRichard Henderson return -1; 359623dceda6SRichard Henderson } 3597659ef5cbSRichard Henderson #endif 359857a26946SRichard Henderson #ifdef TCG_TARGET_NEED_POOL_LABELS 359957a26946SRichard Henderson if (!tcg_out_pool_finalize(s)) { 360057a26946SRichard Henderson return -1; 360157a26946SRichard Henderson } 360257a26946SRichard Henderson #endif 3603c896fe29Sbellard 3604c896fe29Sbellard /* flush instruction cache */ 36051813e175SRichard Henderson flush_icache_range((uintptr_t)s->code_buf, (uintptr_t)s->code_ptr); 36062aeabc08SStefan Weil 36071813e175SRichard Henderson return tcg_current_code_size(s); 3608c896fe29Sbellard } 3609c896fe29Sbellard 3610a23a9ec6Sbellard #ifdef CONFIG_PROFILER 3611405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3612a23a9ec6Sbellard { 3613c3fac113SEmilio G. Cota TCGProfile prof = {}; 3614c3fac113SEmilio G. Cota const TCGProfile *s; 3615c3fac113SEmilio G. Cota int64_t tb_count; 3616c3fac113SEmilio G. Cota int64_t tb_div_count; 3617c3fac113SEmilio G. Cota int64_t tot; 3618c3fac113SEmilio G. Cota 3619c3fac113SEmilio G. 
Cota tcg_profile_snapshot_counters(&prof); 3620c3fac113SEmilio G. Cota s = &prof; 3621c3fac113SEmilio G. Cota tb_count = s->tb_count; 3622c3fac113SEmilio G. Cota tb_div_count = tb_count ? tb_count : 1; 3623c3fac113SEmilio G. Cota tot = s->interm_time + s->code_time; 3624a23a9ec6Sbellard 3625a23a9ec6Sbellard cpu_fprintf(f, "JIT cycles %" PRId64 " (%0.3f s at 2.4 GHz)\n", 3626a23a9ec6Sbellard tot, tot / 2.4e9); 3627a23a9ec6Sbellard cpu_fprintf(f, "translated TBs %" PRId64 " (aborted=%" PRId64 " %0.1f%%)\n", 3628fca8a500SRichard Henderson tb_count, s->tb_count1 - tb_count, 3629fca8a500SRichard Henderson (double)(s->tb_count1 - s->tb_count) 3630fca8a500SRichard Henderson / (s->tb_count1 ? s->tb_count1 : 1) * 100.0); 3631a23a9ec6Sbellard cpu_fprintf(f, "avg ops/TB %0.1f max=%d\n", 3632fca8a500SRichard Henderson (double)s->op_count / tb_div_count, s->op_count_max); 3633a23a9ec6Sbellard cpu_fprintf(f, "deleted ops/TB %0.2f\n", 3634fca8a500SRichard Henderson (double)s->del_op_count / tb_div_count); 3635a23a9ec6Sbellard cpu_fprintf(f, "avg temps/TB %0.2f max=%d\n", 3636fca8a500SRichard Henderson (double)s->temp_count / tb_div_count, s->temp_count_max); 3637fca8a500SRichard Henderson cpu_fprintf(f, "avg host code/TB %0.1f\n", 3638fca8a500SRichard Henderson (double)s->code_out_len / tb_div_count); 3639fca8a500SRichard Henderson cpu_fprintf(f, "avg search data/TB %0.1f\n", 3640fca8a500SRichard Henderson (double)s->search_out_len / tb_div_count); 3641a23a9ec6Sbellard 3642a23a9ec6Sbellard cpu_fprintf(f, "cycles/op %0.1f\n", 3643a23a9ec6Sbellard s->op_count ? (double)tot / s->op_count : 0); 3644a23a9ec6Sbellard cpu_fprintf(f, "cycles/in byte %0.1f\n", 3645a23a9ec6Sbellard s->code_in_len ? (double)tot / s->code_in_len : 0); 3646a23a9ec6Sbellard cpu_fprintf(f, "cycles/out byte %0.1f\n", 3647a23a9ec6Sbellard s->code_out_len ? 
(double)tot / s->code_out_len : 0); 3648fca8a500SRichard Henderson cpu_fprintf(f, "cycles/search byte %0.1f\n", 3649fca8a500SRichard Henderson s->search_out_len ? (double)tot / s->search_out_len : 0); 3650fca8a500SRichard Henderson if (tot == 0) { 3651a23a9ec6Sbellard tot = 1; 3652fca8a500SRichard Henderson } 3653a23a9ec6Sbellard cpu_fprintf(f, " gen_interm time %0.1f%%\n", 3654a23a9ec6Sbellard (double)s->interm_time / tot * 100.0); 3655a23a9ec6Sbellard cpu_fprintf(f, " gen_code time %0.1f%%\n", 3656a23a9ec6Sbellard (double)s->code_time / tot * 100.0); 3657c5cc28ffSAurelien Jarno cpu_fprintf(f, "optim./code time %0.1f%%\n", 3658c5cc28ffSAurelien Jarno (double)s->opt_time / (s->code_time ? s->code_time : 1) 3659c5cc28ffSAurelien Jarno * 100.0); 3660a23a9ec6Sbellard cpu_fprintf(f, "liveness/code time %0.1f%%\n", 3661a23a9ec6Sbellard (double)s->la_time / (s->code_time ? s->code_time : 1) * 100.0); 3662a23a9ec6Sbellard cpu_fprintf(f, "cpu_restore count %" PRId64 "\n", 3663a23a9ec6Sbellard s->restore_count); 3664a23a9ec6Sbellard cpu_fprintf(f, " avg cycles %0.1f\n", 3665a23a9ec6Sbellard s->restore_count ? (double)s->restore_time / s->restore_count : 0); 3666a23a9ec6Sbellard } 3667a23a9ec6Sbellard #else 3668405cf9ffSStefan Weil void tcg_dump_info(FILE *f, fprintf_function cpu_fprintf) 3669a23a9ec6Sbellard { 367024bf7b3aSbellard cpu_fprintf(f, "[TCG profiler not compiled]\n"); 3671a23a9ec6Sbellard } 3672a23a9ec6Sbellard #endif 3673813da627SRichard Henderson 3674813da627SRichard Henderson #ifdef ELF_HOST_MACHINE 36755872bbf2SRichard Henderson /* In order to use this feature, the backend needs to do three things: 36765872bbf2SRichard Henderson 36775872bbf2SRichard Henderson (1) Define ELF_HOST_MACHINE to indicate both what value to 36785872bbf2SRichard Henderson put into the ELF image and to indicate support for the feature. 36795872bbf2SRichard Henderson 36805872bbf2SRichard Henderson (2) Define tcg_register_jit. 
This should create a buffer containing 36815872bbf2SRichard Henderson the contents of a .debug_frame section that describes the post- 36825872bbf2SRichard Henderson prologue unwind info for the tcg machine. 36835872bbf2SRichard Henderson 36845872bbf2SRichard Henderson (3) Call tcg_register_jit_int, with the constructed .debug_frame. 36855872bbf2SRichard Henderson */ 3686813da627SRichard Henderson 3687813da627SRichard Henderson /* Begin GDB interface. THE FOLLOWING MUST MATCH GDB DOCS. */ 3688813da627SRichard Henderson typedef enum { 3689813da627SRichard Henderson JIT_NOACTION = 0, 3690813da627SRichard Henderson JIT_REGISTER_FN, 3691813da627SRichard Henderson JIT_UNREGISTER_FN 3692813da627SRichard Henderson } jit_actions_t; 3693813da627SRichard Henderson 3694813da627SRichard Henderson struct jit_code_entry { 3695813da627SRichard Henderson struct jit_code_entry *next_entry; 3696813da627SRichard Henderson struct jit_code_entry *prev_entry; 3697813da627SRichard Henderson const void *symfile_addr; 3698813da627SRichard Henderson uint64_t symfile_size; 3699813da627SRichard Henderson }; 3700813da627SRichard Henderson 3701813da627SRichard Henderson struct jit_descriptor { 3702813da627SRichard Henderson uint32_t version; 3703813da627SRichard Henderson uint32_t action_flag; 3704813da627SRichard Henderson struct jit_code_entry *relevant_entry; 3705813da627SRichard Henderson struct jit_code_entry *first_entry; 3706813da627SRichard Henderson }; 3707813da627SRichard Henderson 3708813da627SRichard Henderson void __jit_debug_register_code(void) __attribute__((noinline)); 3709813da627SRichard Henderson void __jit_debug_register_code(void) 3710813da627SRichard Henderson { 3711813da627SRichard Henderson asm(""); 3712813da627SRichard Henderson } 3713813da627SRichard Henderson 3714813da627SRichard Henderson /* Must statically initialize the version, because GDB may check 3715813da627SRichard Henderson the version before we can set it. 
*/ 3716813da627SRichard Henderson struct jit_descriptor __jit_debug_descriptor = { 1, 0, 0, 0 }; 3717813da627SRichard Henderson 3718813da627SRichard Henderson /* End GDB interface. */ 3719813da627SRichard Henderson 3720813da627SRichard Henderson static int find_string(const char *strtab, const char *str) 3721813da627SRichard Henderson { 3722813da627SRichard Henderson const char *p = strtab + 1; 3723813da627SRichard Henderson 3724813da627SRichard Henderson while (1) { 3725813da627SRichard Henderson if (strcmp(p, str) == 0) { 3726813da627SRichard Henderson return p - strtab; 3727813da627SRichard Henderson } 3728813da627SRichard Henderson p += strlen(p) + 1; 3729813da627SRichard Henderson } 3730813da627SRichard Henderson } 3731813da627SRichard Henderson 37325872bbf2SRichard Henderson static void tcg_register_jit_int(void *buf_ptr, size_t buf_size, 37332c90784aSRichard Henderson const void *debug_frame, 37342c90784aSRichard Henderson size_t debug_frame_size) 3735813da627SRichard Henderson { 37365872bbf2SRichard Henderson struct __attribute__((packed)) DebugInfo { 37375872bbf2SRichard Henderson uint32_t len; 37385872bbf2SRichard Henderson uint16_t version; 37395872bbf2SRichard Henderson uint32_t abbrev; 37405872bbf2SRichard Henderson uint8_t ptr_size; 37415872bbf2SRichard Henderson uint8_t cu_die; 37425872bbf2SRichard Henderson uint16_t cu_lang; 37435872bbf2SRichard Henderson uintptr_t cu_low_pc; 37445872bbf2SRichard Henderson uintptr_t cu_high_pc; 37455872bbf2SRichard Henderson uint8_t fn_die; 37465872bbf2SRichard Henderson char fn_name[16]; 37475872bbf2SRichard Henderson uintptr_t fn_low_pc; 37485872bbf2SRichard Henderson uintptr_t fn_high_pc; 37495872bbf2SRichard Henderson uint8_t cu_eoc; 37505872bbf2SRichard Henderson }; 3751813da627SRichard Henderson 3752813da627SRichard Henderson struct ElfImage { 3753813da627SRichard Henderson ElfW(Ehdr) ehdr; 3754813da627SRichard Henderson ElfW(Phdr) phdr; 37555872bbf2SRichard Henderson ElfW(Shdr) shdr[7]; 37565872bbf2SRichard 
Henderson ElfW(Sym) sym[2]; 37575872bbf2SRichard Henderson struct DebugInfo di; 37585872bbf2SRichard Henderson uint8_t da[24]; 37595872bbf2SRichard Henderson char str[80]; 37605872bbf2SRichard Henderson }; 37615872bbf2SRichard Henderson 37625872bbf2SRichard Henderson struct ElfImage *img; 37635872bbf2SRichard Henderson 37645872bbf2SRichard Henderson static const struct ElfImage img_template = { 37655872bbf2SRichard Henderson .ehdr = { 37665872bbf2SRichard Henderson .e_ident[EI_MAG0] = ELFMAG0, 37675872bbf2SRichard Henderson .e_ident[EI_MAG1] = ELFMAG1, 37685872bbf2SRichard Henderson .e_ident[EI_MAG2] = ELFMAG2, 37695872bbf2SRichard Henderson .e_ident[EI_MAG3] = ELFMAG3, 37705872bbf2SRichard Henderson .e_ident[EI_CLASS] = ELF_CLASS, 37715872bbf2SRichard Henderson .e_ident[EI_DATA] = ELF_DATA, 37725872bbf2SRichard Henderson .e_ident[EI_VERSION] = EV_CURRENT, 37735872bbf2SRichard Henderson .e_type = ET_EXEC, 37745872bbf2SRichard Henderson .e_machine = ELF_HOST_MACHINE, 37755872bbf2SRichard Henderson .e_version = EV_CURRENT, 37765872bbf2SRichard Henderson .e_phoff = offsetof(struct ElfImage, phdr), 37775872bbf2SRichard Henderson .e_shoff = offsetof(struct ElfImage, shdr), 37785872bbf2SRichard Henderson .e_ehsize = sizeof(ElfW(Shdr)), 37795872bbf2SRichard Henderson .e_phentsize = sizeof(ElfW(Phdr)), 37805872bbf2SRichard Henderson .e_phnum = 1, 37815872bbf2SRichard Henderson .e_shentsize = sizeof(ElfW(Shdr)), 37825872bbf2SRichard Henderson .e_shnum = ARRAY_SIZE(img->shdr), 37835872bbf2SRichard Henderson .e_shstrndx = ARRAY_SIZE(img->shdr) - 1, 3784abbb3eaeSRichard Henderson #ifdef ELF_HOST_FLAGS 3785abbb3eaeSRichard Henderson .e_flags = ELF_HOST_FLAGS, 3786abbb3eaeSRichard Henderson #endif 3787abbb3eaeSRichard Henderson #ifdef ELF_OSABI 3788abbb3eaeSRichard Henderson .e_ident[EI_OSABI] = ELF_OSABI, 3789abbb3eaeSRichard Henderson #endif 37905872bbf2SRichard Henderson }, 37915872bbf2SRichard Henderson .phdr = { 37925872bbf2SRichard Henderson .p_type = PT_LOAD, 
37935872bbf2SRichard Henderson .p_flags = PF_X, 37945872bbf2SRichard Henderson }, 37955872bbf2SRichard Henderson .shdr = { 37965872bbf2SRichard Henderson [0] = { .sh_type = SHT_NULL }, 37975872bbf2SRichard Henderson /* Trick: The contents of code_gen_buffer are not present in 37985872bbf2SRichard Henderson this fake ELF file; that got allocated elsewhere. Therefore 37995872bbf2SRichard Henderson we mark .text as SHT_NOBITS (similar to .bss) so that readers 38005872bbf2SRichard Henderson will not look for contents. We can record any address. */ 38015872bbf2SRichard Henderson [1] = { /* .text */ 38025872bbf2SRichard Henderson .sh_type = SHT_NOBITS, 38035872bbf2SRichard Henderson .sh_flags = SHF_EXECINSTR | SHF_ALLOC, 38045872bbf2SRichard Henderson }, 38055872bbf2SRichard Henderson [2] = { /* .debug_info */ 38065872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 38075872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, di), 38085872bbf2SRichard Henderson .sh_size = sizeof(struct DebugInfo), 38095872bbf2SRichard Henderson }, 38105872bbf2SRichard Henderson [3] = { /* .debug_abbrev */ 38115872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 38125872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, da), 38135872bbf2SRichard Henderson .sh_size = sizeof(img->da), 38145872bbf2SRichard Henderson }, 38155872bbf2SRichard Henderson [4] = { /* .debug_frame */ 38165872bbf2SRichard Henderson .sh_type = SHT_PROGBITS, 38175872bbf2SRichard Henderson .sh_offset = sizeof(struct ElfImage), 38185872bbf2SRichard Henderson }, 38195872bbf2SRichard Henderson [5] = { /* .symtab */ 38205872bbf2SRichard Henderson .sh_type = SHT_SYMTAB, 38215872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, sym), 38225872bbf2SRichard Henderson .sh_size = sizeof(img->sym), 38235872bbf2SRichard Henderson .sh_info = 1, 38245872bbf2SRichard Henderson .sh_link = ARRAY_SIZE(img->shdr) - 1, 38255872bbf2SRichard Henderson .sh_entsize = sizeof(ElfW(Sym)), 38265872bbf2SRichard 
Henderson }, 38275872bbf2SRichard Henderson [6] = { /* .strtab */ 38285872bbf2SRichard Henderson .sh_type = SHT_STRTAB, 38295872bbf2SRichard Henderson .sh_offset = offsetof(struct ElfImage, str), 38305872bbf2SRichard Henderson .sh_size = sizeof(img->str), 38315872bbf2SRichard Henderson } 38325872bbf2SRichard Henderson }, 38335872bbf2SRichard Henderson .sym = { 38345872bbf2SRichard Henderson [1] = { /* code_gen_buffer */ 38355872bbf2SRichard Henderson .st_info = ELF_ST_INFO(STB_GLOBAL, STT_FUNC), 38365872bbf2SRichard Henderson .st_shndx = 1, 38375872bbf2SRichard Henderson } 38385872bbf2SRichard Henderson }, 38395872bbf2SRichard Henderson .di = { 38405872bbf2SRichard Henderson .len = sizeof(struct DebugInfo) - 4, 38415872bbf2SRichard Henderson .version = 2, 38425872bbf2SRichard Henderson .ptr_size = sizeof(void *), 38435872bbf2SRichard Henderson .cu_die = 1, 38445872bbf2SRichard Henderson .cu_lang = 0x8001, /* DW_LANG_Mips_Assembler */ 38455872bbf2SRichard Henderson .fn_die = 2, 38465872bbf2SRichard Henderson .fn_name = "code_gen_buffer" 38475872bbf2SRichard Henderson }, 38485872bbf2SRichard Henderson .da = { 38495872bbf2SRichard Henderson 1, /* abbrev number (the cu) */ 38505872bbf2SRichard Henderson 0x11, 1, /* DW_TAG_compile_unit, has children */ 38515872bbf2SRichard Henderson 0x13, 0x5, /* DW_AT_language, DW_FORM_data2 */ 38525872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 38535872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 38545872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 38555872bbf2SRichard Henderson 2, /* abbrev number (the fn) */ 38565872bbf2SRichard Henderson 0x2e, 0, /* DW_TAG_subprogram, no children */ 38575872bbf2SRichard Henderson 0x3, 0x8, /* DW_AT_name, DW_FORM_string */ 38585872bbf2SRichard Henderson 0x11, 0x1, /* DW_AT_low_pc, DW_FORM_addr */ 38595872bbf2SRichard Henderson 0x12, 0x1, /* DW_AT_high_pc, DW_FORM_addr */ 38605872bbf2SRichard Henderson 0, 0, /* end of abbrev */ 38615872bbf2SRichard 
Henderson 0 /* no more abbrev */ 38625872bbf2SRichard Henderson }, 38635872bbf2SRichard Henderson .str = "\0" ".text\0" ".debug_info\0" ".debug_abbrev\0" 38645872bbf2SRichard Henderson ".debug_frame\0" ".symtab\0" ".strtab\0" "code_gen_buffer", 3865813da627SRichard Henderson }; 3866813da627SRichard Henderson 3867813da627SRichard Henderson /* We only need a single jit entry; statically allocate it. */ 3868813da627SRichard Henderson static struct jit_code_entry one_entry; 3869813da627SRichard Henderson 38705872bbf2SRichard Henderson uintptr_t buf = (uintptr_t)buf_ptr; 3871813da627SRichard Henderson size_t img_size = sizeof(struct ElfImage) + debug_frame_size; 38722c90784aSRichard Henderson DebugFrameHeader *dfh; 3873813da627SRichard Henderson 38745872bbf2SRichard Henderson img = g_malloc(img_size); 38755872bbf2SRichard Henderson *img = img_template; 3876813da627SRichard Henderson 38775872bbf2SRichard Henderson img->phdr.p_vaddr = buf; 38785872bbf2SRichard Henderson img->phdr.p_paddr = buf; 38795872bbf2SRichard Henderson img->phdr.p_memsz = buf_size; 3880813da627SRichard Henderson 38815872bbf2SRichard Henderson img->shdr[1].sh_name = find_string(img->str, ".text"); 38825872bbf2SRichard Henderson img->shdr[1].sh_addr = buf; 38835872bbf2SRichard Henderson img->shdr[1].sh_size = buf_size; 3884813da627SRichard Henderson 38855872bbf2SRichard Henderson img->shdr[2].sh_name = find_string(img->str, ".debug_info"); 38865872bbf2SRichard Henderson img->shdr[3].sh_name = find_string(img->str, ".debug_abbrev"); 38875872bbf2SRichard Henderson 38885872bbf2SRichard Henderson img->shdr[4].sh_name = find_string(img->str, ".debug_frame"); 38895872bbf2SRichard Henderson img->shdr[4].sh_size = debug_frame_size; 38905872bbf2SRichard Henderson 38915872bbf2SRichard Henderson img->shdr[5].sh_name = find_string(img->str, ".symtab"); 38925872bbf2SRichard Henderson img->shdr[6].sh_name = find_string(img->str, ".strtab"); 38935872bbf2SRichard Henderson 38945872bbf2SRichard Henderson 
img->sym[1].st_name = find_string(img->str, "code_gen_buffer"); 38955872bbf2SRichard Henderson img->sym[1].st_value = buf; 38965872bbf2SRichard Henderson img->sym[1].st_size = buf_size; 38975872bbf2SRichard Henderson 38985872bbf2SRichard Henderson img->di.cu_low_pc = buf; 389945aba097SRichard Henderson img->di.cu_high_pc = buf + buf_size; 39005872bbf2SRichard Henderson img->di.fn_low_pc = buf; 390145aba097SRichard Henderson img->di.fn_high_pc = buf + buf_size; 3902813da627SRichard Henderson 39032c90784aSRichard Henderson dfh = (DebugFrameHeader *)(img + 1); 39042c90784aSRichard Henderson memcpy(dfh, debug_frame, debug_frame_size); 39052c90784aSRichard Henderson dfh->fde.func_start = buf; 39062c90784aSRichard Henderson dfh->fde.func_len = buf_size; 39072c90784aSRichard Henderson 3908813da627SRichard Henderson #ifdef DEBUG_JIT 3909813da627SRichard Henderson /* Enable this block to be able to debug the ELF image file creation. 3910813da627SRichard Henderson One can use readelf, objdump, or other inspection utilities. */ 3911813da627SRichard Henderson { 3912813da627SRichard Henderson FILE *f = fopen("/tmp/qemu.jit", "w+b"); 3913813da627SRichard Henderson if (f) { 39145872bbf2SRichard Henderson if (fwrite(img, img_size, 1, f) != img_size) { 3915813da627SRichard Henderson /* Avoid stupid unused return value warning for fwrite. 
*/ 3916813da627SRichard Henderson } 3917813da627SRichard Henderson fclose(f); 3918813da627SRichard Henderson } 3919813da627SRichard Henderson } 3920813da627SRichard Henderson #endif 3921813da627SRichard Henderson 3922813da627SRichard Henderson one_entry.symfile_addr = img; 3923813da627SRichard Henderson one_entry.symfile_size = img_size; 3924813da627SRichard Henderson 3925813da627SRichard Henderson __jit_debug_descriptor.action_flag = JIT_REGISTER_FN; 3926813da627SRichard Henderson __jit_debug_descriptor.relevant_entry = &one_entry; 3927813da627SRichard Henderson __jit_debug_descriptor.first_entry = &one_entry; 3928813da627SRichard Henderson __jit_debug_register_code(); 3929813da627SRichard Henderson } 3930813da627SRichard Henderson #else 39315872bbf2SRichard Henderson /* No support for the feature. Provide the entry point expected by exec.c, 39325872bbf2SRichard Henderson and implement the internal function we declared earlier. */ 3933813da627SRichard Henderson 3934813da627SRichard Henderson static void tcg_register_jit_int(void *buf, size_t size, 39352c90784aSRichard Henderson const void *debug_frame, 39362c90784aSRichard Henderson size_t debug_frame_size) 3937813da627SRichard Henderson { 3938813da627SRichard Henderson } 3939813da627SRichard Henderson 3940813da627SRichard Henderson void tcg_register_jit(void *buf, size_t buf_size) 3941813da627SRichard Henderson { 3942813da627SRichard Henderson } 3943813da627SRichard Henderson #endif /* ELF_HOST_MACHINE */ 3944db432672SRichard Henderson 3945db432672SRichard Henderson #if !TCG_TARGET_MAYBE_vec 3946db432672SRichard Henderson void tcg_expand_vec_op(TCGOpcode o, TCGType t, unsigned e, TCGArg a0, ...) 3947db432672SRichard Henderson { 3948db432672SRichard Henderson g_assert_not_reached(); 3949db432672SRichard Henderson } 3950db432672SRichard Henderson #endif 3951